Ref #51: added blas extensions simatcopy, dimatcopy, cimatcopy, zimatcopy
This commit is contained in:
		
							parent
							
								
									cee257f384
								
							
						
					
					
						commit
						faeab93df0
					
				| 
						 | 
					@ -769,6 +769,11 @@ void    BLASFUNC(domatcopy) (char *, char *, blasint *, blasint *, double  *, do
 | 
				
			||||||
void    BLASFUNC(comatcopy) (char *, char *, blasint *, blasint *, float  *, float  *, blasint *, float  *, blasint *);
 | 
					void    BLASFUNC(comatcopy) (char *, char *, blasint *, blasint *, float  *, float  *, blasint *, float  *, blasint *);
 | 
				
			||||||
void    BLASFUNC(zomatcopy) (char *, char *, blasint *, blasint *, double  *, double  *, blasint *, double  *, blasint *);
 | 
					void    BLASFUNC(zomatcopy) (char *, char *, blasint *, blasint *, double  *, double  *, blasint *, double  *, blasint *);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					void    BLASFUNC(simatcopy) (char *, char *, blasint *, blasint *, float  *, float  *, blasint *, blasint *);
 | 
				
			||||||
 | 
					void    BLASFUNC(dimatcopy) (char *, char *, blasint *, blasint *, double  *, double  *, blasint *, blasint *);
 | 
				
			||||||
 | 
					void    BLASFUNC(cimatcopy) (char *, char *, blasint *, blasint *, float  *, float  *, blasint *, blasint *);
 | 
				
			||||||
 | 
					void    BLASFUNC(zimatcopy) (char *, char *, blasint *, blasint *, double  *, double  *, blasint *, blasint *);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
#ifdef __cplusplus
 | 
					#ifdef __cplusplus
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
     
 | 
					     
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
| 
						 | 
					@ -41,7 +41,7 @@ SBLAS2OBJS    = \
 | 
				
			||||||
SBLAS3OBJS    = \
 | 
					SBLAS3OBJS    = \
 | 
				
			||||||
		sgemm.$(SUFFIX) ssymm.$(SUFFIX) strmm.$(SUFFIX) \
 | 
							sgemm.$(SUFFIX) ssymm.$(SUFFIX) strmm.$(SUFFIX) \
 | 
				
			||||||
		strsm.$(SUFFIX) ssyrk.$(SUFFIX) ssyr2k.$(SUFFIX) \
 | 
							strsm.$(SUFFIX) ssyrk.$(SUFFIX) ssyr2k.$(SUFFIX) \
 | 
				
			||||||
		somatcopy.$(SUFFIX)
 | 
							somatcopy.$(SUFFIX) simatcopy.$(SUFFIX)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
DBLAS1OBJS    = \
 | 
					DBLAS1OBJS    = \
 | 
				
			||||||
| 
						 | 
					@ -66,7 +66,7 @@ DBLAS2OBJS    = \
 | 
				
			||||||
DBLAS3OBJS    = \
 | 
					DBLAS3OBJS    = \
 | 
				
			||||||
		dgemm.$(SUFFIX) dsymm.$(SUFFIX) dtrmm.$(SUFFIX) \
 | 
							dgemm.$(SUFFIX) dsymm.$(SUFFIX) dtrmm.$(SUFFIX) \
 | 
				
			||||||
		dtrsm.$(SUFFIX) dsyrk.$(SUFFIX) dsyr2k.$(SUFFIX) \
 | 
							dtrsm.$(SUFFIX) dsyrk.$(SUFFIX) dsyr2k.$(SUFFIX) \
 | 
				
			||||||
		domatcopy.$(SUFFIX)
 | 
							domatcopy.$(SUFFIX) dimatcopy.$(SUFFIX)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
CBLAS1OBJS    = \
 | 
					CBLAS1OBJS    = \
 | 
				
			||||||
		caxpy.$(SUFFIX) caxpyc.$(SUFFIX) cswap.$(SUFFIX) \
 | 
							caxpy.$(SUFFIX) caxpyc.$(SUFFIX) cswap.$(SUFFIX) \
 | 
				
			||||||
| 
						 | 
					@ -94,7 +94,7 @@ CBLAS3OBJS    = \
 | 
				
			||||||
		cgemm.$(SUFFIX) csymm.$(SUFFIX) ctrmm.$(SUFFIX) \
 | 
							cgemm.$(SUFFIX) csymm.$(SUFFIX) ctrmm.$(SUFFIX) \
 | 
				
			||||||
		ctrsm.$(SUFFIX) csyrk.$(SUFFIX) csyr2k.$(SUFFIX) \
 | 
							ctrsm.$(SUFFIX) csyrk.$(SUFFIX) csyr2k.$(SUFFIX) \
 | 
				
			||||||
	       	chemm.$(SUFFIX) cherk.$(SUFFIX) cher2k.$(SUFFIX) \
 | 
						       	chemm.$(SUFFIX) cherk.$(SUFFIX) cher2k.$(SUFFIX) \
 | 
				
			||||||
		comatcopy.$(SUFFIX)
 | 
							comatcopy.$(SUFFIX) cimatcopy.$(SUFFIX)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
ZBLAS1OBJS    = \
 | 
					ZBLAS1OBJS    = \
 | 
				
			||||||
		zaxpy.$(SUFFIX) zaxpyc.$(SUFFIX) zswap.$(SUFFIX) \
 | 
							zaxpy.$(SUFFIX) zaxpyc.$(SUFFIX) zswap.$(SUFFIX) \
 | 
				
			||||||
| 
						 | 
					@ -122,7 +122,7 @@ ZBLAS3OBJS    = \
 | 
				
			||||||
		zgemm.$(SUFFIX) zsymm.$(SUFFIX) ztrmm.$(SUFFIX) \
 | 
							zgemm.$(SUFFIX) zsymm.$(SUFFIX) ztrmm.$(SUFFIX) \
 | 
				
			||||||
		ztrsm.$(SUFFIX) zsyrk.$(SUFFIX) zsyr2k.$(SUFFIX) \
 | 
							ztrsm.$(SUFFIX) zsyrk.$(SUFFIX) zsyr2k.$(SUFFIX) \
 | 
				
			||||||
	       	zhemm.$(SUFFIX) zherk.$(SUFFIX) zher2k.$(SUFFIX) \
 | 
						       	zhemm.$(SUFFIX) zherk.$(SUFFIX) zher2k.$(SUFFIX) \
 | 
				
			||||||
		zomatcopy.$(SUFFIX)
 | 
							zomatcopy.$(SUFFIX) zimatcopy.$(SUFFIX)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
ifdef SUPPORT_GEMM3M
 | 
					ifdef SUPPORT_GEMM3M
 | 
				
			||||||
 | 
					
 | 
				
			||||||
| 
						 | 
					@ -2032,13 +2032,25 @@ cblas_caxpby.$(SUFFIX) cblas_caxpby.$(PSUFFIX) : zaxpby.c
 | 
				
			||||||
domatcopy.$(SUFFIX) domatcopy.$(PSUFFIX) : omatcopy.c 
 | 
					domatcopy.$(SUFFIX) domatcopy.$(PSUFFIX) : omatcopy.c 
 | 
				
			||||||
	$(CC) -c $(CFLAGS) $< -o $(@F)
 | 
						$(CC) -c $(CFLAGS) $< -o $(@F)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
somatcopy.$(SUFFIX) domatcopy.$(PSUFFIX) : omatcopy.c 
 | 
					somatcopy.$(SUFFIX) somatcopy.$(PSUFFIX) : omatcopy.c 
 | 
				
			||||||
	$(CC) -c $(CFLAGS) $< -o $(@F)
 | 
						$(CC) -c $(CFLAGS) $< -o $(@F)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
comatcopy.$(SUFFIX) domatcopy.$(PSUFFIX) : zomatcopy.c 
 | 
					comatcopy.$(SUFFIX) comatcopy.$(PSUFFIX) : zomatcopy.c 
 | 
				
			||||||
	$(CC) -c $(CFLAGS) $< -o $(@F)
 | 
						$(CC) -c $(CFLAGS) $< -o $(@F)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
zomatcopy.$(SUFFIX) domatcopy.$(PSUFFIX) : zomatcopy.c 
 | 
					zomatcopy.$(SUFFIX) zomatcopy.$(PSUFFIX) : zomatcopy.c 
 | 
				
			||||||
 | 
						$(CC) -c $(CFLAGS) $< -o $(@F)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					dimatcopy.$(SUFFIX) dimatcopy.$(PSUFFIX) : imatcopy.c 
 | 
				
			||||||
 | 
						$(CC) -c $(CFLAGS) $< -o $(@F)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					simatcopy.$(SUFFIX) simatcopy.$(PSUFFIX) : imatcopy.c 
 | 
				
			||||||
 | 
						$(CC) -c $(CFLAGS) $< -o $(@F)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					cimatcopy.$(SUFFIX) cimatcopy.$(PSUFFIX) : zimatcopy.c 
 | 
				
			||||||
 | 
						$(CC) -c $(CFLAGS) $< -o $(@F)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					zimatcopy.$(SUFFIX) zimatcopy.$(PSUFFIX) : zimatcopy.c 
 | 
				
			||||||
	$(CC) -c $(CFLAGS) $< -o $(@F)
 | 
						$(CC) -c $(CFLAGS) $< -o $(@F)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
| 
						 | 
					@ -0,0 +1,142 @@
 | 
				
			||||||
 | 
					/***************************************************************************
 | 
				
			||||||
 | 
					Copyright (c) 2014, The OpenBLAS Project
 | 
				
			||||||
 | 
					All rights reserved.
 | 
				
			||||||
 | 
					Redistribution and use in source and binary forms, with or without
 | 
				
			||||||
 | 
					modification, are permitted provided that the following conditions are
 | 
				
			||||||
 | 
					met:
 | 
				
			||||||
 | 
					1. Redistributions of source code must retain the above copyright
 | 
				
			||||||
 | 
					notice, this list of conditions and the following disclaimer.
 | 
				
			||||||
 | 
					2. Redistributions in binary form must reproduce the above copyright
 | 
				
			||||||
 | 
					notice, this list of conditions and the following disclaimer in
 | 
				
			||||||
 | 
					the documentation and/or other materials provided with the
 | 
				
			||||||
 | 
					distribution.
 | 
				
			||||||
 | 
					3. Neither the name of the OpenBLAS project nor the names of
 | 
				
			||||||
 | 
					its contributors may be used to endorse or promote products
 | 
				
			||||||
 | 
					derived from this software without specific prior written permission.
 | 
				
			||||||
 | 
					THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 | 
				
			||||||
 | 
					AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 | 
				
			||||||
 | 
					IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 | 
				
			||||||
 | 
					ARE DISCLAIMED. IN NO EVENT SHALL THE OPENBLAS PROJECT OR CONTRIBUTORS BE
 | 
				
			||||||
 | 
					LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 | 
				
			||||||
 | 
					DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 | 
				
			||||||
 | 
					SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 | 
				
			||||||
 | 
					CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 | 
				
			||||||
 | 
					OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE
 | 
				
			||||||
 | 
					USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 | 
				
			||||||
 | 
					*****************************************************************************/
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/***********************************************************
 | 
				
			||||||
 | 
					 * 2014/06/10 Saar
 | 
				
			||||||
 | 
					***********************************************************/
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					#include <stdio.h>
 | 
				
			||||||
 | 
					#include <stdlib.h>
 | 
				
			||||||
 | 
					#include "common.h"
 | 
				
			||||||
 | 
					#ifdef FUNCTION_PROFILE
 | 
				
			||||||
 | 
					#include "functable.h"
 | 
				
			||||||
 | 
					#endif
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					#if defined(DOUBLE)
 | 
				
			||||||
 | 
					#define ERROR_NAME "DIMATCOPY"
 | 
				
			||||||
 | 
					#else
 | 
				
			||||||
 | 
					#define ERROR_NAME "SIMATCOPY"
 | 
				
			||||||
 | 
					#endif
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					#define BlasRowMajor 0
 | 
				
			||||||
 | 
					#define BlasColMajor 1
 | 
				
			||||||
 | 
					#define BlasNoTrans  0
 | 
				
			||||||
 | 
					#define BlasTrans    1
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					#undef malloc
 | 
				
			||||||
 | 
					#undef free
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					void NAME( char* ORDER, char* TRANS, blasint *rows, blasint *cols, FLOAT *alpha, FLOAT *a, blasint *lda, blasint *ldb)
 | 
				
			||||||
 | 
					{
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						char Order, Trans;
 | 
				
			||||||
 | 
						int order=-1,trans=-1;	
 | 
				
			||||||
 | 
						blasint info = -1;
 | 
				
			||||||
 | 
						FLOAT *b;
 | 
				
			||||||
 | 
						size_t msize;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						Order = *ORDER;
 | 
				
			||||||
 | 
						Trans = *TRANS;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						TOUPPER(Order);
 | 
				
			||||||
 | 
						TOUPPER(Trans);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						if ( Order == 'C' ) order = BlasColMajor;
 | 
				
			||||||
 | 
						if ( Order == 'R' ) order = BlasRowMajor;
 | 
				
			||||||
 | 
						if ( Trans == 'N' ) trans = BlasNoTrans;
 | 
				
			||||||
 | 
						if ( Trans == 'R' ) trans = BlasNoTrans;
 | 
				
			||||||
 | 
						if ( Trans == 'T' ) trans = BlasTrans;
 | 
				
			||||||
 | 
						if ( Trans == 'C' ) trans = BlasTrans;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						if ( order == BlasColMajor)
 | 
				
			||||||
 | 
						{
 | 
				
			||||||
 | 
					        	if ( trans == BlasNoTrans  &&  *ldb < *rows ) info = 9;
 | 
				
			||||||
 | 
					        	if ( trans == BlasTrans    &&  *ldb < *cols ) info = 9;
 | 
				
			||||||
 | 
						}
 | 
				
			||||||
 | 
						if ( order == BlasRowMajor)
 | 
				
			||||||
 | 
						{
 | 
				
			||||||
 | 
					        	if ( trans == BlasNoTrans  &&  *ldb < *cols ) info = 9;
 | 
				
			||||||
 | 
					        	if ( trans == BlasTrans    &&  *ldb < *rows ) info = 9;
 | 
				
			||||||
 | 
						}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						if ( order == BlasColMajor &&  *lda < *rows ) info = 7;
 | 
				
			||||||
 | 
						if ( order == BlasRowMajor &&  *lda < *cols ) info = 7;
 | 
				
			||||||
 | 
						if ( *cols <= 0 ) info = 4;
 | 
				
			||||||
 | 
						if ( *rows <= 0 ) info = 3;
 | 
				
			||||||
 | 
						if ( trans < 0  ) info = 2;
 | 
				
			||||||
 | 
						if ( order < 0  ) info = 1;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						if (info >= 0) {
 | 
				
			||||||
 | 
					    		BLASFUNC(xerbla)(ERROR_NAME, &info, sizeof(ERROR_NAME));
 | 
				
			||||||
 | 
					    		return;
 | 
				
			||||||
 | 
					  	}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						if ( *lda >  *ldb )
 | 
				
			||||||
 | 
							msize = (*lda) * (*ldb)  * sizeof(FLOAT);
 | 
				
			||||||
 | 
						else
 | 
				
			||||||
 | 
							msize = (*ldb) * (*ldb)  * sizeof(FLOAT);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						b = malloc(msize);
 | 
				
			||||||
 | 
						if ( b == NULL )
 | 
				
			||||||
 | 
						{
 | 
				
			||||||
 | 
							printf("Memory alloc failed\n");
 | 
				
			||||||
 | 
							exit(1);
 | 
				
			||||||
 | 
						}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						if ( order == BlasColMajor )
 | 
				
			||||||
 | 
						{
 | 
				
			||||||
 | 
							if ( trans == BlasNoTrans )
 | 
				
			||||||
 | 
							{
 | 
				
			||||||
 | 
								OMATCOPY_K_CN(*rows, *cols, *alpha, a, *lda, b, *ldb );
 | 
				
			||||||
 | 
								OMATCOPY_K_CN(*rows, *cols, (FLOAT) 1.0 , b, *ldb, a, *ldb );
 | 
				
			||||||
 | 
							}
 | 
				
			||||||
 | 
							else
 | 
				
			||||||
 | 
							{
 | 
				
			||||||
 | 
								OMATCOPY_K_CT(*rows, *cols, *alpha, a, *lda, b, *ldb );
 | 
				
			||||||
 | 
								OMATCOPY_K_CN(*rows, *cols, (FLOAT) 1.0, b, *ldb, a, *ldb );
 | 
				
			||||||
 | 
							}
 | 
				
			||||||
 | 
						}
 | 
				
			||||||
 | 
						else
 | 
				
			||||||
 | 
						{
 | 
				
			||||||
 | 
							if ( trans == BlasNoTrans )
 | 
				
			||||||
 | 
							{
 | 
				
			||||||
 | 
								OMATCOPY_K_RN(*rows, *cols, *alpha, a, *lda, b, *ldb );
 | 
				
			||||||
 | 
								OMATCOPY_K_RN(*rows, *cols, (FLOAT) 1.0, b, *ldb, a, *ldb );
 | 
				
			||||||
 | 
							}
 | 
				
			||||||
 | 
							else
 | 
				
			||||||
 | 
							{
 | 
				
			||||||
 | 
								OMATCOPY_K_RT(*rows, *cols, *alpha, a, *lda, b, *ldb );
 | 
				
			||||||
 | 
								OMATCOPY_K_RN(*rows, *cols, (FLOAT) 1.0, b, *ldb, a, *ldb );
 | 
				
			||||||
 | 
							}
 | 
				
			||||||
 | 
						}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						free(b);
 | 
				
			||||||
 | 
						return;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
| 
						 | 
					@ -0,0 +1,185 @@
 | 
				
			||||||
 | 
					/***************************************************************************
 | 
				
			||||||
 | 
					Copyright (c) 2014, The OpenBLAS Project
 | 
				
			||||||
 | 
					All rights reserved.
 | 
				
			||||||
 | 
					Redistribution and use in source and binary forms, with or without
 | 
				
			||||||
 | 
					modification, are permitted provided that the following conditions are
 | 
				
			||||||
 | 
					met:
 | 
				
			||||||
 | 
					1. Redistributions of source code must retain the above copyright
 | 
				
			||||||
 | 
					notice, this list of conditions and the following disclaimer.
 | 
				
			||||||
 | 
					2. Redistributions in binary form must reproduce the above copyright
 | 
				
			||||||
 | 
					notice, this list of conditions and the following disclaimer in
 | 
				
			||||||
 | 
					the documentation and/or other materials provided with the
 | 
				
			||||||
 | 
					distribution.
 | 
				
			||||||
 | 
					3. Neither the name of the OpenBLAS project nor the names of
 | 
				
			||||||
 | 
					its contributors may be used to endorse or promote products
 | 
				
			||||||
 | 
					derived from this software without specific prior written permission.
 | 
				
			||||||
 | 
					THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 | 
				
			||||||
 | 
					AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 | 
				
			||||||
 | 
					IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 | 
				
			||||||
 | 
					ARE DISCLAIMED. IN NO EVENT SHALL THE OPENBLAS PROJECT OR CONTRIBUTORS BE
 | 
				
			||||||
 | 
					LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 | 
				
			||||||
 | 
					DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 | 
				
			||||||
 | 
					SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 | 
				
			||||||
 | 
					CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 | 
				
			||||||
 | 
					OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE
 | 
				
			||||||
 | 
					USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 | 
				
			||||||
 | 
					*****************************************************************************/
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/***********************************************************
 | 
				
			||||||
 | 
					 * 2014/06/10 Saar
 | 
				
			||||||
 | 
					***********************************************************/
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					#include <stdio.h>
 | 
				
			||||||
 | 
					#include <stdlib.h>
 | 
				
			||||||
 | 
					#include "common.h"
 | 
				
			||||||
 | 
					#ifdef FUNCTION_PROFILE
 | 
				
			||||||
 | 
					#include "functable.h"
 | 
				
			||||||
 | 
					#endif
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					#if defined(DOUBLE)
 | 
				
			||||||
 | 
					#define ERROR_NAME "ZIMATCOPY"
 | 
				
			||||||
 | 
					#else
 | 
				
			||||||
 | 
					#define ERROR_NAME "CIMATCOPY"
 | 
				
			||||||
 | 
					#endif
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					#define BlasRowMajor     0
 | 
				
			||||||
 | 
					#define BlasColMajor     1
 | 
				
			||||||
 | 
					#define BlasNoTrans      0
 | 
				
			||||||
 | 
					#define BlasTrans        1
 | 
				
			||||||
 | 
					#define BlasTransConj    2
 | 
				
			||||||
 | 
					#define BlasConj         3
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					void NAME( char* ORDER, char* TRANS, blasint *rows, blasint *cols, FLOAT *alpha, FLOAT *a, blasint *lda, blasint *ldb)
 | 
				
			||||||
 | 
					{
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						char Order, Trans;
 | 
				
			||||||
 | 
						int order=-1,trans=-1;	
 | 
				
			||||||
 | 
						blasint info = -1;
 | 
				
			||||||
 | 
						FLOAT *b;
 | 
				
			||||||
 | 
						size_t msize;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						Order = *ORDER;
 | 
				
			||||||
 | 
						Trans = *TRANS;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						TOUPPER(Order);
 | 
				
			||||||
 | 
						TOUPPER(Trans);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						if ( Order == 'C' ) order = BlasColMajor;
 | 
				
			||||||
 | 
						if ( Order == 'R' ) order = BlasRowMajor;
 | 
				
			||||||
 | 
						if ( Trans == 'N' ) trans = BlasNoTrans;
 | 
				
			||||||
 | 
						if ( Trans == 'T' ) trans = BlasTrans;
 | 
				
			||||||
 | 
						if ( Trans == 'C' ) trans = BlasTransConj;
 | 
				
			||||||
 | 
						if ( Trans == 'R' ) trans = BlasConj;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						if ( order == BlasColMajor)
 | 
				
			||||||
 | 
						{
 | 
				
			||||||
 | 
					        	if ( trans == BlasNoTrans      &&  *ldb < *rows ) info = 9;
 | 
				
			||||||
 | 
					        	if ( trans == BlasConj         &&  *ldb < *rows ) info = 9;
 | 
				
			||||||
 | 
					        	if ( trans == BlasTrans        &&  *ldb < *cols ) info = 9;
 | 
				
			||||||
 | 
					        	if ( trans == BlasTransConj    &&  *ldb < *cols ) info = 9;
 | 
				
			||||||
 | 
						}
 | 
				
			||||||
 | 
						if ( order == BlasRowMajor)
 | 
				
			||||||
 | 
						{
 | 
				
			||||||
 | 
					        	if ( trans == BlasNoTrans    &&  *ldb < *cols ) info = 9;
 | 
				
			||||||
 | 
					        	if ( trans == BlasConj       &&  *ldb < *cols ) info = 9;
 | 
				
			||||||
 | 
					        	if ( trans == BlasTrans      &&  *ldb < *rows ) info = 9;
 | 
				
			||||||
 | 
					        	if ( trans == BlasTransConj  &&  *ldb < *rows ) info = 9;
 | 
				
			||||||
 | 
						}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						if ( order == BlasColMajor &&  *lda < *rows ) info = 7;
 | 
				
			||||||
 | 
						if ( order == BlasRowMajor &&  *lda < *cols ) info = 7;
 | 
				
			||||||
 | 
						if ( *cols <= 0 ) info = 4;
 | 
				
			||||||
 | 
						if ( *rows <= 0 ) info = 3;
 | 
				
			||||||
 | 
						if ( trans < 0  ) info = 2;
 | 
				
			||||||
 | 
						if ( order < 0  ) info = 1;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						if (info >= 0) {
 | 
				
			||||||
 | 
					    		BLASFUNC(xerbla)(ERROR_NAME, &info, sizeof(ERROR_NAME));
 | 
				
			||||||
 | 
					    		return;
 | 
				
			||||||
 | 
					  	}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						if ( *lda >  *ldb )
 | 
				
			||||||
 | 
					                msize = (*lda) * (*ldb)  * sizeof(FLOAT) * 2;
 | 
				
			||||||
 | 
					        else
 | 
				
			||||||
 | 
					                msize = (*ldb) * (*ldb)  * sizeof(FLOAT) * 2;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					        b = malloc(msize);
 | 
				
			||||||
 | 
					        if ( b == NULL )
 | 
				
			||||||
 | 
					        {
 | 
				
			||||||
 | 
					                printf("Memory alloc failed\n");
 | 
				
			||||||
 | 
					                exit(1);
 | 
				
			||||||
 | 
					        }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						if ( order == BlasColMajor )
 | 
				
			||||||
 | 
						{
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
							if ( trans == BlasNoTrans )
 | 
				
			||||||
 | 
							{
 | 
				
			||||||
 | 
						  		OMATCOPY_K_CN(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb );
 | 
				
			||||||
 | 
						  		OMATCOPY_K_CN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb );
 | 
				
			||||||
 | 
								free(b);
 | 
				
			||||||
 | 
								return;
 | 
				
			||||||
 | 
							}
 | 
				
			||||||
 | 
							if ( trans == BlasConj )
 | 
				
			||||||
 | 
							{
 | 
				
			||||||
 | 
								OMATCOPY_K_CNC(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb );
 | 
				
			||||||
 | 
						  		OMATCOPY_K_CN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb );
 | 
				
			||||||
 | 
								free(b);
 | 
				
			||||||
 | 
								return;
 | 
				
			||||||
 | 
							}
 | 
				
			||||||
 | 
							if ( trans == BlasTrans )
 | 
				
			||||||
 | 
							{
 | 
				
			||||||
 | 
								OMATCOPY_K_CT(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb );
 | 
				
			||||||
 | 
						  		OMATCOPY_K_CN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb );
 | 
				
			||||||
 | 
								free(b);
 | 
				
			||||||
 | 
								return;
 | 
				
			||||||
 | 
							}
 | 
				
			||||||
 | 
							if ( trans == BlasTransConj )
 | 
				
			||||||
 | 
							{
 | 
				
			||||||
 | 
								OMATCOPY_K_CTC(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb );
 | 
				
			||||||
 | 
						  		OMATCOPY_K_CN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb );
 | 
				
			||||||
 | 
								free(b);
 | 
				
			||||||
 | 
								return;
 | 
				
			||||||
 | 
							}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						}
 | 
				
			||||||
 | 
						else
 | 
				
			||||||
 | 
						{
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
							if ( trans == BlasNoTrans )
 | 
				
			||||||
 | 
							{
 | 
				
			||||||
 | 
								OMATCOPY_K_RN(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb );
 | 
				
			||||||
 | 
						  		OMATCOPY_K_RN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb );
 | 
				
			||||||
 | 
								free(b);
 | 
				
			||||||
 | 
								return;
 | 
				
			||||||
 | 
							}
 | 
				
			||||||
 | 
							if ( trans == BlasConj )
 | 
				
			||||||
 | 
							{
 | 
				
			||||||
 | 
								OMATCOPY_K_RNC(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb );
 | 
				
			||||||
 | 
						  		OMATCOPY_K_RN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb );
 | 
				
			||||||
 | 
								free(b);
 | 
				
			||||||
 | 
								return;
 | 
				
			||||||
 | 
							}
 | 
				
			||||||
 | 
							if ( trans == BlasTrans )
 | 
				
			||||||
 | 
							{
 | 
				
			||||||
 | 
								OMATCOPY_K_RT(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb );
 | 
				
			||||||
 | 
						  		OMATCOPY_K_RN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb );
 | 
				
			||||||
 | 
								free(b);
 | 
				
			||||||
 | 
								return;
 | 
				
			||||||
 | 
							}
 | 
				
			||||||
 | 
							if ( trans == BlasTransConj )
 | 
				
			||||||
 | 
							{
 | 
				
			||||||
 | 
								OMATCOPY_K_RTC(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb );
 | 
				
			||||||
 | 
						  		OMATCOPY_K_RN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb );
 | 
				
			||||||
 | 
								free(b);
 | 
				
			||||||
 | 
								return;
 | 
				
			||||||
 | 
							}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
						return;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
		Loading…
	
		Reference in New Issue