Ref #51: added blas extensions simatcopy, dimatcopy, cimatcopy, zimatcopy
This commit is contained in:
		
							parent
							
								
									cee257f384
								
							
						
					
					
						commit
						faeab93df0
					
				|  | @ -769,6 +769,11 @@ void    BLASFUNC(domatcopy) (char *, char *, blasint *, blasint *, double  *, do | ||||||
| void    BLASFUNC(comatcopy) (char *, char *, blasint *, blasint *, float  *, float  *, blasint *, float  *, blasint *); | void    BLASFUNC(comatcopy) (char *, char *, blasint *, blasint *, float  *, float  *, blasint *, float  *, blasint *); | ||||||
| void    BLASFUNC(zomatcopy) (char *, char *, blasint *, blasint *, double  *, double  *, blasint *, double  *, blasint *); | void    BLASFUNC(zomatcopy) (char *, char *, blasint *, blasint *, double  *, double  *, blasint *, double  *, blasint *); | ||||||
| 
 | 
 | ||||||
|  | void    BLASFUNC(simatcopy) (char *, char *, blasint *, blasint *, float  *, float  *, blasint *, blasint *); | ||||||
|  | void    BLASFUNC(dimatcopy) (char *, char *, blasint *, blasint *, double  *, double  *, blasint *, blasint *); | ||||||
|  | void    BLASFUNC(cimatcopy) (char *, char *, blasint *, blasint *, float  *, float  *, blasint *, blasint *); | ||||||
|  | void    BLASFUNC(zimatcopy) (char *, char *, blasint *, blasint *, double  *, double  *, blasint *, blasint *); | ||||||
|  | 
 | ||||||
| #ifdef __cplusplus | #ifdef __cplusplus | ||||||
| } | } | ||||||
|       |       | ||||||
|  |  | ||||||
|  | @ -41,7 +41,7 @@ SBLAS2OBJS    = \ | ||||||
| SBLAS3OBJS    = \
 | SBLAS3OBJS    = \
 | ||||||
| 		sgemm.$(SUFFIX) ssymm.$(SUFFIX) strmm.$(SUFFIX) \
 | 		sgemm.$(SUFFIX) ssymm.$(SUFFIX) strmm.$(SUFFIX) \
 | ||||||
| 		strsm.$(SUFFIX) ssyrk.$(SUFFIX) ssyr2k.$(SUFFIX) \
 | 		strsm.$(SUFFIX) ssyrk.$(SUFFIX) ssyr2k.$(SUFFIX) \
 | ||||||
| 		somatcopy.$(SUFFIX) | 		somatcopy.$(SUFFIX) simatcopy.$(SUFFIX) | ||||||
| 
 | 
 | ||||||
| 
 | 
 | ||||||
| DBLAS1OBJS    = \
 | DBLAS1OBJS    = \
 | ||||||
|  | @ -66,7 +66,7 @@ DBLAS2OBJS    = \ | ||||||
| DBLAS3OBJS    = \
 | DBLAS3OBJS    = \
 | ||||||
| 		dgemm.$(SUFFIX) dsymm.$(SUFFIX) dtrmm.$(SUFFIX) \
 | 		dgemm.$(SUFFIX) dsymm.$(SUFFIX) dtrmm.$(SUFFIX) \
 | ||||||
| 		dtrsm.$(SUFFIX) dsyrk.$(SUFFIX) dsyr2k.$(SUFFIX) \
 | 		dtrsm.$(SUFFIX) dsyrk.$(SUFFIX) dsyr2k.$(SUFFIX) \
 | ||||||
| 		domatcopy.$(SUFFIX) | 		domatcopy.$(SUFFIX) dimatcopy.$(SUFFIX) | ||||||
| 
 | 
 | ||||||
| CBLAS1OBJS    = \
 | CBLAS1OBJS    = \
 | ||||||
| 		caxpy.$(SUFFIX) caxpyc.$(SUFFIX) cswap.$(SUFFIX) \
 | 		caxpy.$(SUFFIX) caxpyc.$(SUFFIX) cswap.$(SUFFIX) \
 | ||||||
|  | @ -94,7 +94,7 @@ CBLAS3OBJS    = \ | ||||||
| 		cgemm.$(SUFFIX) csymm.$(SUFFIX) ctrmm.$(SUFFIX) \
 | 		cgemm.$(SUFFIX) csymm.$(SUFFIX) ctrmm.$(SUFFIX) \
 | ||||||
| 		ctrsm.$(SUFFIX) csyrk.$(SUFFIX) csyr2k.$(SUFFIX) \
 | 		ctrsm.$(SUFFIX) csyrk.$(SUFFIX) csyr2k.$(SUFFIX) \
 | ||||||
| 	       	chemm.$(SUFFIX) cherk.$(SUFFIX) cher2k.$(SUFFIX) \
 | 	       	chemm.$(SUFFIX) cherk.$(SUFFIX) cher2k.$(SUFFIX) \
 | ||||||
| 		comatcopy.$(SUFFIX) | 		comatcopy.$(SUFFIX) cimatcopy.$(SUFFIX) | ||||||
| 
 | 
 | ||||||
| ZBLAS1OBJS    = \
 | ZBLAS1OBJS    = \
 | ||||||
| 		zaxpy.$(SUFFIX) zaxpyc.$(SUFFIX) zswap.$(SUFFIX) \
 | 		zaxpy.$(SUFFIX) zaxpyc.$(SUFFIX) zswap.$(SUFFIX) \
 | ||||||
|  | @ -122,7 +122,7 @@ ZBLAS3OBJS    = \ | ||||||
| 		zgemm.$(SUFFIX) zsymm.$(SUFFIX) ztrmm.$(SUFFIX) \
 | 		zgemm.$(SUFFIX) zsymm.$(SUFFIX) ztrmm.$(SUFFIX) \
 | ||||||
| 		ztrsm.$(SUFFIX) zsyrk.$(SUFFIX) zsyr2k.$(SUFFIX) \
 | 		ztrsm.$(SUFFIX) zsyrk.$(SUFFIX) zsyr2k.$(SUFFIX) \
 | ||||||
| 	       	zhemm.$(SUFFIX) zherk.$(SUFFIX) zher2k.$(SUFFIX) \
 | 	       	zhemm.$(SUFFIX) zherk.$(SUFFIX) zher2k.$(SUFFIX) \
 | ||||||
| 		zomatcopy.$(SUFFIX) | 		zomatcopy.$(SUFFIX) zimatcopy.$(SUFFIX) | ||||||
| 
 | 
 | ||||||
| ifdef SUPPORT_GEMM3M | ifdef SUPPORT_GEMM3M | ||||||
| 
 | 
 | ||||||
|  | @ -2032,13 +2032,25 @@ cblas_caxpby.$(SUFFIX) cblas_caxpby.$(PSUFFIX) : zaxpby.c | ||||||
| domatcopy.$(SUFFIX) domatcopy.$(PSUFFIX) : omatcopy.c  | domatcopy.$(SUFFIX) domatcopy.$(PSUFFIX) : omatcopy.c  | ||||||
| 	$(CC) -c $(CFLAGS) $< -o $(@F) | 	$(CC) -c $(CFLAGS) $< -o $(@F) | ||||||
| 
 | 
 | ||||||
| somatcopy.$(SUFFIX) domatcopy.$(PSUFFIX) : omatcopy.c  | somatcopy.$(SUFFIX) somatcopy.$(PSUFFIX) : omatcopy.c  | ||||||
| 	$(CC) -c $(CFLAGS) $< -o $(@F) | 	$(CC) -c $(CFLAGS) $< -o $(@F) | ||||||
| 
 | 
 | ||||||
| comatcopy.$(SUFFIX) domatcopy.$(PSUFFIX) : zomatcopy.c  | comatcopy.$(SUFFIX) comatcopy.$(PSUFFIX) : zomatcopy.c  | ||||||
| 	$(CC) -c $(CFLAGS) $< -o $(@F) | 	$(CC) -c $(CFLAGS) $< -o $(@F) | ||||||
| 
 | 
 | ||||||
| zomatcopy.$(SUFFIX) domatcopy.$(PSUFFIX) : zomatcopy.c  | zomatcopy.$(SUFFIX) zomatcopy.$(PSUFFIX) : zomatcopy.c  | ||||||
|  | 	$(CC) -c $(CFLAGS) $< -o $(@F) | ||||||
|  | 
 | ||||||
|  | dimatcopy.$(SUFFIX) dimatcopy.$(PSUFFIX) : imatcopy.c  | ||||||
|  | 	$(CC) -c $(CFLAGS) $< -o $(@F) | ||||||
|  | 
 | ||||||
|  | simatcopy.$(SUFFIX) simatcopy.$(PSUFFIX) : imatcopy.c  | ||||||
|  | 	$(CC) -c $(CFLAGS) $< -o $(@F) | ||||||
|  | 
 | ||||||
|  | cimatcopy.$(SUFFIX) cimatcopy.$(PSUFFIX) : zimatcopy.c  | ||||||
|  | 	$(CC) -c $(CFLAGS) $< -o $(@F) | ||||||
|  | 
 | ||||||
|  | zimatcopy.$(SUFFIX) zimatcopy.$(PSUFFIX) : zimatcopy.c  | ||||||
| 	$(CC) -c $(CFLAGS) $< -o $(@F) | 	$(CC) -c $(CFLAGS) $< -o $(@F) | ||||||
| 
 | 
 | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
|  | @ -0,0 +1,142 @@ | ||||||
|  | /***************************************************************************
 | ||||||
|  | Copyright (c) 2014, The OpenBLAS Project | ||||||
|  | All rights reserved. | ||||||
|  | Redistribution and use in source and binary forms, with or without | ||||||
|  | modification, are permitted provided that the following conditions are | ||||||
|  | met: | ||||||
|  | 1. Redistributions of source code must retain the above copyright | ||||||
|  | notice, this list of conditions and the following disclaimer. | ||||||
|  | 2. Redistributions in binary form must reproduce the above copyright | ||||||
|  | notice, this list of conditions and the following disclaimer in | ||||||
|  | the documentation and/or other materials provided with the | ||||||
|  | distribution. | ||||||
|  | 3. Neither the name of the OpenBLAS project nor the names of | ||||||
|  | its contributors may be used to endorse or promote products | ||||||
|  | derived from this software without specific prior written permission. | ||||||
|  | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  | AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  | IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  | ARE DISCLAIMED. IN NO EVENT SHALL THE OPENBLAS PROJECT OR CONTRIBUTORS BE | ||||||
|  | LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL | ||||||
|  | DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR | ||||||
|  | SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER | ||||||
|  | CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, | ||||||
|  | OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE | ||||||
|  | USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
|  | *****************************************************************************/ | ||||||
|  | 
 | ||||||
|  | /***********************************************************
 | ||||||
|  |  * 2014/06/10 Saar | ||||||
|  | ***********************************************************/ | ||||||
|  | 
 | ||||||
|  | #include <stdio.h> | ||||||
|  | #include <stdlib.h> | ||||||
|  | #include "common.h" | ||||||
|  | #ifdef FUNCTION_PROFILE | ||||||
|  | #include "functable.h" | ||||||
|  | #endif | ||||||
|  | 
 | ||||||
|  | #if defined(DOUBLE) | ||||||
|  | #define ERROR_NAME "DIMATCOPY" | ||||||
|  | #else | ||||||
|  | #define ERROR_NAME "SIMATCOPY" | ||||||
|  | #endif | ||||||
|  | 
 | ||||||
|  | #define BlasRowMajor 0 | ||||||
|  | #define BlasColMajor 1 | ||||||
|  | #define BlasNoTrans  0 | ||||||
|  | #define BlasTrans    1 | ||||||
|  | 
 | ||||||
|  | #undef malloc | ||||||
|  | #undef free | ||||||
|  | 
 | ||||||
|  | void NAME( char* ORDER, char* TRANS, blasint *rows, blasint *cols, FLOAT *alpha, FLOAT *a, blasint *lda, blasint *ldb) | ||||||
|  | { | ||||||
|  | 
 | ||||||
|  | 	char Order, Trans; | ||||||
|  | 	int order=-1,trans=-1;	 | ||||||
|  | 	blasint info = -1; | ||||||
|  | 	FLOAT *b; | ||||||
|  | 	size_t msize; | ||||||
|  | 
 | ||||||
|  | 	Order = *ORDER; | ||||||
|  | 	Trans = *TRANS; | ||||||
|  | 
 | ||||||
|  | 	TOUPPER(Order); | ||||||
|  | 	TOUPPER(Trans); | ||||||
|  | 
 | ||||||
|  | 	if ( Order == 'C' ) order = BlasColMajor; | ||||||
|  | 	if ( Order == 'R' ) order = BlasRowMajor; | ||||||
|  | 	if ( Trans == 'N' ) trans = BlasNoTrans; | ||||||
|  | 	if ( Trans == 'R' ) trans = BlasNoTrans; | ||||||
|  | 	if ( Trans == 'T' ) trans = BlasTrans; | ||||||
|  | 	if ( Trans == 'C' ) trans = BlasTrans; | ||||||
|  | 
 | ||||||
|  | 	if ( order == BlasColMajor) | ||||||
|  | 	{ | ||||||
|  |         	if ( trans == BlasNoTrans  &&  *ldb < *rows ) info = 9; | ||||||
|  |         	if ( trans == BlasTrans    &&  *ldb < *cols ) info = 9; | ||||||
|  | 	} | ||||||
|  | 	if ( order == BlasRowMajor) | ||||||
|  | 	{ | ||||||
|  |         	if ( trans == BlasNoTrans  &&  *ldb < *cols ) info = 9; | ||||||
|  |         	if ( trans == BlasTrans    &&  *ldb < *rows ) info = 9; | ||||||
|  | 	} | ||||||
|  | 
 | ||||||
|  | 	if ( order == BlasColMajor &&  *lda < *rows ) info = 7; | ||||||
|  | 	if ( order == BlasRowMajor &&  *lda < *cols ) info = 7; | ||||||
|  | 	if ( *cols <= 0 ) info = 4; | ||||||
|  | 	if ( *rows <= 0 ) info = 3; | ||||||
|  | 	if ( trans < 0  ) info = 2; | ||||||
|  | 	if ( order < 0  ) info = 1; | ||||||
|  | 
 | ||||||
|  | 	if (info >= 0) { | ||||||
|  |     		BLASFUNC(xerbla)(ERROR_NAME, &info, sizeof(ERROR_NAME)); | ||||||
|  |     		return; | ||||||
|  |   	} | ||||||
|  | 
 | ||||||
|  | 	if ( *lda >  *ldb ) | ||||||
|  | 		msize = (*lda) * (*ldb)  * sizeof(FLOAT); | ||||||
|  | 	else | ||||||
|  | 		msize = (*ldb) * (*ldb)  * sizeof(FLOAT); | ||||||
|  | 
 | ||||||
|  | 	b = malloc(msize); | ||||||
|  | 	if ( b == NULL ) | ||||||
|  | 	{ | ||||||
|  | 		printf("Memory alloc failed\n"); | ||||||
|  | 		exit(1); | ||||||
|  | 	} | ||||||
|  | 
 | ||||||
|  | 	if ( order == BlasColMajor ) | ||||||
|  | 	{ | ||||||
|  | 		if ( trans == BlasNoTrans ) | ||||||
|  | 		{ | ||||||
|  | 			OMATCOPY_K_CN(*rows, *cols, *alpha, a, *lda, b, *ldb ); | ||||||
|  | 			OMATCOPY_K_CN(*rows, *cols, (FLOAT) 1.0 , b, *ldb, a, *ldb ); | ||||||
|  | 		} | ||||||
|  | 		else | ||||||
|  | 		{ | ||||||
|  | 			OMATCOPY_K_CT(*rows, *cols, *alpha, a, *lda, b, *ldb ); | ||||||
|  | 			OMATCOPY_K_CN(*rows, *cols, (FLOAT) 1.0, b, *ldb, a, *ldb ); | ||||||
|  | 		} | ||||||
|  | 	} | ||||||
|  | 	else | ||||||
|  | 	{ | ||||||
|  | 		if ( trans == BlasNoTrans ) | ||||||
|  | 		{ | ||||||
|  | 			OMATCOPY_K_RN(*rows, *cols, *alpha, a, *lda, b, *ldb ); | ||||||
|  | 			OMATCOPY_K_RN(*rows, *cols, (FLOAT) 1.0, b, *ldb, a, *ldb ); | ||||||
|  | 		} | ||||||
|  | 		else | ||||||
|  | 		{ | ||||||
|  | 			OMATCOPY_K_RT(*rows, *cols, *alpha, a, *lda, b, *ldb ); | ||||||
|  | 			OMATCOPY_K_RN(*rows, *cols, (FLOAT) 1.0, b, *ldb, a, *ldb ); | ||||||
|  | 		} | ||||||
|  | 	} | ||||||
|  | 
 | ||||||
|  | 	free(b); | ||||||
|  | 	return; | ||||||
|  | 
 | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
|  | @ -0,0 +1,185 @@ | ||||||
|  | /***************************************************************************
 | ||||||
|  | Copyright (c) 2014, The OpenBLAS Project | ||||||
|  | All rights reserved. | ||||||
|  | Redistribution and use in source and binary forms, with or without | ||||||
|  | modification, are permitted provided that the following conditions are | ||||||
|  | met: | ||||||
|  | 1. Redistributions of source code must retain the above copyright | ||||||
|  | notice, this list of conditions and the following disclaimer. | ||||||
|  | 2. Redistributions in binary form must reproduce the above copyright | ||||||
|  | notice, this list of conditions and the following disclaimer in | ||||||
|  | the documentation and/or other materials provided with the | ||||||
|  | distribution. | ||||||
|  | 3. Neither the name of the OpenBLAS project nor the names of | ||||||
|  | its contributors may be used to endorse or promote products | ||||||
|  | derived from this software without specific prior written permission. | ||||||
|  | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  | AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  | IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  | ARE DISCLAIMED. IN NO EVENT SHALL THE OPENBLAS PROJECT OR CONTRIBUTORS BE | ||||||
|  | LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL | ||||||
|  | DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR | ||||||
|  | SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER | ||||||
|  | CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, | ||||||
|  | OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE | ||||||
|  | USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
|  | *****************************************************************************/ | ||||||
|  | 
 | ||||||
|  | /***********************************************************
 | ||||||
|  |  * 2014/06/10 Saar | ||||||
|  | ***********************************************************/ | ||||||
|  | 
 | ||||||
|  | #include <stdio.h> | ||||||
|  | #include <stdlib.h> | ||||||
|  | #include "common.h" | ||||||
|  | #ifdef FUNCTION_PROFILE | ||||||
|  | #include "functable.h" | ||||||
|  | #endif | ||||||
|  | 
 | ||||||
|  | #if defined(DOUBLE) | ||||||
|  | #define ERROR_NAME "ZIMATCOPY" | ||||||
|  | #else | ||||||
|  | #define ERROR_NAME "CIMATCOPY" | ||||||
|  | #endif | ||||||
|  | 
 | ||||||
|  | #define BlasRowMajor     0 | ||||||
|  | #define BlasColMajor     1 | ||||||
|  | #define BlasNoTrans      0 | ||||||
|  | #define BlasTrans        1 | ||||||
|  | #define BlasTransConj    2 | ||||||
|  | #define BlasConj         3 | ||||||
|  | 
 | ||||||
|  | void NAME( char* ORDER, char* TRANS, blasint *rows, blasint *cols, FLOAT *alpha, FLOAT *a, blasint *lda, blasint *ldb) | ||||||
|  | { | ||||||
|  | 
 | ||||||
|  | 	char Order, Trans; | ||||||
|  | 	int order=-1,trans=-1;	 | ||||||
|  | 	blasint info = -1; | ||||||
|  | 	FLOAT *b; | ||||||
|  | 	size_t msize; | ||||||
|  | 
 | ||||||
|  | 	Order = *ORDER; | ||||||
|  | 	Trans = *TRANS; | ||||||
|  | 
 | ||||||
|  | 	TOUPPER(Order); | ||||||
|  | 	TOUPPER(Trans); | ||||||
|  | 
 | ||||||
|  | 	if ( Order == 'C' ) order = BlasColMajor; | ||||||
|  | 	if ( Order == 'R' ) order = BlasRowMajor; | ||||||
|  | 	if ( Trans == 'N' ) trans = BlasNoTrans; | ||||||
|  | 	if ( Trans == 'T' ) trans = BlasTrans; | ||||||
|  | 	if ( Trans == 'C' ) trans = BlasTransConj; | ||||||
|  | 	if ( Trans == 'R' ) trans = BlasConj; | ||||||
|  | 
 | ||||||
|  | 	if ( order == BlasColMajor) | ||||||
|  | 	{ | ||||||
|  |         	if ( trans == BlasNoTrans      &&  *ldb < *rows ) info = 9; | ||||||
|  |         	if ( trans == BlasConj         &&  *ldb < *rows ) info = 9; | ||||||
|  |         	if ( trans == BlasTrans        &&  *ldb < *cols ) info = 9; | ||||||
|  |         	if ( trans == BlasTransConj    &&  *ldb < *cols ) info = 9; | ||||||
|  | 	} | ||||||
|  | 	if ( order == BlasRowMajor) | ||||||
|  | 	{ | ||||||
|  |         	if ( trans == BlasNoTrans    &&  *ldb < *cols ) info = 9; | ||||||
|  |         	if ( trans == BlasConj       &&  *ldb < *cols ) info = 9; | ||||||
|  |         	if ( trans == BlasTrans      &&  *ldb < *rows ) info = 9; | ||||||
|  |         	if ( trans == BlasTransConj  &&  *ldb < *rows ) info = 9; | ||||||
|  | 	} | ||||||
|  | 
 | ||||||
|  | 	if ( order == BlasColMajor &&  *lda < *rows ) info = 7; | ||||||
|  | 	if ( order == BlasRowMajor &&  *lda < *cols ) info = 7; | ||||||
|  | 	if ( *cols <= 0 ) info = 4; | ||||||
|  | 	if ( *rows <= 0 ) info = 3; | ||||||
|  | 	if ( trans < 0  ) info = 2; | ||||||
|  | 	if ( order < 0  ) info = 1; | ||||||
|  | 
 | ||||||
|  | 	if (info >= 0) { | ||||||
|  |     		BLASFUNC(xerbla)(ERROR_NAME, &info, sizeof(ERROR_NAME)); | ||||||
|  |     		return; | ||||||
|  |   	} | ||||||
|  | 
 | ||||||
|  | 	if ( *lda >  *ldb ) | ||||||
|  |                 msize = (*lda) * (*ldb)  * sizeof(FLOAT) * 2; | ||||||
|  |         else | ||||||
|  |                 msize = (*ldb) * (*ldb)  * sizeof(FLOAT) * 2; | ||||||
|  | 
 | ||||||
|  |         b = malloc(msize); | ||||||
|  |         if ( b == NULL ) | ||||||
|  |         { | ||||||
|  |                 printf("Memory alloc failed\n"); | ||||||
|  |                 exit(1); | ||||||
|  |         } | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
|  | 	if ( order == BlasColMajor ) | ||||||
|  | 	{ | ||||||
|  | 
 | ||||||
|  | 		if ( trans == BlasNoTrans ) | ||||||
|  | 		{ | ||||||
|  | 	  		OMATCOPY_K_CN(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb ); | ||||||
|  | 	  		OMATCOPY_K_CN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb ); | ||||||
|  | 			free(b); | ||||||
|  | 			return; | ||||||
|  | 		} | ||||||
|  | 		if ( trans == BlasConj ) | ||||||
|  | 		{ | ||||||
|  | 			OMATCOPY_K_CNC(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb ); | ||||||
|  | 	  		OMATCOPY_K_CN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb ); | ||||||
|  | 			free(b); | ||||||
|  | 			return; | ||||||
|  | 		} | ||||||
|  | 		if ( trans == BlasTrans ) | ||||||
|  | 		{ | ||||||
|  | 			OMATCOPY_K_CT(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb ); | ||||||
|  | 	  		OMATCOPY_K_CN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb ); | ||||||
|  | 			free(b); | ||||||
|  | 			return; | ||||||
|  | 		} | ||||||
|  | 		if ( trans == BlasTransConj ) | ||||||
|  | 		{ | ||||||
|  | 			OMATCOPY_K_CTC(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb ); | ||||||
|  | 	  		OMATCOPY_K_CN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb ); | ||||||
|  | 			free(b); | ||||||
|  | 			return; | ||||||
|  | 		} | ||||||
|  | 
 | ||||||
|  | 	} | ||||||
|  | 	else | ||||||
|  | 	{ | ||||||
|  | 
 | ||||||
|  | 		if ( trans == BlasNoTrans ) | ||||||
|  | 		{ | ||||||
|  | 			OMATCOPY_K_RN(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb ); | ||||||
|  | 	  		OMATCOPY_K_RN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb ); | ||||||
|  | 			free(b); | ||||||
|  | 			return; | ||||||
|  | 		} | ||||||
|  | 		if ( trans == BlasConj ) | ||||||
|  | 		{ | ||||||
|  | 			OMATCOPY_K_RNC(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb ); | ||||||
|  | 	  		OMATCOPY_K_RN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb ); | ||||||
|  | 			free(b); | ||||||
|  | 			return; | ||||||
|  | 		} | ||||||
|  | 		if ( trans == BlasTrans ) | ||||||
|  | 		{ | ||||||
|  | 			OMATCOPY_K_RT(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb ); | ||||||
|  | 	  		OMATCOPY_K_RN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb ); | ||||||
|  | 			free(b); | ||||||
|  | 			return; | ||||||
|  | 		} | ||||||
|  | 		if ( trans == BlasTransConj ) | ||||||
|  | 		{ | ||||||
|  | 			OMATCOPY_K_RTC(*rows, *cols, alpha[0], alpha[1], a, *lda, b, *ldb ); | ||||||
|  | 	  		OMATCOPY_K_RN(*rows, *cols, (FLOAT) 1.0, (FLOAT) 0.0 , b, *ldb, a, *ldb ); | ||||||
|  | 			free(b); | ||||||
|  | 			return; | ||||||
|  | 		} | ||||||
|  | 
 | ||||||
|  | 	} | ||||||
|  | 
 | ||||||
|  | 	return; | ||||||
|  | 
 | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
		Loading…
	
		Reference in New Issue