136 lines
5.8 KiB
C
136 lines
5.8 KiB
C
/*****************************************************************************
|
|
Copyright (c) 2014, Intel Corp.
|
|
All rights reserved.
|
|
|
|
Redistribution and use in source and binary forms, with or without
|
|
modification, are permitted provided that the following conditions are met:
|
|
|
|
* Redistributions of source code must retain the above copyright notice,
|
|
this list of conditions and the following disclaimer.
|
|
* Redistributions in binary form must reproduce the above copyright
|
|
notice, this list of conditions and the following disclaimer in the
|
|
documentation and/or other materials provided with the distribution.
|
|
* Neither the name of Intel Corporation nor the names of its contributors
|
|
may be used to endorse or promote products derived from this software
|
|
without specific prior written permission.
|
|
|
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
|
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
|
|
THE POSSIBILITY OF SUCH DAMAGE.
|
|
*****************************************************************************
|
|
* Contents: Native middle-level C interface to LAPACK function clarfb
|
|
* Author: Intel Corporation
|
|
*****************************************************************************/
|
|
|
|
#include "lapacke_utils.h"
|
|
|
|
lapack_int LAPACKE_clarfb_work( int matrix_layout, char side, char trans,
|
|
char direct, char storev, lapack_int m,
|
|
lapack_int n, lapack_int k,
|
|
const lapack_complex_float* v, lapack_int ldv,
|
|
const lapack_complex_float* t, lapack_int ldt,
|
|
lapack_complex_float* c, lapack_int ldc,
|
|
lapack_complex_float* work, lapack_int ldwork )
|
|
{
|
|
lapack_int info = 0;
|
|
lapack_int nrows_v, ncols_v;
|
|
lapack_logical left, col, forward;
|
|
char uplo;
|
|
lapack_int ldc_t, ldt_t, ldv_t;
|
|
lapack_complex_float *v_t = NULL, *t_t = NULL, *c_t = NULL;
|
|
if( matrix_layout == LAPACK_COL_MAJOR ) {
|
|
/* Call LAPACK function and adjust info */
|
|
LAPACK_clarfb( &side, &trans, &direct, &storev, &m, &n, &k, v, &ldv, t,
|
|
&ldt, c, &ldc, work, &ldwork );
|
|
if( info < 0 ) {
|
|
info = info - 1;
|
|
}
|
|
} else if( matrix_layout == LAPACK_ROW_MAJOR ) {
|
|
left = LAPACKE_lsame( side, 'l' );
|
|
col = LAPACKE_lsame( storev, 'c' );
|
|
forward = LAPACKE_lsame( direct, 'f' );
|
|
|
|
nrows_v = ( col && left ) ? m : ( ( col && !left ) ? n : ( !col ? k : 1) );
|
|
ncols_v = ( !col && left ) ? m : ( ( !col && !left ) ? n : ( col ? k : 1 ) );
|
|
uplo = ( ( forward && col ) || !( forward || col ) ) ? 'l' : 'u';
|
|
|
|
ldc_t = MAX(1,m);
|
|
ldt_t = MAX(1,k);
|
|
ldv_t = MAX(1,nrows_v);
|
|
/* Check leading dimension(s) */
|
|
if( ldc < n ) {
|
|
info = -14;
|
|
LAPACKE_xerbla( "LAPACKE_clarfb_work", info );
|
|
return info;
|
|
}
|
|
if( ldt < k ) {
|
|
info = -12;
|
|
LAPACKE_xerbla( "LAPACKE_clarfb_work", info );
|
|
return info;
|
|
}
|
|
if( ldv < ncols_v ) {
|
|
info = -10;
|
|
LAPACKE_xerbla( "LAPACKE_clarfb_work", info );
|
|
return info;
|
|
}
|
|
if( ( col && k > nrows_v ) || ( !col && k > ncols_v ) ) {
|
|
info = -8;
|
|
LAPACKE_xerbla( "LAPACKE_clarfb_work", info );
|
|
return info;
|
|
}
|
|
/* Allocate memory for temporary array(s) */
|
|
v_t = (lapack_complex_float*)
|
|
LAPACKE_malloc( sizeof(lapack_complex_float) *
|
|
ldv_t * MAX(1,ncols_v) );
|
|
if( v_t == NULL ) {
|
|
info = LAPACK_TRANSPOSE_MEMORY_ERROR;
|
|
goto exit_level_0;
|
|
}
|
|
t_t = (lapack_complex_float*)
|
|
LAPACKE_malloc( sizeof(lapack_complex_float) * ldt_t * MAX(1,k) );
|
|
if( t_t == NULL ) {
|
|
info = LAPACK_TRANSPOSE_MEMORY_ERROR;
|
|
goto exit_level_1;
|
|
}
|
|
c_t = (lapack_complex_float*)
|
|
LAPACKE_malloc( sizeof(lapack_complex_float) * ldc_t * MAX(1,n) );
|
|
if( c_t == NULL ) {
|
|
info = LAPACK_TRANSPOSE_MEMORY_ERROR;
|
|
goto exit_level_2;
|
|
}
|
|
/* Transpose input matrices */
|
|
LAPACKE_ctz_trans( matrix_layout, direct, uplo, 'u', nrows_v, ncols_v,
|
|
v, ldv, v_t, ldv_t );
|
|
LAPACKE_cge_trans( matrix_layout, k, k, t, ldt, t_t, ldt_t );
|
|
LAPACKE_cge_trans( matrix_layout, m, n, c, ldc, c_t, ldc_t );
|
|
/* Call LAPACK function and adjust info */
|
|
LAPACK_clarfb( &side, &trans, &direct, &storev, &m, &n, &k, v_t, &ldv_t,
|
|
t_t, &ldt_t, c_t, &ldc_t, work, &ldwork );
|
|
info = 0; /* LAPACK call is ok! */
|
|
/* Transpose output matrices */
|
|
LAPACKE_cge_trans( LAPACK_COL_MAJOR, m, n, c_t, ldc_t, c, ldc );
|
|
/* Release memory and exit */
|
|
LAPACKE_free( c_t );
|
|
exit_level_2:
|
|
LAPACKE_free( t_t );
|
|
exit_level_1:
|
|
LAPACKE_free( v_t );
|
|
exit_level_0:
|
|
if( info == LAPACK_TRANSPOSE_MEMORY_ERROR ) {
|
|
LAPACKE_xerbla( "LAPACKE_clarfb_work", info );
|
|
}
|
|
} else {
|
|
info = -1;
|
|
LAPACKE_xerbla( "LAPACKE_clarfb_work", info );
|
|
}
|
|
return info;
|
|
}
|