277 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			C
		
	
	
	
			
		
		
	
	
			277 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			C
		
	
	
	
| /*****************************************************************************
 | |
|   Copyright (c) 2011, Intel Corp.
 | |
|   All rights reserved.
 | |
| 
 | |
|   Redistribution and use in source and binary forms, with or without
 | |
|   modification, are permitted provided that the following conditions are met:
 | |
| 
 | |
|     * Redistributions of source code must retain the above copyright notice,
 | |
|       this list of conditions and the following disclaimer.
 | |
|     * Redistributions in binary form must reproduce the above copyright
 | |
|       notice, this list of conditions and the following disclaimer in the
 | |
|       documentation and/or other materials provided with the distribution.
 | |
|     * Neither the name of Intel Corporation nor the names of its contributors
 | |
|       may be used to endorse or promote products derived from this software
 | |
|       without specific prior written permission.
 | |
| 
 | |
|   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 | |
|   AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 | |
|   IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 | |
|   ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 | |
|   LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 | |
|   CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 | |
|   SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 | |
|   INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 | |
|   CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 | |
|   ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
 | |
|   THE POSSIBILITY OF SUCH DAMAGE.
 | |
| *****************************************************************************
 | |
| * Contents: Native middle-level C interface to LAPACK function cuncsd
 | |
| * Author: Intel Corporation
 | |
| * Generated November, 2011
 | |
| *****************************************************************************/
 | |
| 
 | |
| #include "lapacke_utils.h"
 | |
| 
 | |
| lapack_int LAPACKE_cuncsd_work( int matrix_order, char jobu1, char jobu2,
 | |
|                                 char jobv1t, char jobv2t, char trans,
 | |
|                                 char signs, lapack_int m, lapack_int p,
 | |
|                                 lapack_int q, lapack_complex_float* x11,
 | |
|                                 lapack_int ldx11, lapack_complex_float* x12,
 | |
|                                 lapack_int ldx12, lapack_complex_float* x21,
 | |
|                                 lapack_int ldx21, lapack_complex_float* x22,
 | |
|                                 lapack_int ldx22, float* theta,
 | |
|                                 lapack_complex_float* u1, lapack_int ldu1,
 | |
|                                 lapack_complex_float* u2, lapack_int ldu2,
 | |
|                                 lapack_complex_float* v1t, lapack_int ldv1t,
 | |
|                                 lapack_complex_float* v2t, lapack_int ldv2t,
 | |
|                                 lapack_complex_float* work, lapack_int lwork,
 | |
|                                 float* rwork, lapack_int lrwork,
 | |
|                                 lapack_int* iwork )
 | |
| {
 | |
|     lapack_int info = 0;
 | |
|     if( matrix_order == LAPACK_COL_MAJOR ) {
 | |
|         /* Call LAPACK function and adjust info */
 | |
|         LAPACK_cuncsd( &jobu1, &jobu2, &jobv1t, &jobv2t, &trans, &signs, &m, &p,
 | |
|                        &q, x11, &ldx11, x12, &ldx12, x21, &ldx21, x22, &ldx22,
 | |
|                        theta, u1, &ldu1, u2, &ldu2, v1t, &ldv1t, v2t, &ldv2t,
 | |
|                        work, &lwork, rwork, &lrwork, iwork, &info );
 | |
|         if( info < 0 ) {
 | |
|             info = info - 1;
 | |
|         }
 | |
|     } else if( matrix_order == LAPACK_ROW_MAJOR ) {
 | |
|         lapack_int nrows_x11 = ( LAPACKE_lsame( trans, 'n' ) ? p : q);
 | |
|         lapack_int nrows_x12 = ( LAPACKE_lsame( trans, 'n' ) ? p : m-q);
 | |
|         lapack_int nrows_x21 = ( LAPACKE_lsame( trans, 'n' ) ? m-p : q);
 | |
|         lapack_int nrows_x22 = ( LAPACKE_lsame( trans, 'n' ) ? m-p : m-q);
 | |
|         lapack_int nrows_u1 = ( LAPACKE_lsame( jobu1, 'y' ) ? p : 1);
 | |
|         lapack_int nrows_u2 = ( LAPACKE_lsame( jobu2, 'y' ) ? m-p : 1);
 | |
|         lapack_int nrows_v1t = ( LAPACKE_lsame( jobv1t, 'y' ) ? q : 1);
 | |
|         lapack_int nrows_v2t = ( LAPACKE_lsame( jobv2t, 'y' ) ? m-q : 1);
 | |
|         lapack_int ldu1_t = MAX(1,nrows_u1);
 | |
|         lapack_int ldu2_t = MAX(1,nrows_u2);
 | |
|         lapack_int ldv1t_t = MAX(1,nrows_v1t);
 | |
|         lapack_int ldv2t_t = MAX(1,nrows_v2t);
 | |
|         lapack_int ldx11_t = MAX(1,nrows_x11);
 | |
|         lapack_int ldx12_t = MAX(1,nrows_x12);
 | |
|         lapack_int ldx21_t = MAX(1,nrows_x21);
 | |
|         lapack_int ldx22_t = MAX(1,nrows_x22);
 | |
|         lapack_complex_float* x11_t = NULL;
 | |
|         lapack_complex_float* x12_t = NULL;
 | |
|         lapack_complex_float* x21_t = NULL;
 | |
|         lapack_complex_float* x22_t = NULL;
 | |
|         lapack_complex_float* u1_t = NULL;
 | |
|         lapack_complex_float* u2_t = NULL;
 | |
|         lapack_complex_float* v1t_t = NULL;
 | |
|         lapack_complex_float* v2t_t = NULL;
 | |
|         /* Check leading dimension(s) */
 | |
|         if( ldu1 < p ) {
 | |
|             info = -21;
 | |
|             LAPACKE_xerbla( "LAPACKE_cuncsd_work", info );
 | |
|             return info;
 | |
|         }
 | |
|         if( ldu2 < m-p ) {
 | |
|             info = -23;
 | |
|             LAPACKE_xerbla( "LAPACKE_cuncsd_work", info );
 | |
|             return info;
 | |
|         }
 | |
|         if( ldv1t < q ) {
 | |
|             info = -25;
 | |
|             LAPACKE_xerbla( "LAPACKE_cuncsd_work", info );
 | |
|             return info;
 | |
|         }
 | |
|         if( ldv2t < m-q ) {
 | |
|             info = -27;
 | |
|             LAPACKE_xerbla( "LAPACKE_cuncsd_work", info );
 | |
|             return info;
 | |
|         }
 | |
|         if( ldx11 < q ) {
 | |
|             info = -12;
 | |
|             LAPACKE_xerbla( "LAPACKE_cuncsd_work", info );
 | |
|             return info;
 | |
|         }
 | |
|         if( ldx12 < m-q ) {
 | |
|             info = -14;
 | |
|             LAPACKE_xerbla( "LAPACKE_cuncsd_work", info );
 | |
|             return info;
 | |
|         }
 | |
|         if( ldx21 < q ) {
 | |
|             info = -16;
 | |
|             LAPACKE_xerbla( "LAPACKE_cuncsd_work", info );
 | |
|             return info;
 | |
|         }
 | |
|         if( ldx22 < m-q ) {
 | |
|             info = -18;
 | |
|             LAPACKE_xerbla( "LAPACKE_cuncsd_work", info );
 | |
|             return info;
 | |
|         }
 | |
|         /* Query optimal working array(s) size if requested */
 | |
|         if( lrwork == -1 || lwork == -1 ) {
 | |
|             LAPACK_cuncsd( &jobu1, &jobu2, &jobv1t, &jobv2t, &trans, &signs, &m,
 | |
|                            &p, &q, x11, &ldx11_t, x12, &ldx12_t, x21, &ldx21_t,
 | |
|                            x22, &ldx22_t, theta, u1, &ldu1_t, u2, &ldu2_t, v1t,
 | |
|                            &ldv1t_t, v2t, &ldv2t_t, work, &lwork, rwork,
 | |
|                            &lrwork, iwork, &info );
 | |
|             return (info < 0) ? (info - 1) : info;
 | |
|         }
 | |
|         /* Allocate memory for temporary array(s) */
 | |
|         x11_t = (lapack_complex_float*)
 | |
|             LAPACKE_malloc( sizeof(lapack_complex_float) * ldx11_t * MAX(1,q) );
 | |
|         if( x11_t == NULL ) {
 | |
|             info = LAPACK_TRANSPOSE_MEMORY_ERROR;
 | |
|             goto exit_level_0;
 | |
|         }
 | |
|         x12_t = (lapack_complex_float*)
 | |
|             LAPACKE_malloc( sizeof(lapack_complex_float) *
 | |
|                             ldx12_t * MAX(1,m-q) );
 | |
|         if( x12_t == NULL ) {
 | |
|             info = LAPACK_TRANSPOSE_MEMORY_ERROR;
 | |
|             goto exit_level_1;
 | |
|         }
 | |
|         x21_t = (lapack_complex_float*)
 | |
|             LAPACKE_malloc( sizeof(lapack_complex_float) * ldx21_t * MAX(1,q) );
 | |
|         if( x21_t == NULL ) {
 | |
|             info = LAPACK_TRANSPOSE_MEMORY_ERROR;
 | |
|             goto exit_level_2;
 | |
|         }
 | |
|         x22_t = (lapack_complex_float*)
 | |
|             LAPACKE_malloc( sizeof(lapack_complex_float) *
 | |
|                             ldx22_t * MAX(1,m-q) );
 | |
|         if( x22_t == NULL ) {
 | |
|             info = LAPACK_TRANSPOSE_MEMORY_ERROR;
 | |
|             goto exit_level_3;
 | |
|         }
 | |
|         if( LAPACKE_lsame( jobu1, 'y' ) ) {
 | |
|             u1_t = (lapack_complex_float*)
 | |
|                 LAPACKE_malloc( sizeof(lapack_complex_float) *
 | |
|                                 ldu1_t * MAX(1,p) );
 | |
|             if( u1_t == NULL ) {
 | |
|                 info = LAPACK_TRANSPOSE_MEMORY_ERROR;
 | |
|                 goto exit_level_4;
 | |
|             }
 | |
|         }
 | |
|         if( LAPACKE_lsame( jobu2, 'y' ) ) {
 | |
|             u2_t = (lapack_complex_float*)
 | |
|                 LAPACKE_malloc( sizeof(lapack_complex_float) *
 | |
|                                 ldu2_t * MAX(1,m-p) );
 | |
|             if( u2_t == NULL ) {
 | |
|                 info = LAPACK_TRANSPOSE_MEMORY_ERROR;
 | |
|                 goto exit_level_5;
 | |
|             }
 | |
|         }
 | |
|         if( LAPACKE_lsame( jobv1t, 'y' ) ) {
 | |
|             v1t_t = (lapack_complex_float*)
 | |
|                 LAPACKE_malloc( sizeof(lapack_complex_float) *
 | |
|                                 ldv1t_t * MAX(1,q) );
 | |
|             if( v1t_t == NULL ) {
 | |
|                 info = LAPACK_TRANSPOSE_MEMORY_ERROR;
 | |
|                 goto exit_level_6;
 | |
|             }
 | |
|         }
 | |
|         if( LAPACKE_lsame( jobv2t, 'y' ) ) {
 | |
|             v2t_t = (lapack_complex_float*)
 | |
|                 LAPACKE_malloc( sizeof(lapack_complex_float) *
 | |
|                                 ldv2t_t * MAX(1,m-q) );
 | |
|             if( v2t_t == NULL ) {
 | |
|                 info = LAPACK_TRANSPOSE_MEMORY_ERROR;
 | |
|                 goto exit_level_7;
 | |
|             }
 | |
|         }
 | |
|         /* Transpose input matrices */
 | |
|         LAPACKE_cge_trans( matrix_order, nrows_x11, q, x11, ldx11, x11_t,
 | |
|                            ldx11_t );
 | |
|         LAPACKE_cge_trans( matrix_order, nrows_x12, m-q, x12, ldx12, x12_t,
 | |
|                            ldx12_t );
 | |
|         LAPACKE_cge_trans( matrix_order, nrows_x21, q, x21, ldx21, x21_t,
 | |
|                            ldx21_t );
 | |
|         LAPACKE_cge_trans( matrix_order, nrows_x22, m-q, x22, ldx22, x22_t,
 | |
|                            ldx22_t );
 | |
|         /* Call LAPACK function and adjust info */
 | |
|         LAPACK_cuncsd( &jobu1, &jobu2, &jobv1t, &jobv2t, &trans, &signs, &m, &p,
 | |
|                        &q, x11_t, &ldx11_t, x12_t, &ldx12_t, x21_t, &ldx21_t,
 | |
|                        x22_t, &ldx22_t, theta, u1_t, &ldu1_t, u2_t, &ldu2_t,
 | |
|                        v1t_t, &ldv1t_t, v2t_t, &ldv2t_t, work, &lwork, rwork,
 | |
|                        &lrwork, iwork, &info );
 | |
|         if( info < 0 ) {
 | |
|             info = info - 1;
 | |
|         }
 | |
|         /* Transpose output matrices */
 | |
|         LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_x11, q, x11_t, ldx11_t, x11,
 | |
|                            ldx11 );
 | |
|         LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_x12, m-q, x12_t, ldx12_t,
 | |
|                            x12, ldx12 );
 | |
|         LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_x21, q, x21_t, ldx21_t, x21,
 | |
|                            ldx21 );
 | |
|         LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_x22, m-q, x22_t, ldx22_t,
 | |
|                            x22, ldx22 );
 | |
|         if( LAPACKE_lsame( jobu1, 'y' ) ) {
 | |
|             LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_u1, p, u1_t, ldu1_t, u1,
 | |
|                                ldu1 );
 | |
|         }
 | |
|         if( LAPACKE_lsame( jobu2, 'y' ) ) {
 | |
|             LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_u2, m-p, u2_t, ldu2_t,
 | |
|                                u2, ldu2 );
 | |
|         }
 | |
|         if( LAPACKE_lsame( jobv1t, 'y' ) ) {
 | |
|             LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_v1t, q, v1t_t, ldv1t_t,
 | |
|                                v1t, ldv1t );
 | |
|         }
 | |
|         if( LAPACKE_lsame( jobv2t, 'y' ) ) {
 | |
|             LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_v2t, m-q, v2t_t, ldv2t_t,
 | |
|                                v2t, ldv2t );
 | |
|         }
 | |
|         /* Release memory and exit */
 | |
|         if( LAPACKE_lsame( jobv2t, 'y' ) ) {
 | |
|             LAPACKE_free( v2t_t );
 | |
|         }
 | |
| exit_level_7:
 | |
|         if( LAPACKE_lsame( jobv1t, 'y' ) ) {
 | |
|             LAPACKE_free( v1t_t );
 | |
|         }
 | |
| exit_level_6:
 | |
|         if( LAPACKE_lsame( jobu2, 'y' ) ) {
 | |
|             LAPACKE_free( u2_t );
 | |
|         }
 | |
| exit_level_5:
 | |
|         if( LAPACKE_lsame( jobu1, 'y' ) ) {
 | |
|             LAPACKE_free( u1_t );
 | |
|         }
 | |
| exit_level_4:
 | |
|         LAPACKE_free( x22_t );
 | |
| exit_level_3:
 | |
|         LAPACKE_free( x21_t );
 | |
| exit_level_2:
 | |
|         LAPACKE_free( x12_t );
 | |
| exit_level_1:
 | |
|         LAPACKE_free( x11_t );
 | |
| exit_level_0:
 | |
|         if( info == LAPACK_TRANSPOSE_MEMORY_ERROR ) {
 | |
|             LAPACKE_xerbla( "LAPACKE_cuncsd_work", info );
 | |
|         }
 | |
|     } else {
 | |
|         info = -1;
 | |
|         LAPACKE_xerbla( "LAPACKE_cuncsd_work", info );
 | |
|     }
 | |
|     return info;
 | |
| }
 |