3502 lines
		
	
	
		
			133 KiB
		
	
	
	
		
			Fortran
		
	
	
	
			
		
		
	
	
			3502 lines
		
	
	
		
			133 KiB
		
	
	
	
		
			Fortran
		
	
	
	
*> \brief <b> DGESVD computes the singular value decomposition (SVD) for GE matrices</b>
 | 
						|
*
 | 
						|
*  =========== DOCUMENTATION ===========
 | 
						|
*
 | 
						|
* Online html documentation available at
 | 
						|
*            http://www.netlib.org/lapack/explore-html/
 | 
						|
*
 | 
						|
*> \htmlonly
 | 
						|
*> Download DGESVD + dependencies
 | 
						|
*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/dgesvd.f">
 | 
						|
*> [TGZ]</a>
 | 
						|
*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/dgesvd.f">
 | 
						|
*> [ZIP]</a>
 | 
						|
*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/dgesvd.f">
 | 
						|
*> [TXT]</a>
 | 
						|
*> \endhtmlonly
 | 
						|
*
 | 
						|
*  Definition:
 | 
						|
*  ===========
 | 
						|
*
 | 
						|
*       SUBROUTINE DGESVD( JOBU, JOBVT, M, N, A, LDA, S, U, LDU, VT, LDVT,
 | 
						|
*                          WORK, LWORK, INFO )
 | 
						|
*
 | 
						|
*       .. Scalar Arguments ..
 | 
						|
*       CHARACTER          JOBU, JOBVT
 | 
						|
*       INTEGER            INFO, LDA, LDU, LDVT, LWORK, M, N
 | 
						|
*       ..
 | 
						|
*       .. Array Arguments ..
 | 
						|
*       DOUBLE PRECISION   A( LDA, * ), S( * ), U( LDU, * ),
 | 
						|
*      $                   VT( LDVT, * ), WORK( * )
 | 
						|
*       ..
 | 
						|
*
 | 
						|
*
 | 
						|
*> \par Purpose:
 | 
						|
*  =============
 | 
						|
*>
 | 
						|
*> \verbatim
 | 
						|
*>
 | 
						|
*> DGESVD computes the singular value decomposition (SVD) of a real
 | 
						|
*> M-by-N matrix A, optionally computing the left and/or right singular
 | 
						|
*> vectors. The SVD is written
 | 
						|
*>
 | 
						|
*>      A = U * SIGMA * transpose(V)
 | 
						|
*>
 | 
						|
*> where SIGMA is an M-by-N matrix which is zero except for its
 | 
						|
*> min(m,n) diagonal elements, U is an M-by-M orthogonal matrix, and
 | 
						|
*> V is an N-by-N orthogonal matrix.  The diagonal elements of SIGMA
 | 
						|
*> are the singular values of A; they are real and non-negative, and
 | 
						|
*> are returned in descending order.  The first min(m,n) columns of
 | 
						|
*> U and V are the left and right singular vectors of A.
 | 
						|
*>
 | 
						|
*> Note that the routine returns V**T, not V.
 | 
						|
*> \endverbatim
 | 
						|
*
 | 
						|
*  Arguments:
 | 
						|
*  ==========
 | 
						|
*
 | 
						|
*> \param[in] JOBU
 | 
						|
*> \verbatim
 | 
						|
*>          JOBU is CHARACTER*1
 | 
						|
*>          Specifies options for computing all or part of the matrix U:
 | 
						|
*>          = 'A':  all M columns of U are returned in array U:
 | 
						|
*>          = 'S':  the first min(m,n) columns of U (the left singular
 | 
						|
*>                  vectors) are returned in the array U;
 | 
						|
*>          = 'O':  the first min(m,n) columns of U (the left singular
 | 
						|
*>                  vectors) are overwritten on the array A;
 | 
						|
*>          = 'N':  no columns of U (no left singular vectors) are
 | 
						|
*>                  computed.
 | 
						|
*> \endverbatim
 | 
						|
*>
 | 
						|
*> \param[in] JOBVT
 | 
						|
*> \verbatim
 | 
						|
*>          JOBVT is CHARACTER*1
 | 
						|
*>          Specifies options for computing all or part of the matrix
 | 
						|
*>          V**T:
 | 
						|
*>          = 'A':  all N rows of V**T are returned in the array VT;
 | 
						|
*>          = 'S':  the first min(m,n) rows of V**T (the right singular
 | 
						|
*>                  vectors) are returned in the array VT;
 | 
						|
*>          = 'O':  the first min(m,n) rows of V**T (the right singular
 | 
						|
*>                  vectors) are overwritten on the array A;
 | 
						|
*>          = 'N':  no rows of V**T (no right singular vectors) are
 | 
						|
*>                  computed.
 | 
						|
*>
 | 
						|
*>          JOBVT and JOBU cannot both be 'O'.
 | 
						|
*> \endverbatim
 | 
						|
*>
 | 
						|
*> \param[in] M
 | 
						|
*> \verbatim
 | 
						|
*>          M is INTEGER
 | 
						|
*>          The number of rows of the input matrix A.  M >= 0.
 | 
						|
*> \endverbatim
 | 
						|
*>
 | 
						|
*> \param[in] N
 | 
						|
*> \verbatim
 | 
						|
*>          N is INTEGER
 | 
						|
*>          The number of columns of the input matrix A.  N >= 0.
 | 
						|
*> \endverbatim
 | 
						|
*>
 | 
						|
*> \param[in,out] A
 | 
						|
*> \verbatim
 | 
						|
*>          A is DOUBLE PRECISION array, dimension (LDA,N)
 | 
						|
*>          On entry, the M-by-N matrix A.
 | 
						|
*>          On exit,
 | 
						|
*>          if JOBU = 'O',  A is overwritten with the first min(m,n)
 | 
						|
*>                          columns of U (the left singular vectors,
 | 
						|
*>                          stored columnwise);
 | 
						|
*>          if JOBVT = 'O', A is overwritten with the first min(m,n)
 | 
						|
*>                          rows of V**T (the right singular vectors,
 | 
						|
*>                          stored rowwise);
 | 
						|
*>          if JOBU .ne. 'O' and JOBVT .ne. 'O', the contents of A
 | 
						|
*>                          are destroyed.
 | 
						|
*> \endverbatim
 | 
						|
*>
 | 
						|
*> \param[in] LDA
 | 
						|
*> \verbatim
 | 
						|
*>          LDA is INTEGER
 | 
						|
*>          The leading dimension of the array A.  LDA >= max(1,M).
 | 
						|
*> \endverbatim
 | 
						|
*>
 | 
						|
*> \param[out] S
 | 
						|
*> \verbatim
 | 
						|
*>          S is DOUBLE PRECISION array, dimension (min(M,N))
 | 
						|
*>          The singular values of A, sorted so that S(i) >= S(i+1).
 | 
						|
*> \endverbatim
 | 
						|
*>
 | 
						|
*> \param[out] U
 | 
						|
*> \verbatim
 | 
						|
*>          U is DOUBLE PRECISION array, dimension (LDU,UCOL)
 | 
						|
*>          (LDU,M) if JOBU = 'A' or (LDU,min(M,N)) if JOBU = 'S'.
 | 
						|
*>          If JOBU = 'A', U contains the M-by-M orthogonal matrix U;
 | 
						|
*>          if JOBU = 'S', U contains the first min(m,n) columns of U
 | 
						|
*>          (the left singular vectors, stored columnwise);
 | 
						|
*>          if JOBU = 'N' or 'O', U is not referenced.
 | 
						|
*> \endverbatim
 | 
						|
*>
 | 
						|
*> \param[in] LDU
 | 
						|
*> \verbatim
 | 
						|
*>          LDU is INTEGER
 | 
						|
*>          The leading dimension of the array U.  LDU >= 1; if
 | 
						|
*>          JOBU = 'S' or 'A', LDU >= M.
 | 
						|
*> \endverbatim
 | 
						|
*>
 | 
						|
*> \param[out] VT
 | 
						|
*> \verbatim
 | 
						|
*>          VT is DOUBLE PRECISION array, dimension (LDVT,N)
 | 
						|
*>          If JOBVT = 'A', VT contains the N-by-N orthogonal matrix
 | 
						|
*>          V**T;
 | 
						|
*>          if JOBVT = 'S', VT contains the first min(m,n) rows of
 | 
						|
*>          V**T (the right singular vectors, stored rowwise);
 | 
						|
*>          if JOBVT = 'N' or 'O', VT is not referenced.
 | 
						|
*> \endverbatim
 | 
						|
*>
 | 
						|
*> \param[in] LDVT
 | 
						|
*> \verbatim
 | 
						|
*>          LDVT is INTEGER
 | 
						|
*>          The leading dimension of the array VT.  LDVT >= 1; if
 | 
						|
*>          JOBVT = 'A', LDVT >= N; if JOBVT = 'S', LDVT >= min(M,N).
 | 
						|
*> \endverbatim
 | 
						|
*>
 | 
						|
*> \param[out] WORK
 | 
						|
*> \verbatim
 | 
						|
*>          WORK is DOUBLE PRECISION array, dimension (MAX(1,LWORK))
 | 
						|
*>          On exit, if INFO = 0, WORK(1) returns the optimal LWORK;
 | 
						|
*>          if INFO > 0, WORK(2:MIN(M,N)) contains the unconverged
 | 
						|
*>          superdiagonal elements of an upper bidiagonal matrix B
 | 
						|
*>          whose diagonal is in S (not necessarily sorted). B
 | 
						|
*>          satisfies A = U * B * VT, so it has the same singular values
 | 
						|
*>          as A, and singular vectors related by U and VT.
 | 
						|
*> \endverbatim
 | 
						|
*>
 | 
						|
*> \param[in] LWORK
 | 
						|
*> \verbatim
 | 
						|
*>          LWORK is INTEGER
 | 
						|
*>          The dimension of the array WORK.
 | 
						|
*>          LWORK >= MAX(1,5*MIN(M,N)) for the paths (see comments inside code):
 | 
						|
*>             - PATH 1  (M much larger than N, JOBU='N')
 | 
						|
*>             - PATH 1t (N much larger than M, JOBVT='N')
 | 
						|
*>          LWORK >= MAX(1,3*MIN(M,N) + MAX(M,N),5*MIN(M,N)) for the other paths
 | 
						|
*>          For good performance, LWORK should generally be larger.
 | 
						|
*>
 | 
						|
*>          If LWORK = -1, then a workspace query is assumed; the routine
 | 
						|
*>          only calculates the optimal size of the WORK array, returns
 | 
						|
*>          this value as the first entry of the WORK array, and no error
 | 
						|
*>          message related to LWORK is issued by XERBLA.
 | 
						|
*> \endverbatim
 | 
						|
*>
 | 
						|
*> \param[out] INFO
 | 
						|
*> \verbatim
 | 
						|
*>          INFO is INTEGER
 | 
						|
*>          = 0:  successful exit.
 | 
						|
*>          < 0:  if INFO = -i, the i-th argument had an illegal value.
 | 
						|
*>          > 0:  if DBDSQR did not converge, INFO specifies how many
 | 
						|
*>                superdiagonals of an intermediate bidiagonal form B
 | 
						|
*>                did not converge to zero. See the description of WORK
 | 
						|
*>                above for details.
 | 
						|
*> \endverbatim
 | 
						|
*
 | 
						|
*  Authors:
 | 
						|
*  ========
 | 
						|
*
 | 
						|
*> \author Univ. of Tennessee
 | 
						|
*> \author Univ. of California Berkeley
 | 
						|
*> \author Univ. of Colorado Denver
 | 
						|
*> \author NAG Ltd.
 | 
						|
*
 | 
						|
*> \ingroup doubleGEsing
 | 
						|
*
 | 
						|
*  =====================================================================
 | 
						|
      SUBROUTINE DGESVD( JOBU, JOBVT, M, N, A, LDA, S, U, LDU,
 | 
						|
     $                   VT, LDVT, WORK, LWORK, INFO )
 | 
						|
*
 | 
						|
*  -- LAPACK driver routine --
 | 
						|
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
 | 
						|
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
 | 
						|
*
 | 
						|
*     .. Scalar Arguments ..
 | 
						|
      CHARACTER          JOBU, JOBVT
 | 
						|
      INTEGER            INFO, LDA, LDU, LDVT, LWORK, M, N
 | 
						|
*     ..
 | 
						|
*     .. Array Arguments ..
 | 
						|
      DOUBLE PRECISION   A( LDA, * ), S( * ), U( LDU, * ),
 | 
						|
     $                   VT( LDVT, * ), WORK( * )
 | 
						|
*     ..
 | 
						|
*
 | 
						|
*  =====================================================================
 | 
						|
*
 | 
						|
*     .. Parameters ..
 | 
						|
      DOUBLE PRECISION   ZERO, ONE
 | 
						|
      PARAMETER          ( ZERO = 0.0D0, ONE = 1.0D0 )
 | 
						|
*     ..
 | 
						|
*     .. Local Scalars ..
 | 
						|
      LOGICAL            LQUERY, WNTUA, WNTUAS, WNTUN, WNTUO, WNTUS,
 | 
						|
     $                   WNTVA, WNTVAS, WNTVN, WNTVO, WNTVS
 | 
						|
      INTEGER            BDSPAC, BLK, CHUNK, I, IE, IERR, IR, ISCL,
 | 
						|
     $                   ITAU, ITAUP, ITAUQ, IU, IWORK, LDWRKR, LDWRKU,
 | 
						|
     $                   MAXWRK, MINMN, MINWRK, MNTHR, NCU, NCVT, NRU,
 | 
						|
     $                   NRVT, WRKBL
 | 
						|
      INTEGER            LWORK_DGEQRF, LWORK_DORGQR_N, LWORK_DORGQR_M,
 | 
						|
     $                   LWORK_DGEBRD, LWORK_DORGBR_P, LWORK_DORGBR_Q,
 | 
						|
     $                   LWORK_DGELQF, LWORK_DORGLQ_N, LWORK_DORGLQ_M
 | 
						|
      DOUBLE PRECISION   ANRM, BIGNUM, EPS, SMLNUM
 | 
						|
*     ..
 | 
						|
*     .. Local Arrays ..
 | 
						|
      DOUBLE PRECISION   DUM( 1 )
 | 
						|
*     ..
 | 
						|
*     .. External Subroutines ..
 | 
						|
      EXTERNAL           DBDSQR, DGEBRD, DGELQF, DGEMM, DGEQRF, DLACPY,
 | 
						|
     $                   DLASCL, DLASET, DORGBR, DORGLQ, DORGQR, DORMBR,
 | 
						|
     $                   XERBLA
 | 
						|
*     ..
 | 
						|
*     .. External Functions ..
 | 
						|
      LOGICAL            LSAME
 | 
						|
      INTEGER            ILAENV
 | 
						|
      DOUBLE PRECISION   DLAMCH, DLANGE
 | 
						|
      EXTERNAL           LSAME, ILAENV, DLAMCH, DLANGE
 | 
						|
*     ..
 | 
						|
*     .. Intrinsic Functions ..
 | 
						|
      INTRINSIC          MAX, MIN, SQRT
 | 
						|
*     ..
 | 
						|
*     .. Executable Statements ..
 | 
						|
*
 | 
						|
*     Test the input arguments
 | 
						|
*
 | 
						|
      INFO = 0
 | 
						|
      MINMN = MIN( M, N )
 | 
						|
      WNTUA = LSAME( JOBU, 'A' )
 | 
						|
      WNTUS = LSAME( JOBU, 'S' )
 | 
						|
      WNTUAS = WNTUA .OR. WNTUS
 | 
						|
      WNTUO = LSAME( JOBU, 'O' )
 | 
						|
      WNTUN = LSAME( JOBU, 'N' )
 | 
						|
      WNTVA = LSAME( JOBVT, 'A' )
 | 
						|
      WNTVS = LSAME( JOBVT, 'S' )
 | 
						|
      WNTVAS = WNTVA .OR. WNTVS
 | 
						|
      WNTVO = LSAME( JOBVT, 'O' )
 | 
						|
      WNTVN = LSAME( JOBVT, 'N' )
 | 
						|
      LQUERY = ( LWORK.EQ.-1 )
 | 
						|
*
 | 
						|
      IF( .NOT.( WNTUA .OR. WNTUS .OR. WNTUO .OR. WNTUN ) ) THEN
 | 
						|
         INFO = -1
 | 
						|
      ELSE IF( .NOT.( WNTVA .OR. WNTVS .OR. WNTVO .OR. WNTVN ) .OR.
 | 
						|
     $         ( WNTVO .AND. WNTUO ) ) THEN
 | 
						|
         INFO = -2
 | 
						|
      ELSE IF( M.LT.0 ) THEN
 | 
						|
         INFO = -3
 | 
						|
      ELSE IF( N.LT.0 ) THEN
 | 
						|
         INFO = -4
 | 
						|
      ELSE IF( LDA.LT.MAX( 1, M ) ) THEN
 | 
						|
         INFO = -6
 | 
						|
      ELSE IF( LDU.LT.1 .OR. ( WNTUAS .AND. LDU.LT.M ) ) THEN
 | 
						|
         INFO = -9
 | 
						|
      ELSE IF( LDVT.LT.1 .OR. ( WNTVA .AND. LDVT.LT.N ) .OR.
 | 
						|
     $         ( WNTVS .AND. LDVT.LT.MINMN ) ) THEN
 | 
						|
         INFO = -11
 | 
						|
      END IF
 | 
						|
*
 | 
						|
*     Compute workspace
 | 
						|
*      (Note: Comments in the code beginning "Workspace:" describe the
 | 
						|
*       minimal amount of workspace needed at that point in the code,
 | 
						|
*       as well as the preferred amount for good performance.
 | 
						|
*       NB refers to the optimal block size for the immediately
 | 
						|
*       following subroutine, as returned by ILAENV.)
 | 
						|
*
 | 
						|
      IF( INFO.EQ.0 ) THEN
 | 
						|
         MINWRK = 1
 | 
						|
         MAXWRK = 1
 | 
						|
         IF( M.GE.N .AND. MINMN.GT.0 ) THEN
 | 
						|
*
 | 
						|
*           Compute space needed for DBDSQR
 | 
						|
*
 | 
						|
            MNTHR = ILAENV( 6, 'DGESVD', JOBU // JOBVT, M, N, 0, 0 )
 | 
						|
            BDSPAC = 5*N
 | 
						|
*           Compute space needed for DGEQRF
 | 
						|
            CALL DGEQRF( M, N, A, LDA, DUM(1), DUM(1), -1, IERR )
 | 
						|
            LWORK_DGEQRF = INT( DUM(1) )
 | 
						|
*           Compute space needed for DORGQR
 | 
						|
            CALL DORGQR( M, N, N, A, LDA, DUM(1), DUM(1), -1, IERR )
 | 
						|
            LWORK_DORGQR_N = INT( DUM(1) )
 | 
						|
            CALL DORGQR( M, M, N, A, LDA, DUM(1), DUM(1), -1, IERR )
 | 
						|
            LWORK_DORGQR_M = INT( DUM(1) )
 | 
						|
*           Compute space needed for DGEBRD
 | 
						|
            CALL DGEBRD( N, N, A, LDA, S, DUM(1), DUM(1),
 | 
						|
     $                   DUM(1), DUM(1), -1, IERR )
 | 
						|
            LWORK_DGEBRD = INT( DUM(1) )
 | 
						|
*           Compute space needed for DORGBR P
 | 
						|
            CALL DORGBR( 'P', N, N, N, A, LDA, DUM(1),
 | 
						|
     $                   DUM(1), -1, IERR )
 | 
						|
            LWORK_DORGBR_P = INT( DUM(1) )
 | 
						|
*           Compute space needed for DORGBR Q
 | 
						|
            CALL DORGBR( 'Q', N, N, N, A, LDA, DUM(1),
 | 
						|
     $                   DUM(1), -1, IERR )
 | 
						|
            LWORK_DORGBR_Q = INT( DUM(1) )
 | 
						|
*
 | 
						|
            IF( M.GE.MNTHR ) THEN
 | 
						|
               IF( WNTUN ) THEN
 | 
						|
*
 | 
						|
*                 Path 1 (M much larger than N, JOBU='N')
 | 
						|
*
 | 
						|
                  MAXWRK = N + LWORK_DGEQRF
 | 
						|
                  MAXWRK = MAX( MAXWRK, 3*N + LWORK_DGEBRD )
 | 
						|
                  IF( WNTVO .OR. WNTVAS )
 | 
						|
     $               MAXWRK = MAX( MAXWRK, 3*N + LWORK_DORGBR_P )
 | 
						|
                  MAXWRK = MAX( MAXWRK, BDSPAC )
 | 
						|
                  MINWRK = MAX( 4*N, BDSPAC )
 | 
						|
               ELSE IF( WNTUO .AND. WNTVN ) THEN
 | 
						|
*
 | 
						|
*                 Path 2 (M much larger than N, JOBU='O', JOBVT='N')
 | 
						|
*
 | 
						|
                  WRKBL = N + LWORK_DGEQRF
 | 
						|
                  WRKBL = MAX( WRKBL, N + LWORK_DORGQR_N )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DORGBR_Q )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = MAX( N*N + WRKBL, N*N + M*N + N )
 | 
						|
                  MINWRK = MAX( 3*N + M, BDSPAC )
 | 
						|
               ELSE IF( WNTUO .AND. WNTVAS ) THEN
 | 
						|
*
 | 
						|
*                 Path 3 (M much larger than N, JOBU='O', JOBVT='S' or
 | 
						|
*                 'A')
 | 
						|
*
 | 
						|
                  WRKBL = N + LWORK_DGEQRF
 | 
						|
                  WRKBL = MAX( WRKBL, N + LWORK_DORGQR_N )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DORGBR_Q )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DORGBR_P )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = MAX( N*N + WRKBL, N*N + M*N + N )
 | 
						|
                  MINWRK = MAX( 3*N + M, BDSPAC )
 | 
						|
               ELSE IF( WNTUS .AND. WNTVN ) THEN
 | 
						|
*
 | 
						|
*                 Path 4 (M much larger than N, JOBU='S', JOBVT='N')
 | 
						|
*
 | 
						|
                  WRKBL = N + LWORK_DGEQRF
 | 
						|
                  WRKBL = MAX( WRKBL, N + LWORK_DORGQR_N )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DORGBR_Q )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = N*N + WRKBL
 | 
						|
                  MINWRK = MAX( 3*N + M, BDSPAC )
 | 
						|
               ELSE IF( WNTUS .AND. WNTVO ) THEN
 | 
						|
*
 | 
						|
*                 Path 5 (M much larger than N, JOBU='S', JOBVT='O')
 | 
						|
*
 | 
						|
                  WRKBL = N + LWORK_DGEQRF
 | 
						|
                  WRKBL = MAX( WRKBL, N + LWORK_DORGQR_N )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DORGBR_Q )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DORGBR_P )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = 2*N*N + WRKBL
 | 
						|
                  MINWRK = MAX( 3*N + M, BDSPAC )
 | 
						|
               ELSE IF( WNTUS .AND. WNTVAS ) THEN
 | 
						|
*
 | 
						|
*                 Path 6 (M much larger than N, JOBU='S', JOBVT='S' or
 | 
						|
*                 'A')
 | 
						|
*
 | 
						|
                  WRKBL = N + LWORK_DGEQRF
 | 
						|
                  WRKBL = MAX( WRKBL, N + LWORK_DORGQR_N )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DORGBR_Q )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DORGBR_P )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = N*N + WRKBL
 | 
						|
                  MINWRK = MAX( 3*N + M, BDSPAC )
 | 
						|
               ELSE IF( WNTUA .AND. WNTVN ) THEN
 | 
						|
*
 | 
						|
*                 Path 7 (M much larger than N, JOBU='A', JOBVT='N')
 | 
						|
*
 | 
						|
                  WRKBL = N + LWORK_DGEQRF
 | 
						|
                  WRKBL = MAX( WRKBL, N + LWORK_DORGQR_M )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DORGBR_Q )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = N*N + WRKBL
 | 
						|
                  MINWRK = MAX( 3*N + M, BDSPAC )
 | 
						|
               ELSE IF( WNTUA .AND. WNTVO ) THEN
 | 
						|
*
 | 
						|
*                 Path 8 (M much larger than N, JOBU='A', JOBVT='O')
 | 
						|
*
 | 
						|
                  WRKBL = N + LWORK_DGEQRF
 | 
						|
                  WRKBL = MAX( WRKBL, N + LWORK_DORGQR_M )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DORGBR_Q )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DORGBR_P )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = 2*N*N + WRKBL
 | 
						|
                  MINWRK = MAX( 3*N + M, BDSPAC )
 | 
						|
               ELSE IF( WNTUA .AND. WNTVAS ) THEN
 | 
						|
*
 | 
						|
*                 Path 9 (M much larger than N, JOBU='A', JOBVT='S' or
 | 
						|
*                 'A')
 | 
						|
*
 | 
						|
                  WRKBL = N + LWORK_DGEQRF
 | 
						|
                  WRKBL = MAX( WRKBL, N + LWORK_DORGQR_M )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DORGBR_Q )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*N + LWORK_DORGBR_P )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = N*N + WRKBL
 | 
						|
                  MINWRK = MAX( 3*N + M, BDSPAC )
 | 
						|
               END IF
 | 
						|
            ELSE
 | 
						|
*
 | 
						|
*              Path 10 (M at least N, but not much larger)
 | 
						|
*
 | 
						|
               CALL DGEBRD( M, N, A, LDA, S, DUM(1), DUM(1),
 | 
						|
     $                   DUM(1), DUM(1), -1, IERR )
 | 
						|
               LWORK_DGEBRD = INT( DUM(1) )
 | 
						|
               MAXWRK = 3*N + LWORK_DGEBRD
 | 
						|
               IF( WNTUS .OR. WNTUO ) THEN
 | 
						|
                  CALL DORGBR( 'Q', M, N, N, A, LDA, DUM(1),
 | 
						|
     $                   DUM(1), -1, IERR )
 | 
						|
                  LWORK_DORGBR_Q = INT( DUM(1) )
 | 
						|
                  MAXWRK = MAX( MAXWRK, 3*N + LWORK_DORGBR_Q )
 | 
						|
               END IF
 | 
						|
               IF( WNTUA ) THEN
 | 
						|
                  CALL DORGBR( 'Q', M, M, N, A, LDA, DUM(1),
 | 
						|
     $                   DUM(1), -1, IERR )
 | 
						|
                  LWORK_DORGBR_Q = INT( DUM(1) )
 | 
						|
                  MAXWRK = MAX( MAXWRK, 3*N + LWORK_DORGBR_Q )
 | 
						|
               END IF
 | 
						|
               IF( .NOT.WNTVN ) THEN
 | 
						|
                 MAXWRK = MAX( MAXWRK, 3*N + LWORK_DORGBR_P )
 | 
						|
               END IF
 | 
						|
               MAXWRK = MAX( MAXWRK, BDSPAC )
 | 
						|
               MINWRK = MAX( 3*N + M, BDSPAC )
 | 
						|
            END IF
 | 
						|
         ELSE IF( MINMN.GT.0 ) THEN
 | 
						|
*
 | 
						|
*           Compute space needed for DBDSQR
 | 
						|
*
 | 
						|
            MNTHR = ILAENV( 6, 'DGESVD', JOBU // JOBVT, M, N, 0, 0 )
 | 
						|
            BDSPAC = 5*M
 | 
						|
*           Compute space needed for DGELQF
 | 
						|
            CALL DGELQF( M, N, A, LDA, DUM(1), DUM(1), -1, IERR )
 | 
						|
            LWORK_DGELQF = INT( DUM(1) )
 | 
						|
*           Compute space needed for DORGLQ
 | 
						|
            CALL DORGLQ( N, N, M, DUM(1), N, DUM(1), DUM(1), -1, IERR )
 | 
						|
            LWORK_DORGLQ_N = INT( DUM(1) )
 | 
						|
            CALL DORGLQ( M, N, M, A, LDA, DUM(1), DUM(1), -1, IERR )
 | 
						|
            LWORK_DORGLQ_M = INT( DUM(1) )
 | 
						|
*           Compute space needed for DGEBRD
 | 
						|
            CALL DGEBRD( M, M, A, LDA, S, DUM(1), DUM(1),
 | 
						|
     $                   DUM(1), DUM(1), -1, IERR )
 | 
						|
            LWORK_DGEBRD = INT( DUM(1) )
 | 
						|
*            Compute space needed for DORGBR P
 | 
						|
            CALL DORGBR( 'P', M, M, M, A, N, DUM(1),
 | 
						|
     $                   DUM(1), -1, IERR )
 | 
						|
            LWORK_DORGBR_P = INT( DUM(1) )
 | 
						|
*           Compute space needed for DORGBR Q
 | 
						|
            CALL DORGBR( 'Q', M, M, M, A, N, DUM(1),
 | 
						|
     $                   DUM(1), -1, IERR )
 | 
						|
            LWORK_DORGBR_Q = INT( DUM(1) )
 | 
						|
            IF( N.GE.MNTHR ) THEN
 | 
						|
               IF( WNTVN ) THEN
 | 
						|
*
 | 
						|
*                 Path 1t(N much larger than M, JOBVT='N')
 | 
						|
*
 | 
						|
                  MAXWRK = M + LWORK_DGELQF
 | 
						|
                  MAXWRK = MAX( MAXWRK, 3*M + LWORK_DGEBRD )
 | 
						|
                  IF( WNTUO .OR. WNTUAS )
 | 
						|
     $               MAXWRK = MAX( MAXWRK, 3*M + LWORK_DORGBR_Q )
 | 
						|
                  MAXWRK = MAX( MAXWRK, BDSPAC )
 | 
						|
                  MINWRK = MAX( 4*M, BDSPAC )
 | 
						|
               ELSE IF( WNTVO .AND. WNTUN ) THEN
 | 
						|
*
 | 
						|
*                 Path 2t(N much larger than M, JOBU='N', JOBVT='O')
 | 
						|
*
 | 
						|
                  WRKBL = M + LWORK_DGELQF
 | 
						|
                  WRKBL = MAX( WRKBL, M + LWORK_DORGLQ_M )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DORGBR_P )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = MAX( M*M + WRKBL, M*M + M*N + M )
 | 
						|
                  MINWRK = MAX( 3*M + N, BDSPAC )
 | 
						|
               ELSE IF( WNTVO .AND. WNTUAS ) THEN
 | 
						|
*
 | 
						|
*                 Path 3t(N much larger than M, JOBU='S' or 'A',
 | 
						|
*                 JOBVT='O')
 | 
						|
*
 | 
						|
                  WRKBL = M + LWORK_DGELQF
 | 
						|
                  WRKBL = MAX( WRKBL, M + LWORK_DORGLQ_M )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DORGBR_P )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DORGBR_Q )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = MAX( M*M + WRKBL, M*M + M*N + M )
 | 
						|
                  MINWRK = MAX( 3*M + N, BDSPAC )
 | 
						|
               ELSE IF( WNTVS .AND. WNTUN ) THEN
 | 
						|
*
 | 
						|
*                 Path 4t(N much larger than M, JOBU='N', JOBVT='S')
 | 
						|
*
 | 
						|
                  WRKBL = M + LWORK_DGELQF
 | 
						|
                  WRKBL = MAX( WRKBL, M + LWORK_DORGLQ_M )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DORGBR_P )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = M*M + WRKBL
 | 
						|
                  MINWRK = MAX( 3*M + N, BDSPAC )
 | 
						|
               ELSE IF( WNTVS .AND. WNTUO ) THEN
 | 
						|
*
 | 
						|
*                 Path 5t(N much larger than M, JOBU='O', JOBVT='S')
 | 
						|
*
 | 
						|
                  WRKBL = M + LWORK_DGELQF
 | 
						|
                  WRKBL = MAX( WRKBL, M + LWORK_DORGLQ_M )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DORGBR_P )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DORGBR_Q )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = 2*M*M + WRKBL
 | 
						|
                  MINWRK = MAX( 3*M + N, BDSPAC )
 | 
						|
               ELSE IF( WNTVS .AND. WNTUAS ) THEN
 | 
						|
*
 | 
						|
*                 Path 6t(N much larger than M, JOBU='S' or 'A',
 | 
						|
*                 JOBVT='S')
 | 
						|
*
 | 
						|
                  WRKBL = M + LWORK_DGELQF
 | 
						|
                  WRKBL = MAX( WRKBL, M + LWORK_DORGLQ_M )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DORGBR_P )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DORGBR_Q )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = M*M + WRKBL
 | 
						|
                  MINWRK = MAX( 3*M + N, BDSPAC )
 | 
						|
               ELSE IF( WNTVA .AND. WNTUN ) THEN
 | 
						|
*
 | 
						|
*                 Path 7t(N much larger than M, JOBU='N', JOBVT='A')
 | 
						|
*
 | 
						|
                  WRKBL = M + LWORK_DGELQF
 | 
						|
                  WRKBL = MAX( WRKBL, M + LWORK_DORGLQ_N )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DORGBR_P )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = M*M + WRKBL
 | 
						|
                  MINWRK = MAX( 3*M + N, BDSPAC )
 | 
						|
               ELSE IF( WNTVA .AND. WNTUO ) THEN
 | 
						|
*
 | 
						|
*                 Path 8t(N much larger than M, JOBU='O', JOBVT='A')
 | 
						|
*
 | 
						|
                  WRKBL = M + LWORK_DGELQF
 | 
						|
                  WRKBL = MAX( WRKBL, M + LWORK_DORGLQ_N )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DORGBR_P )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DORGBR_Q )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = 2*M*M + WRKBL
 | 
						|
                  MINWRK = MAX( 3*M + N, BDSPAC )
 | 
						|
               ELSE IF( WNTVA .AND. WNTUAS ) THEN
 | 
						|
*
 | 
						|
*                 Path 9t(N much larger than M, JOBU='S' or 'A',
 | 
						|
*                 JOBVT='A')
 | 
						|
*
 | 
						|
                  WRKBL = M + LWORK_DGELQF
 | 
						|
                  WRKBL = MAX( WRKBL, M + LWORK_DORGLQ_N )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DGEBRD )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DORGBR_P )
 | 
						|
                  WRKBL = MAX( WRKBL, 3*M + LWORK_DORGBR_Q )
 | 
						|
                  WRKBL = MAX( WRKBL, BDSPAC )
 | 
						|
                  MAXWRK = M*M + WRKBL
 | 
						|
                  MINWRK = MAX( 3*M + N, BDSPAC )
 | 
						|
               END IF
 | 
						|
            ELSE
 | 
						|
*
 | 
						|
*              Path 10t(N greater than M, but not much larger)
 | 
						|
*
 | 
						|
               CALL DGEBRD( M, N, A, LDA, S, DUM(1), DUM(1),
 | 
						|
     $                   DUM(1), DUM(1), -1, IERR )
 | 
						|
               LWORK_DGEBRD = INT( DUM(1) )
 | 
						|
               MAXWRK = 3*M + LWORK_DGEBRD
 | 
						|
               IF( WNTVS .OR. WNTVO ) THEN
 | 
						|
*                Compute space needed for DORGBR P
 | 
						|
                 CALL DORGBR( 'P', M, N, M, A, N, DUM(1),
 | 
						|
     $                   DUM(1), -1, IERR )
 | 
						|
                 LWORK_DORGBR_P = INT( DUM(1) )
 | 
						|
                 MAXWRK = MAX( MAXWRK, 3*M + LWORK_DORGBR_P )
 | 
						|
               END IF
 | 
						|
               IF( WNTVA ) THEN
 | 
						|
                 CALL DORGBR( 'P', N, N, M, A, N, DUM(1),
 | 
						|
     $                   DUM(1), -1, IERR )
 | 
						|
                 LWORK_DORGBR_P = INT( DUM(1) )
 | 
						|
                 MAXWRK = MAX( MAXWRK, 3*M + LWORK_DORGBR_P )
 | 
						|
               END IF
 | 
						|
               IF( .NOT.WNTUN ) THEN
 | 
						|
                  MAXWRK = MAX( MAXWRK, 3*M + LWORK_DORGBR_Q )
 | 
						|
               END IF
 | 
						|
               MAXWRK = MAX( MAXWRK, BDSPAC )
 | 
						|
               MINWRK = MAX( 3*M + N, BDSPAC )
 | 
						|
            END IF
 | 
						|
         END IF
 | 
						|
         MAXWRK = MAX( MAXWRK, MINWRK )
 | 
						|
         WORK( 1 ) = MAXWRK
 | 
						|
*
 | 
						|
         IF( LWORK.LT.MINWRK .AND. .NOT.LQUERY ) THEN
 | 
						|
            INFO = -13
 | 
						|
         END IF
 | 
						|
      END IF
 | 
						|
*
 | 
						|
      IF( INFO.NE.0 ) THEN
 | 
						|
         CALL XERBLA( 'DGESVD', -INFO )
 | 
						|
         RETURN
 | 
						|
      ELSE IF( LQUERY ) THEN
 | 
						|
         RETURN
 | 
						|
      END IF
 | 
						|
*
 | 
						|
*     Quick return if possible
 | 
						|
*
 | 
						|
      IF( M.EQ.0 .OR. N.EQ.0 ) THEN
 | 
						|
         RETURN
 | 
						|
      END IF
 | 
						|
*
 | 
						|
*     Get machine constants
 | 
						|
*
 | 
						|
      EPS = DLAMCH( 'P' )
 | 
						|
      SMLNUM = SQRT( DLAMCH( 'S' ) ) / EPS
 | 
						|
      BIGNUM = ONE / SMLNUM
 | 
						|
*
 | 
						|
*     Scale A if max element outside range [SMLNUM,BIGNUM]
 | 
						|
*
 | 
						|
      ANRM = DLANGE( 'M', M, N, A, LDA, DUM )
 | 
						|
      ISCL = 0
 | 
						|
      IF( ANRM.GT.ZERO .AND. ANRM.LT.SMLNUM ) THEN
 | 
						|
         ISCL = 1
 | 
						|
         CALL DLASCL( 'G', 0, 0, ANRM, SMLNUM, M, N, A, LDA, IERR )
 | 
						|
      ELSE IF( ANRM.GT.BIGNUM ) THEN
 | 
						|
         ISCL = 1
 | 
						|
         CALL DLASCL( 'G', 0, 0, ANRM, BIGNUM, M, N, A, LDA, IERR )
 | 
						|
      END IF
 | 
						|
*
 | 
						|
      IF( M.GE.N ) THEN
 | 
						|
*
 | 
						|
*        A has at least as many rows as columns. If A has sufficiently
 | 
						|
*        more rows than columns, first reduce using the QR
 | 
						|
*        decomposition (if sufficient workspace available)
 | 
						|
*
 | 
						|
         IF( M.GE.MNTHR ) THEN
 | 
						|
*
 | 
						|
            IF( WNTUN ) THEN
 | 
						|
*
 | 
						|
*              Path 1 (M much larger than N, JOBU='N')
 | 
						|
*              No left singular vectors to be computed
 | 
						|
*
 | 
						|
               ITAU = 1
 | 
						|
               IWORK = ITAU + N
 | 
						|
*
 | 
						|
*              Compute A=Q*R
 | 
						|
*              (Workspace: need 2*N, prefer N + N*NB)
 | 
						|
*
 | 
						|
               CALL DGEQRF( M, N, A, LDA, WORK( ITAU ), WORK( IWORK ),
 | 
						|
     $                      LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*              Zero out below R
 | 
						|
*
 | 
						|
               IF( N .GT. 1 ) THEN
 | 
						|
                  CALL DLASET( 'L', N-1, N-1, ZERO, ZERO, A( 2, 1 ),
 | 
						|
     $                         LDA )
 | 
						|
               END IF
 | 
						|
               IE = 1
 | 
						|
               ITAUQ = IE + N
 | 
						|
               ITAUP = ITAUQ + N
 | 
						|
               IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*              Bidiagonalize R in A
 | 
						|
*              (Workspace: need 4*N, prefer 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
               CALL DGEBRD( N, N, A, LDA, S, WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                      WORK( ITAUP ), WORK( IWORK ), LWORK-IWORK+1,
 | 
						|
     $                      IERR )
 | 
						|
               NCVT = 0
 | 
						|
               IF( WNTVO .OR. WNTVAS ) THEN
 | 
						|
*
 | 
						|
*                 If right singular vectors desired, generate P'.
 | 
						|
*                 (Workspace: need 4*N-1, prefer 3*N + (N-1)*NB)
 | 
						|
*
 | 
						|
                  CALL DORGBR( 'P', N, N, N, A, LDA, WORK( ITAUP ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  NCVT = N
 | 
						|
               END IF
 | 
						|
               IWORK = IE + N
 | 
						|
*
 | 
						|
*              Perform bidiagonal QR iteration, computing right
 | 
						|
*              singular vectors of A in A if desired
 | 
						|
*              (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
               CALL DBDSQR( 'U', N, NCVT, 0, 0, S, WORK( IE ), A, LDA,
 | 
						|
     $                      DUM, 1, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*              If right singular vectors desired in VT, copy them there
 | 
						|
*
 | 
						|
               IF( WNTVAS )
 | 
						|
     $            CALL DLACPY( 'F', N, N, A, LDA, VT, LDVT )
 | 
						|
*
 | 
						|
            ELSE IF( WNTUO .AND. WNTVN ) THEN
 | 
						|
*
 | 
						|
*              Path 2 (M much larger than N, JOBU='O', JOBVT='N')
 | 
						|
*              N left singular vectors to be overwritten on A and
 | 
						|
*              no right singular vectors to be computed
 | 
						|
*
 | 
						|
               IF( LWORK.GE.N*N+MAX( 4*N, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                 Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                  IR = 1
 | 
						|
                  IF( LWORK.GE.MAX( WRKBL, LDA*N + N ) + LDA*N ) THEN
 | 
						|
*
 | 
						|
*                    WORK(IU) is LDA by N, WORK(IR) is LDA by N
 | 
						|
*
 | 
						|
                     LDWRKU = LDA
 | 
						|
                     LDWRKR = LDA
 | 
						|
                  ELSE IF( LWORK.GE.MAX( WRKBL, LDA*N + N ) + N*N ) THEN
 | 
						|
*
 | 
						|
*                    WORK(IU) is LDA by N, WORK(IR) is N by N
 | 
						|
*
 | 
						|
                     LDWRKU = LDA
 | 
						|
                     LDWRKR = N
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    WORK(IU) is LDWRKU by N, WORK(IR) is N by N
 | 
						|
*
 | 
						|
                     LDWRKU = ( LWORK-N*N-N ) / N
 | 
						|
                     LDWRKR = N
 | 
						|
                  END IF
 | 
						|
                  ITAU = IR + LDWRKR*N
 | 
						|
                  IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                 Compute A=Q*R
 | 
						|
*                 (Workspace: need N*N + 2*N, prefer N*N + N + N*NB)
 | 
						|
*
 | 
						|
                  CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Copy R to WORK(IR) and zero out below it
 | 
						|
*
 | 
						|
                  CALL DLACPY( 'U', N, N, A, LDA, WORK( IR ), LDWRKR )
 | 
						|
                  CALL DLASET( 'L', N-1, N-1, ZERO, ZERO, WORK( IR+1 ),
 | 
						|
     $                         LDWRKR )
 | 
						|
*
 | 
						|
*                 Generate Q in A
 | 
						|
*                 (Workspace: need N*N + 2*N, prefer N*N + N + N*NB)
 | 
						|
*
 | 
						|
                  CALL DORGQR( M, N, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  IE = ITAU
 | 
						|
                  ITAUQ = IE + N
 | 
						|
                  ITAUP = ITAUQ + N
 | 
						|
                  IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                 Bidiagonalize R in WORK(IR)
 | 
						|
*                 (Workspace: need N*N + 4*N, prefer N*N + 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
                  CALL DGEBRD( N, N, WORK( IR ), LDWRKR, S, WORK( IE ),
 | 
						|
     $                         WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Generate left vectors bidiagonalizing R
 | 
						|
*                 (Workspace: need N*N + 4*N, prefer N*N + 3*N + N*NB)
 | 
						|
*
 | 
						|
                  CALL DORGBR( 'Q', N, N, N, WORK( IR ), LDWRKR,
 | 
						|
     $                         WORK( ITAUQ ), WORK( IWORK ),
 | 
						|
     $                         LWORK-IWORK+1, IERR )
 | 
						|
                  IWORK = IE + N
 | 
						|
*
 | 
						|
*                 Perform bidiagonal QR iteration, computing left
 | 
						|
*                 singular vectors of R in WORK(IR)
 | 
						|
*                 (Workspace: need N*N + BDSPAC)
 | 
						|
*
 | 
						|
                  CALL DBDSQR( 'U', N, 0, N, 0, S, WORK( IE ), DUM, 1,
 | 
						|
     $                         WORK( IR ), LDWRKR, DUM, 1,
 | 
						|
     $                         WORK( IWORK ), INFO )
 | 
						|
                  IU = IE + N
 | 
						|
*
 | 
						|
*                 Multiply Q in A by left singular vectors of R in
 | 
						|
*                 WORK(IR), storing result in WORK(IU) and copying to A
 | 
						|
*                 (Workspace: need N*N + 2*N, prefer N*N + M*N + N)
 | 
						|
*
 | 
						|
                  DO 10 I = 1, M, LDWRKU
 | 
						|
                     CHUNK = MIN( M-I+1, LDWRKU )
 | 
						|
                     CALL DGEMM( 'N', 'N', CHUNK, N, N, ONE, A( I, 1 ),
 | 
						|
     $                           LDA, WORK( IR ), LDWRKR, ZERO,
 | 
						|
     $                           WORK( IU ), LDWRKU )
 | 
						|
                     CALL DLACPY( 'F', CHUNK, N, WORK( IU ), LDWRKU,
 | 
						|
     $                            A( I, 1 ), LDA )
 | 
						|
   10             CONTINUE
 | 
						|
*
 | 
						|
               ELSE
 | 
						|
*
 | 
						|
*                 Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                  IE = 1
 | 
						|
                  ITAUQ = IE + N
 | 
						|
                  ITAUP = ITAUQ + N
 | 
						|
                  IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                 Bidiagonalize A
 | 
						|
*                 (Workspace: need 3*N + M, prefer 3*N + (M + N)*NB)
 | 
						|
*
 | 
						|
                  CALL DGEBRD( M, N, A, LDA, S, WORK( IE ),
 | 
						|
     $                         WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Generate left vectors bidiagonalizing A
 | 
						|
*                 (Workspace: need 4*N, prefer 3*N + N*NB)
 | 
						|
*
 | 
						|
                  CALL DORGBR( 'Q', M, N, N, A, LDA, WORK( ITAUQ ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  IWORK = IE + N
 | 
						|
*
 | 
						|
*                 Perform bidiagonal QR iteration, computing left
 | 
						|
*                 singular vectors of A in A
 | 
						|
*                 (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                  CALL DBDSQR( 'U', N, 0, M, 0, S, WORK( IE ), DUM, 1,
 | 
						|
     $                         A, LDA, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
               END IF
 | 
						|
*
 | 
						|
            ELSE IF( WNTUO .AND. WNTVAS ) THEN
 | 
						|
*
 | 
						|
*              Path 3 (M much larger than N, JOBU='O', JOBVT='S' or 'A')
 | 
						|
*              N left singular vectors to be overwritten on A and
 | 
						|
*              N right singular vectors to be computed in VT
 | 
						|
*
 | 
						|
               IF( LWORK.GE.N*N+MAX( 4*N, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                 Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                  IR = 1
 | 
						|
                  IF( LWORK.GE.MAX( WRKBL, LDA*N + N ) + LDA*N ) THEN
 | 
						|
*
 | 
						|
*                    WORK(IU) is LDA by N and WORK(IR) is LDA by N
 | 
						|
*
 | 
						|
                     LDWRKU = LDA
 | 
						|
                     LDWRKR = LDA
 | 
						|
                  ELSE IF( LWORK.GE.MAX( WRKBL, LDA*N + N ) + N*N ) THEN
 | 
						|
*
 | 
						|
*                    WORK(IU) is LDA by N and WORK(IR) is N by N
 | 
						|
*
 | 
						|
                     LDWRKU = LDA
 | 
						|
                     LDWRKR = N
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    WORK(IU) is LDWRKU by N and WORK(IR) is N by N
 | 
						|
*
 | 
						|
                     LDWRKU = ( LWORK-N*N-N ) / N
 | 
						|
                     LDWRKR = N
 | 
						|
                  END IF
 | 
						|
                  ITAU = IR + LDWRKR*N
 | 
						|
                  IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                 Compute A=Q*R
 | 
						|
*                 (Workspace: need N*N + 2*N, prefer N*N + N + N*NB)
 | 
						|
*
 | 
						|
                  CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Copy R to VT, zeroing out below it
 | 
						|
*
 | 
						|
                  CALL DLACPY( 'U', N, N, A, LDA, VT, LDVT )
 | 
						|
                  IF( N.GT.1 )
 | 
						|
     $               CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                            VT( 2, 1 ), LDVT )
 | 
						|
*
 | 
						|
*                 Generate Q in A
 | 
						|
*                 (Workspace: need N*N + 2*N, prefer N*N + N + N*NB)
 | 
						|
*
 | 
						|
                  CALL DORGQR( M, N, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  IE = ITAU
 | 
						|
                  ITAUQ = IE + N
 | 
						|
                  ITAUP = ITAUQ + N
 | 
						|
                  IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                 Bidiagonalize R in VT, copying result to WORK(IR)
 | 
						|
*                 (Workspace: need N*N + 4*N, prefer N*N + 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
                  CALL DGEBRD( N, N, VT, LDVT, S, WORK( IE ),
 | 
						|
     $                         WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  CALL DLACPY( 'L', N, N, VT, LDVT, WORK( IR ), LDWRKR )
 | 
						|
*
 | 
						|
*                 Generate left vectors bidiagonalizing R in WORK(IR)
 | 
						|
*                 (Workspace: need N*N + 4*N, prefer N*N + 3*N + N*NB)
 | 
						|
*
 | 
						|
                  CALL DORGBR( 'Q', N, N, N, WORK( IR ), LDWRKR,
 | 
						|
     $                         WORK( ITAUQ ), WORK( IWORK ),
 | 
						|
     $                         LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Generate right vectors bidiagonalizing R in VT
 | 
						|
*                 (Workspace: need N*N + 4*N-1, prefer N*N + 3*N + (N-1)*NB)
 | 
						|
*
 | 
						|
                  CALL DORGBR( 'P', N, N, N, VT, LDVT, WORK( ITAUP ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  IWORK = IE + N
 | 
						|
*
 | 
						|
*                 Perform bidiagonal QR iteration, computing left
 | 
						|
*                 singular vectors of R in WORK(IR) and computing right
 | 
						|
*                 singular vectors of R in VT
 | 
						|
*                 (Workspace: need N*N + BDSPAC)
 | 
						|
*
 | 
						|
                  CALL DBDSQR( 'U', N, N, N, 0, S, WORK( IE ), VT, LDVT,
 | 
						|
     $                         WORK( IR ), LDWRKR, DUM, 1,
 | 
						|
     $                         WORK( IWORK ), INFO )
 | 
						|
                  IU = IE + N
 | 
						|
*
 | 
						|
*                 Multiply Q in A by left singular vectors of R in
 | 
						|
*                 WORK(IR), storing result in WORK(IU) and copying to A
 | 
						|
*                 (Workspace: need N*N + 2*N, prefer N*N + M*N + N)
 | 
						|
*
 | 
						|
                  DO 20 I = 1, M, LDWRKU
 | 
						|
                     CHUNK = MIN( M-I+1, LDWRKU )
 | 
						|
                     CALL DGEMM( 'N', 'N', CHUNK, N, N, ONE, A( I, 1 ),
 | 
						|
     $                           LDA, WORK( IR ), LDWRKR, ZERO,
 | 
						|
     $                           WORK( IU ), LDWRKU )
 | 
						|
                     CALL DLACPY( 'F', CHUNK, N, WORK( IU ), LDWRKU,
 | 
						|
     $                            A( I, 1 ), LDA )
 | 
						|
   20             CONTINUE
 | 
						|
*
 | 
						|
               ELSE
 | 
						|
*
 | 
						|
*                 Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                  ITAU = 1
 | 
						|
                  IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                 Compute A=Q*R
 | 
						|
*                 (Workspace: need 2*N, prefer N + N*NB)
 | 
						|
*
 | 
						|
                  CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Copy R to VT, zeroing out below it
 | 
						|
*
 | 
						|
                  CALL DLACPY( 'U', N, N, A, LDA, VT, LDVT )
 | 
						|
                  IF( N.GT.1 )
 | 
						|
     $               CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                            VT( 2, 1 ), LDVT )
 | 
						|
*
 | 
						|
*                 Generate Q in A
 | 
						|
*                 (Workspace: need 2*N, prefer N + N*NB)
 | 
						|
*
 | 
						|
                  CALL DORGQR( M, N, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  IE = ITAU
 | 
						|
                  ITAUQ = IE + N
 | 
						|
                  ITAUP = ITAUQ + N
 | 
						|
                  IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                 Bidiagonalize R in VT
 | 
						|
*                 (Workspace: need 4*N, prefer 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
                  CALL DGEBRD( N, N, VT, LDVT, S, WORK( IE ),
 | 
						|
     $                         WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Multiply Q in A by left vectors bidiagonalizing R
 | 
						|
*                 (Workspace: need 3*N + M, prefer 3*N + M*NB)
 | 
						|
*
 | 
						|
                  CALL DORMBR( 'Q', 'R', 'N', M, N, N, VT, LDVT,
 | 
						|
     $                         WORK( ITAUQ ), A, LDA, WORK( IWORK ),
 | 
						|
     $                         LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Generate right vectors bidiagonalizing R in VT
 | 
						|
*                 (Workspace: need 4*N-1, prefer 3*N + (N-1)*NB)
 | 
						|
*
 | 
						|
                  CALL DORGBR( 'P', N, N, N, VT, LDVT, WORK( ITAUP ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  IWORK = IE + N
 | 
						|
*
 | 
						|
*                 Perform bidiagonal QR iteration, computing left
 | 
						|
*                 singular vectors of A in A and computing right
 | 
						|
*                 singular vectors of A in VT
 | 
						|
*                 (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                  CALL DBDSQR( 'U', N, N, M, 0, S, WORK( IE ), VT, LDVT,
 | 
						|
     $                         A, LDA, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
               END IF
 | 
						|
*
 | 
						|
            ELSE IF( WNTUS ) THEN
 | 
						|
*
 | 
						|
               IF( WNTVN ) THEN
 | 
						|
*
 | 
						|
*                 Path 4 (M much larger than N, JOBU='S', JOBVT='N')
 | 
						|
*                 N left singular vectors to be computed in U and
 | 
						|
*                 no right singular vectors to be computed
 | 
						|
*
 | 
						|
                  IF( LWORK.GE.N*N+MAX( 4*N, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                    Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     IR = 1
 | 
						|
                     IF( LWORK.GE.WRKBL+LDA*N ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IR) is LDA by N
 | 
						|
*
 | 
						|
                        LDWRKR = LDA
 | 
						|
                     ELSE
 | 
						|
*
 | 
						|
*                       WORK(IR) is N by N
 | 
						|
*
 | 
						|
                        LDWRKR = N
 | 
						|
                     END IF
 | 
						|
                     ITAU = IR + LDWRKR*N
 | 
						|
                     IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                    Compute A=Q*R
 | 
						|
*                    (Workspace: need N*N + 2*N, prefer N*N + N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy R to WORK(IR), zeroing out below it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'U', N, N, A, LDA, WORK( IR ),
 | 
						|
     $                            LDWRKR )
 | 
						|
                     CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                            WORK( IR+1 ), LDWRKR )
 | 
						|
*
 | 
						|
*                    Generate Q in A
 | 
						|
*                    (Workspace: need N*N + 2*N, prefer N*N + N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGQR( M, N, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + N
 | 
						|
                     ITAUP = ITAUQ + N
 | 
						|
                     IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                    Bidiagonalize R in WORK(IR)
 | 
						|
*                    (Workspace: need N*N + 4*N, prefer N*N + 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( N, N, WORK( IR ), LDWRKR, S,
 | 
						|
     $                            WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate left vectors bidiagonalizing R in WORK(IR)
 | 
						|
*                    (Workspace: need N*N + 4*N, prefer N*N + 3*N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', N, N, N, WORK( IR ), LDWRKR,
 | 
						|
     $                            WORK( ITAUQ ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + N
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of R in WORK(IR)
 | 
						|
*                    (Workspace: need N*N + BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', N, 0, N, 0, S, WORK( IE ), DUM,
 | 
						|
     $                            1, WORK( IR ), LDWRKR, DUM, 1,
 | 
						|
     $                            WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*                    Multiply Q in A by left singular vectors of R in
 | 
						|
*                    WORK(IR), storing result in U
 | 
						|
*                    (Workspace: need N*N)
 | 
						|
*
 | 
						|
                     CALL DGEMM( 'N', 'N', M, N, N, ONE, A, LDA,
 | 
						|
     $                           WORK( IR ), LDWRKR, ZERO, U, LDU )
 | 
						|
*
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     ITAU = 1
 | 
						|
                     IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                    Compute A=Q*R, copying result to U
 | 
						|
*                    (Workspace: need 2*N, prefer N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'L', M, N, A, LDA, U, LDU )
 | 
						|
*
 | 
						|
*                    Generate Q in U
 | 
						|
*                    (Workspace: need 2*N, prefer N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGQR( M, N, N, U, LDU, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + N
 | 
						|
                     ITAUP = ITAUQ + N
 | 
						|
                     IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                    Zero out below R in A
 | 
						|
*
 | 
						|
                     IF( N .GT. 1 ) THEN
 | 
						|
                        CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                               A( 2, 1 ), LDA )
 | 
						|
                     END IF
 | 
						|
*
 | 
						|
*                    Bidiagonalize R in A
 | 
						|
*                    (Workspace: need 4*N, prefer 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( N, N, A, LDA, S, WORK( IE ),
 | 
						|
     $                            WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Multiply Q in U by left vectors bidiagonalizing R
 | 
						|
*                    (Workspace: need 3*N + M, prefer 3*N + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORMBR( 'Q', 'R', 'N', M, N, N, A, LDA,
 | 
						|
     $                            WORK( ITAUQ ), U, LDU, WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + N
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of A in U
 | 
						|
*                    (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', N, 0, M, 0, S, WORK( IE ), DUM,
 | 
						|
     $                            1, U, LDU, DUM, 1, WORK( IWORK ),
 | 
						|
     $                            INFO )
 | 
						|
*
 | 
						|
                  END IF
 | 
						|
*
 | 
						|
               ELSE IF( WNTVO ) THEN
 | 
						|
*
 | 
						|
*                 Path 5 (M much larger than N, JOBU='S', JOBVT='O')
 | 
						|
*                 N left singular vectors to be computed in U and
 | 
						|
*                 N right singular vectors to be overwritten on A
 | 
						|
*
 | 
						|
                  IF( LWORK.GE.2*N*N+MAX( 4*N, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                    Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     IU = 1
 | 
						|
                     IF( LWORK.GE.WRKBL+2*LDA*N ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IU) is LDA by N and WORK(IR) is LDA by N
 | 
						|
*
 | 
						|
                        LDWRKU = LDA
 | 
						|
                        IR = IU + LDWRKU*N
 | 
						|
                        LDWRKR = LDA
 | 
						|
                     ELSE IF( LWORK.GE.WRKBL+( LDA + N )*N ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IU) is LDA by N and WORK(IR) is N by N
 | 
						|
*
 | 
						|
                        LDWRKU = LDA
 | 
						|
                        IR = IU + LDWRKU*N
 | 
						|
                        LDWRKR = N
 | 
						|
                     ELSE
 | 
						|
*
 | 
						|
*                       WORK(IU) is N by N and WORK(IR) is N by N
 | 
						|
*
 | 
						|
                        LDWRKU = N
 | 
						|
                        IR = IU + LDWRKU*N
 | 
						|
                        LDWRKR = N
 | 
						|
                     END IF
 | 
						|
                     ITAU = IR + LDWRKR*N
 | 
						|
                     IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                    Compute A=Q*R
 | 
						|
*                    (Workspace: need 2*N*N + 2*N, prefer 2*N*N + N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy R to WORK(IU), zeroing out below it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'U', N, N, A, LDA, WORK( IU ),
 | 
						|
     $                            LDWRKU )
 | 
						|
                     CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                            WORK( IU+1 ), LDWRKU )
 | 
						|
*
 | 
						|
*                    Generate Q in A
 | 
						|
*                    (Workspace: need 2*N*N + 2*N, prefer 2*N*N + N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGQR( M, N, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + N
 | 
						|
                     ITAUP = ITAUQ + N
 | 
						|
                     IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                    Bidiagonalize R in WORK(IU), copying result to
 | 
						|
*                    WORK(IR)
 | 
						|
*                    (Workspace: need 2*N*N + 4*N,
 | 
						|
*                                prefer 2*N*N+3*N+2*N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( N, N, WORK( IU ), LDWRKU, S,
 | 
						|
     $                            WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'U', N, N, WORK( IU ), LDWRKU,
 | 
						|
     $                            WORK( IR ), LDWRKR )
 | 
						|
*
 | 
						|
*                    Generate left bidiagonalizing vectors in WORK(IU)
 | 
						|
*                    (Workspace: need 2*N*N + 4*N, prefer 2*N*N + 3*N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', N, N, N, WORK( IU ), LDWRKU,
 | 
						|
     $                            WORK( ITAUQ ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate right bidiagonalizing vectors in WORK(IR)
 | 
						|
*                    (Workspace: need 2*N*N + 4*N-1,
 | 
						|
*                                prefer 2*N*N+3*N+(N-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', N, N, N, WORK( IR ), LDWRKR,
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + N
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of R in WORK(IU) and computing
 | 
						|
*                    right singular vectors of R in WORK(IR)
 | 
						|
*                    (Workspace: need 2*N*N + BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', N, N, N, 0, S, WORK( IE ),
 | 
						|
     $                            WORK( IR ), LDWRKR, WORK( IU ),
 | 
						|
     $                            LDWRKU, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*                    Multiply Q in A by left singular vectors of R in
 | 
						|
*                    WORK(IU), storing result in U
 | 
						|
*                    (Workspace: need N*N)
 | 
						|
*
 | 
						|
                     CALL DGEMM( 'N', 'N', M, N, N, ONE, A, LDA,
 | 
						|
     $                           WORK( IU ), LDWRKU, ZERO, U, LDU )
 | 
						|
*
 | 
						|
*                    Copy right singular vectors of R to A
 | 
						|
*                    (Workspace: need N*N)
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'F', N, N, WORK( IR ), LDWRKR, A,
 | 
						|
     $                            LDA )
 | 
						|
*
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     ITAU = 1
 | 
						|
                     IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                    Compute A=Q*R, copying result to U
 | 
						|
*                    (Workspace: need 2*N, prefer N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'L', M, N, A, LDA, U, LDU )
 | 
						|
*
 | 
						|
*                    Generate Q in U
 | 
						|
*                    (Workspace: need 2*N, prefer N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGQR( M, N, N, U, LDU, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + N
 | 
						|
                     ITAUP = ITAUQ + N
 | 
						|
                     IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                    Zero out below R in A
 | 
						|
*
 | 
						|
                     IF( N .GT. 1 ) THEN
 | 
						|
                        CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                               A( 2, 1 ), LDA )
 | 
						|
                     END IF
 | 
						|
*
 | 
						|
*                    Bidiagonalize R in A
 | 
						|
*                    (Workspace: need 4*N, prefer 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( N, N, A, LDA, S, WORK( IE ),
 | 
						|
     $                            WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Multiply Q in U by left vectors bidiagonalizing R
 | 
						|
*                    (Workspace: need 3*N + M, prefer 3*N + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORMBR( 'Q', 'R', 'N', M, N, N, A, LDA,
 | 
						|
     $                            WORK( ITAUQ ), U, LDU, WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate right vectors bidiagonalizing R in A
 | 
						|
*                    (Workspace: need 4*N-1, prefer 3*N + (N-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', N, N, N, A, LDA, WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + N
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of A in U and computing right
 | 
						|
*                    singular vectors of A in A
 | 
						|
*                    (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', N, N, M, 0, S, WORK( IE ), A,
 | 
						|
     $                            LDA, U, LDU, DUM, 1, WORK( IWORK ),
 | 
						|
     $                            INFO )
 | 
						|
*
 | 
						|
                  END IF
 | 
						|
*
 | 
						|
               ELSE IF( WNTVAS ) THEN
 | 
						|
*
 | 
						|
*                 Path 6 (M much larger than N, JOBU='S', JOBVT='S'
 | 
						|
*                         or 'A')
 | 
						|
*                 N left singular vectors to be computed in U and
 | 
						|
*                 N right singular vectors to be computed in VT
 | 
						|
*
 | 
						|
                  IF( LWORK.GE.N*N+MAX( 4*N, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                    Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     IU = 1
 | 
						|
                     IF( LWORK.GE.WRKBL+LDA*N ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IU) is LDA by N
 | 
						|
*
 | 
						|
                        LDWRKU = LDA
 | 
						|
                     ELSE
 | 
						|
*
 | 
						|
*                       WORK(IU) is N by N
 | 
						|
*
 | 
						|
                        LDWRKU = N
 | 
						|
                     END IF
 | 
						|
                     ITAU = IU + LDWRKU*N
 | 
						|
                     IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                    Compute A=Q*R
 | 
						|
*                    (Workspace: need N*N + 2*N, prefer N*N + N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy R to WORK(IU), zeroing out below it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'U', N, N, A, LDA, WORK( IU ),
 | 
						|
     $                            LDWRKU )
 | 
						|
                     CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                            WORK( IU+1 ), LDWRKU )
 | 
						|
*
 | 
						|
*                    Generate Q in A
 | 
						|
*                    (Workspace: need N*N + 2*N, prefer N*N + N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGQR( M, N, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + N
 | 
						|
                     ITAUP = ITAUQ + N
 | 
						|
                     IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                    Bidiagonalize R in WORK(IU), copying result to VT
 | 
						|
*                    (Workspace: need N*N + 4*N, prefer N*N + 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( N, N, WORK( IU ), LDWRKU, S,
 | 
						|
     $                            WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'U', N, N, WORK( IU ), LDWRKU, VT,
 | 
						|
     $                            LDVT )
 | 
						|
*
 | 
						|
*                    Generate left bidiagonalizing vectors in WORK(IU)
 | 
						|
*                    (Workspace: need N*N + 4*N, prefer N*N + 3*N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', N, N, N, WORK( IU ), LDWRKU,
 | 
						|
     $                            WORK( ITAUQ ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate right bidiagonalizing vectors in VT
 | 
						|
*                    (Workspace: need N*N + 4*N-1,
 | 
						|
*                                prefer N*N+3*N+(N-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', N, N, N, VT, LDVT, WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + N
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of R in WORK(IU) and computing
 | 
						|
*                    right singular vectors of R in VT
 | 
						|
*                    (Workspace: need N*N + BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', N, N, N, 0, S, WORK( IE ), VT,
 | 
						|
     $                            LDVT, WORK( IU ), LDWRKU, DUM, 1,
 | 
						|
     $                            WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*                    Multiply Q in A by left singular vectors of R in
 | 
						|
*                    WORK(IU), storing result in U
 | 
						|
*                    (Workspace: need N*N)
 | 
						|
*
 | 
						|
                     CALL DGEMM( 'N', 'N', M, N, N, ONE, A, LDA,
 | 
						|
     $                           WORK( IU ), LDWRKU, ZERO, U, LDU )
 | 
						|
*
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     ITAU = 1
 | 
						|
                     IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                    Compute A=Q*R, copying result to U
 | 
						|
*                    (Workspace: need 2*N, prefer N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'L', M, N, A, LDA, U, LDU )
 | 
						|
*
 | 
						|
*                    Generate Q in U
 | 
						|
*                    (Workspace: need 2*N, prefer N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGQR( M, N, N, U, LDU, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy R to VT, zeroing out below it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'U', N, N, A, LDA, VT, LDVT )
 | 
						|
                     IF( N.GT.1 )
 | 
						|
     $                  CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                               VT( 2, 1 ), LDVT )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + N
 | 
						|
                     ITAUP = ITAUQ + N
 | 
						|
                     IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                    Bidiagonalize R in VT
 | 
						|
*                    (Workspace: need 4*N, prefer 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( N, N, VT, LDVT, S, WORK( IE ),
 | 
						|
     $                            WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Multiply Q in U by left bidiagonalizing vectors
 | 
						|
*                    in VT
 | 
						|
*                    (Workspace: need 3*N + M, prefer 3*N + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORMBR( 'Q', 'R', 'N', M, N, N, VT, LDVT,
 | 
						|
     $                            WORK( ITAUQ ), U, LDU, WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate right bidiagonalizing vectors in VT
 | 
						|
*                    (Workspace: need 4*N-1, prefer 3*N + (N-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', N, N, N, VT, LDVT, WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + N
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of A in U and computing right
 | 
						|
*                    singular vectors of A in VT
 | 
						|
*                    (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', N, N, M, 0, S, WORK( IE ), VT,
 | 
						|
     $                            LDVT, U, LDU, DUM, 1, WORK( IWORK ),
 | 
						|
     $                            INFO )
 | 
						|
*
 | 
						|
                  END IF
 | 
						|
*
 | 
						|
               END IF
 | 
						|
*
 | 
						|
            ELSE IF( WNTUA ) THEN
 | 
						|
*
 | 
						|
               IF( WNTVN ) THEN
 | 
						|
*
 | 
						|
*                 Path 7 (M much larger than N, JOBU='A', JOBVT='N')
 | 
						|
*                 M left singular vectors to be computed in U and
 | 
						|
*                 no right singular vectors to be computed
 | 
						|
*
 | 
						|
                  IF( LWORK.GE.N*N+MAX( N+M, 4*N, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                    Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     IR = 1
 | 
						|
                     IF( LWORK.GE.WRKBL+LDA*N ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IR) is LDA by N
 | 
						|
*
 | 
						|
                        LDWRKR = LDA
 | 
						|
                     ELSE
 | 
						|
*
 | 
						|
*                       WORK(IR) is N by N
 | 
						|
*
 | 
						|
                        LDWRKR = N
 | 
						|
                     END IF
 | 
						|
                     ITAU = IR + LDWRKR*N
 | 
						|
                     IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                    Compute A=Q*R, copying result to U
 | 
						|
*                    (Workspace: need N*N + 2*N, prefer N*N + N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'L', M, N, A, LDA, U, LDU )
 | 
						|
*
 | 
						|
*                    Copy R to WORK(IR), zeroing out below it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'U', N, N, A, LDA, WORK( IR ),
 | 
						|
     $                            LDWRKR )
 | 
						|
                     CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                            WORK( IR+1 ), LDWRKR )
 | 
						|
*
 | 
						|
*                    Generate Q in U
 | 
						|
*                    (Workspace: need N*N + N + M, prefer N*N + N + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGQR( M, M, N, U, LDU, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + N
 | 
						|
                     ITAUP = ITAUQ + N
 | 
						|
                     IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                    Bidiagonalize R in WORK(IR)
 | 
						|
*                    (Workspace: need N*N + 4*N, prefer N*N + 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( N, N, WORK( IR ), LDWRKR, S,
 | 
						|
     $                            WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate left bidiagonalizing vectors in WORK(IR)
 | 
						|
*                    (Workspace: need N*N + 4*N, prefer N*N + 3*N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', N, N, N, WORK( IR ), LDWRKR,
 | 
						|
     $                            WORK( ITAUQ ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + N
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of R in WORK(IR)
 | 
						|
*                    (Workspace: need N*N + BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', N, 0, N, 0, S, WORK( IE ), DUM,
 | 
						|
     $                            1, WORK( IR ), LDWRKR, DUM, 1,
 | 
						|
     $                            WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*                    Multiply Q in U by left singular vectors of R in
 | 
						|
*                    WORK(IR), storing result in A
 | 
						|
*                    (Workspace: need N*N)
 | 
						|
*
 | 
						|
                     CALL DGEMM( 'N', 'N', M, N, N, ONE, U, LDU,
 | 
						|
     $                           WORK( IR ), LDWRKR, ZERO, A, LDA )
 | 
						|
*
 | 
						|
*                    Copy left singular vectors of A from A to U
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'F', M, N, A, LDA, U, LDU )
 | 
						|
*
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     ITAU = 1
 | 
						|
                     IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                    Compute A=Q*R, copying result to U
 | 
						|
*                    (Workspace: need 2*N, prefer N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'L', M, N, A, LDA, U, LDU )
 | 
						|
*
 | 
						|
*                    Generate Q in U
 | 
						|
*                    (Workspace: need N + M, prefer N + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGQR( M, M, N, U, LDU, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + N
 | 
						|
                     ITAUP = ITAUQ + N
 | 
						|
                     IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                    Zero out below R in A
 | 
						|
*
 | 
						|
                     IF( N .GT. 1 ) THEN
 | 
						|
                        CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                                A( 2, 1 ), LDA )
 | 
						|
                     END IF
 | 
						|
*
 | 
						|
*                    Bidiagonalize R in A
 | 
						|
*                    (Workspace: need 4*N, prefer 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( N, N, A, LDA, S, WORK( IE ),
 | 
						|
     $                            WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Multiply Q in U by left bidiagonalizing vectors
 | 
						|
*                    in A
 | 
						|
*                    (Workspace: need 3*N + M, prefer 3*N + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORMBR( 'Q', 'R', 'N', M, N, N, A, LDA,
 | 
						|
     $                            WORK( ITAUQ ), U, LDU, WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + N
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of A in U
 | 
						|
*                    (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', N, 0, M, 0, S, WORK( IE ), DUM,
 | 
						|
     $                            1, U, LDU, DUM, 1, WORK( IWORK ),
 | 
						|
     $                            INFO )
 | 
						|
*
 | 
						|
                  END IF
 | 
						|
*
 | 
						|
               ELSE IF( WNTVO ) THEN
 | 
						|
*
 | 
						|
*                 Path 8 (M much larger than N, JOBU='A', JOBVT='O')
 | 
						|
*                 M left singular vectors to be computed in U and
 | 
						|
*                 N right singular vectors to be overwritten on A
 | 
						|
*
 | 
						|
                  IF( LWORK.GE.2*N*N+MAX( N+M, 4*N, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                    Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     IU = 1
 | 
						|
                     IF( LWORK.GE.WRKBL+2*LDA*N ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IU) is LDA by N and WORK(IR) is LDA by N
 | 
						|
*
 | 
						|
                        LDWRKU = LDA
 | 
						|
                        IR = IU + LDWRKU*N
 | 
						|
                        LDWRKR = LDA
 | 
						|
                     ELSE IF( LWORK.GE.WRKBL+( LDA + N )*N ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IU) is LDA by N and WORK(IR) is N by N
 | 
						|
*
 | 
						|
                        LDWRKU = LDA
 | 
						|
                        IR = IU + LDWRKU*N
 | 
						|
                        LDWRKR = N
 | 
						|
                     ELSE
 | 
						|
*
 | 
						|
*                       WORK(IU) is N by N and WORK(IR) is N by N
 | 
						|
*
 | 
						|
                        LDWRKU = N
 | 
						|
                        IR = IU + LDWRKU*N
 | 
						|
                        LDWRKR = N
 | 
						|
                     END IF
 | 
						|
                     ITAU = IR + LDWRKR*N
 | 
						|
                     IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                    Compute A=Q*R, copying result to U
 | 
						|
*                    (Workspace: need 2*N*N + 2*N, prefer 2*N*N + N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'L', M, N, A, LDA, U, LDU )
 | 
						|
*
 | 
						|
*                    Generate Q in U
 | 
						|
*                    (Workspace: need 2*N*N + N + M, prefer 2*N*N + N + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGQR( M, M, N, U, LDU, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy R to WORK(IU), zeroing out below it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'U', N, N, A, LDA, WORK( IU ),
 | 
						|
     $                            LDWRKU )
 | 
						|
                     CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                            WORK( IU+1 ), LDWRKU )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + N
 | 
						|
                     ITAUP = ITAUQ + N
 | 
						|
                     IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                    Bidiagonalize R in WORK(IU), copying result to
 | 
						|
*                    WORK(IR)
 | 
						|
*                    (Workspace: need 2*N*N + 4*N,
 | 
						|
*                                prefer 2*N*N+3*N+2*N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( N, N, WORK( IU ), LDWRKU, S,
 | 
						|
     $                            WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'U', N, N, WORK( IU ), LDWRKU,
 | 
						|
     $                            WORK( IR ), LDWRKR )
 | 
						|
*
 | 
						|
*                    Generate left bidiagonalizing vectors in WORK(IU)
 | 
						|
*                    (Workspace: need 2*N*N + 4*N, prefer 2*N*N + 3*N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', N, N, N, WORK( IU ), LDWRKU,
 | 
						|
     $                            WORK( ITAUQ ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate right bidiagonalizing vectors in WORK(IR)
 | 
						|
*                    (Workspace: need 2*N*N + 4*N-1,
 | 
						|
*                                prefer 2*N*N+3*N+(N-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', N, N, N, WORK( IR ), LDWRKR,
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + N
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of R in WORK(IU) and computing
 | 
						|
*                    right singular vectors of R in WORK(IR)
 | 
						|
*                    (Workspace: need 2*N*N + BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', N, N, N, 0, S, WORK( IE ),
 | 
						|
     $                            WORK( IR ), LDWRKR, WORK( IU ),
 | 
						|
     $                            LDWRKU, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*                    Multiply Q in U by left singular vectors of R in
 | 
						|
*                    WORK(IU), storing result in A
 | 
						|
*                    (Workspace: need N*N)
 | 
						|
*
 | 
						|
                     CALL DGEMM( 'N', 'N', M, N, N, ONE, U, LDU,
 | 
						|
     $                           WORK( IU ), LDWRKU, ZERO, A, LDA )
 | 
						|
*
 | 
						|
*                    Copy left singular vectors of A from A to U
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'F', M, N, A, LDA, U, LDU )
 | 
						|
*
 | 
						|
*                    Copy right singular vectors of R from WORK(IR) to A
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'F', N, N, WORK( IR ), LDWRKR, A,
 | 
						|
     $                            LDA )
 | 
						|
*
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     ITAU = 1
 | 
						|
                     IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                    Compute A=Q*R, copying result to U
 | 
						|
*                    (Workspace: need 2*N, prefer N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'L', M, N, A, LDA, U, LDU )
 | 
						|
*
 | 
						|
*                    Generate Q in U
 | 
						|
*                    (Workspace: need N + M, prefer N + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGQR( M, M, N, U, LDU, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + N
 | 
						|
                     ITAUP = ITAUQ + N
 | 
						|
                     IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                    Zero out below R in A
 | 
						|
*
 | 
						|
                     IF( N .GT. 1 ) THEN
 | 
						|
                        CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                                A( 2, 1 ), LDA )
 | 
						|
                     END IF
 | 
						|
*
 | 
						|
*                    Bidiagonalize R in A
 | 
						|
*                    (Workspace: need 4*N, prefer 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( N, N, A, LDA, S, WORK( IE ),
 | 
						|
     $                            WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Multiply Q in U by left bidiagonalizing vectors
 | 
						|
*                    in A
 | 
						|
*                    (Workspace: need 3*N + M, prefer 3*N + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORMBR( 'Q', 'R', 'N', M, N, N, A, LDA,
 | 
						|
     $                            WORK( ITAUQ ), U, LDU, WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate right bidiagonalizing vectors in A
 | 
						|
*                    (Workspace: need 4*N-1, prefer 3*N + (N-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', N, N, N, A, LDA, WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + N
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of A in U and computing right
 | 
						|
*                    singular vectors of A in A
 | 
						|
*                    (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', N, N, M, 0, S, WORK( IE ), A,
 | 
						|
     $                            LDA, U, LDU, DUM, 1, WORK( IWORK ),
 | 
						|
     $                            INFO )
 | 
						|
*
 | 
						|
                  END IF
 | 
						|
*
 | 
						|
               ELSE IF( WNTVAS ) THEN
 | 
						|
*
 | 
						|
*                 Path 9 (M much larger than N, JOBU='A', JOBVT='S'
 | 
						|
*                         or 'A')
 | 
						|
*                 M left singular vectors to be computed in U and
 | 
						|
*                 N right singular vectors to be computed in VT
 | 
						|
*
 | 
						|
                  IF( LWORK.GE.N*N+MAX( N+M, 4*N, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                    Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     IU = 1
 | 
						|
                     IF( LWORK.GE.WRKBL+LDA*N ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IU) is LDA by N
 | 
						|
*
 | 
						|
                        LDWRKU = LDA
 | 
						|
                     ELSE
 | 
						|
*
 | 
						|
*                       WORK(IU) is N by N
 | 
						|
*
 | 
						|
                        LDWRKU = N
 | 
						|
                     END IF
 | 
						|
                     ITAU = IU + LDWRKU*N
 | 
						|
                     IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                    Compute A=Q*R, copying result to U
 | 
						|
*                    (Workspace: need N*N + 2*N, prefer N*N + N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'L', M, N, A, LDA, U, LDU )
 | 
						|
*
 | 
						|
*                    Generate Q in U
 | 
						|
*                    (Workspace: need N*N + N + M, prefer N*N + N + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGQR( M, M, N, U, LDU, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy R to WORK(IU), zeroing out below it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'U', N, N, A, LDA, WORK( IU ),
 | 
						|
     $                            LDWRKU )
 | 
						|
                     CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                            WORK( IU+1 ), LDWRKU )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + N
 | 
						|
                     ITAUP = ITAUQ + N
 | 
						|
                     IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                    Bidiagonalize R in WORK(IU), copying result to VT
 | 
						|
*                    (Workspace: need N*N + 4*N, prefer N*N + 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( N, N, WORK( IU ), LDWRKU, S,
 | 
						|
     $                            WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'U', N, N, WORK( IU ), LDWRKU, VT,
 | 
						|
     $                            LDVT )
 | 
						|
*
 | 
						|
*                    Generate left bidiagonalizing vectors in WORK(IU)
 | 
						|
*                    (Workspace: need N*N + 4*N, prefer N*N + 3*N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', N, N, N, WORK( IU ), LDWRKU,
 | 
						|
     $                            WORK( ITAUQ ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate right bidiagonalizing vectors in VT
 | 
						|
*                    (Workspace: need N*N + 4*N-1,
 | 
						|
*                                prefer N*N+3*N+(N-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', N, N, N, VT, LDVT, WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + N
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of R in WORK(IU) and computing
 | 
						|
*                    right singular vectors of R in VT
 | 
						|
*                    (Workspace: need N*N + BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', N, N, N, 0, S, WORK( IE ), VT,
 | 
						|
     $                            LDVT, WORK( IU ), LDWRKU, DUM, 1,
 | 
						|
     $                            WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*                    Multiply Q in U by left singular vectors of R in
 | 
						|
*                    WORK(IU), storing result in A
 | 
						|
*                    (Workspace: need N*N)
 | 
						|
*
 | 
						|
                     CALL DGEMM( 'N', 'N', M, N, N, ONE, U, LDU,
 | 
						|
     $                           WORK( IU ), LDWRKU, ZERO, A, LDA )
 | 
						|
*
 | 
						|
*                    Copy left singular vectors of A from A to U
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'F', M, N, A, LDA, U, LDU )
 | 
						|
*
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     ITAU = 1
 | 
						|
                     IWORK = ITAU + N
 | 
						|
*
 | 
						|
*                    Compute A=Q*R, copying result to U
 | 
						|
*                    (Workspace: need 2*N, prefer N + N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEQRF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'L', M, N, A, LDA, U, LDU )
 | 
						|
*
 | 
						|
*                    Generate Q in U
 | 
						|
*                    (Workspace: need N + M, prefer N + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGQR( M, M, N, U, LDU, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy R from A to VT, zeroing out below it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'U', N, N, A, LDA, VT, LDVT )
 | 
						|
                     IF( N.GT.1 )
 | 
						|
     $                  CALL DLASET( 'L', N-1, N-1, ZERO, ZERO,
 | 
						|
     $                               VT( 2, 1 ), LDVT )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + N
 | 
						|
                     ITAUP = ITAUQ + N
 | 
						|
                     IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*                    Bidiagonalize R in VT
 | 
						|
*                    (Workspace: need 4*N, prefer 3*N + 2*N*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( N, N, VT, LDVT, S, WORK( IE ),
 | 
						|
     $                            WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Multiply Q in U by left bidiagonalizing vectors
 | 
						|
*                    in VT
 | 
						|
*                    (Workspace: need 3*N + M, prefer 3*N + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORMBR( 'Q', 'R', 'N', M, N, N, VT, LDVT,
 | 
						|
     $                            WORK( ITAUQ ), U, LDU, WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate right bidiagonalizing vectors in VT
 | 
						|
*                    (Workspace: need 4*N-1, prefer 3*N + (N-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', N, N, N, VT, LDVT, WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + N
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of A in U and computing right
 | 
						|
*                    singular vectors of A in VT
 | 
						|
*                    (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', N, N, M, 0, S, WORK( IE ), VT,
 | 
						|
     $                            LDVT, U, LDU, DUM, 1, WORK( IWORK ),
 | 
						|
     $                            INFO )
 | 
						|
*
 | 
						|
                  END IF
 | 
						|
*
 | 
						|
               END IF
 | 
						|
*
 | 
						|
            END IF
 | 
						|
*
 | 
						|
         ELSE
 | 
						|
*
 | 
						|
*           M .LT. MNTHR
 | 
						|
*
 | 
						|
*           Path 10 (M at least N, but not much larger)
 | 
						|
*           Reduce to bidiagonal form without QR decomposition
 | 
						|
*
 | 
						|
            IE = 1
 | 
						|
            ITAUQ = IE + N
 | 
						|
            ITAUP = ITAUQ + N
 | 
						|
            IWORK = ITAUP + N
 | 
						|
*
 | 
						|
*           Bidiagonalize A
 | 
						|
*           (Workspace: need 3*N + M, prefer 3*N + (M + N)*NB)
 | 
						|
*
 | 
						|
            CALL DGEBRD( M, N, A, LDA, S, WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                   WORK( ITAUP ), WORK( IWORK ), LWORK-IWORK+1,
 | 
						|
     $                   IERR )
 | 
						|
            IF( WNTUAS ) THEN
 | 
						|
*
 | 
						|
*              If left singular vectors desired in U, copy result to U
 | 
						|
*              and generate left bidiagonalizing vectors in U
 | 
						|
*              (Workspace: need 3*N + NCU, prefer 3*N + NCU*NB)
 | 
						|
*
 | 
						|
               CALL DLACPY( 'L', M, N, A, LDA, U, LDU )
 | 
						|
               IF( WNTUS )
 | 
						|
     $            NCU = N
 | 
						|
               IF( WNTUA )
 | 
						|
     $            NCU = M
 | 
						|
               CALL DORGBR( 'Q', M, NCU, N, U, LDU, WORK( ITAUQ ),
 | 
						|
     $                      WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
            END IF
 | 
						|
            IF( WNTVAS ) THEN
 | 
						|
*
 | 
						|
*              If right singular vectors desired in VT, copy result to
 | 
						|
*              VT and generate right bidiagonalizing vectors in VT
 | 
						|
*              (Workspace: need 4*N-1, prefer 3*N + (N-1)*NB)
 | 
						|
*
 | 
						|
               CALL DLACPY( 'U', N, N, A, LDA, VT, LDVT )
 | 
						|
               CALL DORGBR( 'P', N, N, N, VT, LDVT, WORK( ITAUP ),
 | 
						|
     $                      WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
            END IF
 | 
						|
            IF( WNTUO ) THEN
 | 
						|
*
 | 
						|
*              If left singular vectors desired in A, generate left
 | 
						|
*              bidiagonalizing vectors in A
 | 
						|
*              (Workspace: need 4*N, prefer 3*N + N*NB)
 | 
						|
*
 | 
						|
               CALL DORGBR( 'Q', M, N, N, A, LDA, WORK( ITAUQ ),
 | 
						|
     $                      WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
            END IF
 | 
						|
            IF( WNTVO ) THEN
 | 
						|
*
 | 
						|
*              If right singular vectors desired in A, generate right
 | 
						|
*              bidiagonalizing vectors in A
 | 
						|
*              (Workspace: need 4*N-1, prefer 3*N + (N-1)*NB)
 | 
						|
*
 | 
						|
               CALL DORGBR( 'P', N, N, N, A, LDA, WORK( ITAUP ),
 | 
						|
     $                      WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
            END IF
 | 
						|
            IWORK = IE + N
 | 
						|
            IF( WNTUAS .OR. WNTUO )
 | 
						|
     $         NRU = M
 | 
						|
            IF( WNTUN )
 | 
						|
     $         NRU = 0
 | 
						|
            IF( WNTVAS .OR. WNTVO )
 | 
						|
     $         NCVT = N
 | 
						|
            IF( WNTVN )
 | 
						|
     $         NCVT = 0
 | 
						|
            IF( ( .NOT.WNTUO ) .AND. ( .NOT.WNTVO ) ) THEN
 | 
						|
*
 | 
						|
*              Perform bidiagonal QR iteration, if desired, computing
 | 
						|
*              left singular vectors in U and computing right singular
 | 
						|
*              vectors in VT
 | 
						|
*              (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
               CALL DBDSQR( 'U', N, NCVT, NRU, 0, S, WORK( IE ), VT,
 | 
						|
     $                      LDVT, U, LDU, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
            ELSE IF( ( .NOT.WNTUO ) .AND. WNTVO ) THEN
 | 
						|
*
 | 
						|
*              Perform bidiagonal QR iteration, if desired, computing
 | 
						|
*              left singular vectors in U and computing right singular
 | 
						|
*              vectors in A
 | 
						|
*              (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
               CALL DBDSQR( 'U', N, NCVT, NRU, 0, S, WORK( IE ), A, LDA,
 | 
						|
     $                      U, LDU, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
            ELSE
 | 
						|
*
 | 
						|
*              Perform bidiagonal QR iteration, if desired, computing
 | 
						|
*              left singular vectors in A and computing right singular
 | 
						|
*              vectors in VT
 | 
						|
*              (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
               CALL DBDSQR( 'U', N, NCVT, NRU, 0, S, WORK( IE ), VT,
 | 
						|
     $                      LDVT, A, LDA, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
            END IF
 | 
						|
*
 | 
						|
         END IF
 | 
						|
*
 | 
						|
      ELSE
 | 
						|
*
 | 
						|
*        A has more columns than rows. If A has sufficiently more
 | 
						|
*        columns than rows, first reduce using the LQ decomposition (if
 | 
						|
*        sufficient workspace available)
 | 
						|
*
 | 
						|
         IF( N.GE.MNTHR ) THEN
 | 
						|
*
 | 
						|
            IF( WNTVN ) THEN
 | 
						|
*
 | 
						|
*              Path 1t(N much larger than M, JOBVT='N')
 | 
						|
*              No right singular vectors to be computed
 | 
						|
*
 | 
						|
               ITAU = 1
 | 
						|
               IWORK = ITAU + M
 | 
						|
*
 | 
						|
*              Compute A=L*Q
 | 
						|
*              (Workspace: need 2*M, prefer M + M*NB)
 | 
						|
*
 | 
						|
               CALL DGELQF( M, N, A, LDA, WORK( ITAU ), WORK( IWORK ),
 | 
						|
     $                      LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*              Zero out above L
 | 
						|
*
 | 
						|
               CALL DLASET( 'U', M-1, M-1, ZERO, ZERO, A( 1, 2 ), LDA )
 | 
						|
               IE = 1
 | 
						|
               ITAUQ = IE + M
 | 
						|
               ITAUP = ITAUQ + M
 | 
						|
               IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*              Bidiagonalize L in A
 | 
						|
*              (Workspace: need 4*M, prefer 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
               CALL DGEBRD( M, M, A, LDA, S, WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                      WORK( ITAUP ), WORK( IWORK ), LWORK-IWORK+1,
 | 
						|
     $                      IERR )
 | 
						|
               IF( WNTUO .OR. WNTUAS ) THEN
 | 
						|
*
 | 
						|
*                 If left singular vectors desired, generate Q
 | 
						|
*                 (Workspace: need 4*M, prefer 3*M + M*NB)
 | 
						|
*
 | 
						|
                  CALL DORGBR( 'Q', M, M, M, A, LDA, WORK( ITAUQ ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
               END IF
 | 
						|
               IWORK = IE + M
 | 
						|
               NRU = 0
 | 
						|
               IF( WNTUO .OR. WNTUAS )
 | 
						|
     $            NRU = M
 | 
						|
*
 | 
						|
*              Perform bidiagonal QR iteration, computing left singular
 | 
						|
*              vectors of A in A if desired
 | 
						|
*              (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
               CALL DBDSQR( 'U', M, 0, NRU, 0, S, WORK( IE ), DUM, 1, A,
 | 
						|
     $                      LDA, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*              If left singular vectors desired in U, copy them there
 | 
						|
*
 | 
						|
               IF( WNTUAS )
 | 
						|
     $            CALL DLACPY( 'F', M, M, A, LDA, U, LDU )
 | 
						|
*
 | 
						|
            ELSE IF( WNTVO .AND. WNTUN ) THEN
 | 
						|
*
 | 
						|
*              Path 2t(N much larger than M, JOBU='N', JOBVT='O')
 | 
						|
*              M right singular vectors to be overwritten on A and
 | 
						|
*              no left singular vectors to be computed
 | 
						|
*
 | 
						|
               IF( LWORK.GE.M*M+MAX( 4*M, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                 Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                  IR = 1
 | 
						|
                  IF( LWORK.GE.MAX( WRKBL, LDA*N + M ) + LDA*M ) THEN
 | 
						|
*
 | 
						|
*                    WORK(IU) is LDA by N and WORK(IR) is LDA by M
 | 
						|
*
 | 
						|
                     LDWRKU = LDA
 | 
						|
                     CHUNK = N
 | 
						|
                     LDWRKR = LDA
 | 
						|
                  ELSE IF( LWORK.GE.MAX( WRKBL, LDA*N + M ) + M*M ) THEN
 | 
						|
*
 | 
						|
*                    WORK(IU) is LDA by N and WORK(IR) is M by M
 | 
						|
*
 | 
						|
                     LDWRKU = LDA
 | 
						|
                     CHUNK = N
 | 
						|
                     LDWRKR = M
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    WORK(IU) is M by CHUNK and WORK(IR) is M by M
 | 
						|
*
 | 
						|
                     LDWRKU = M
 | 
						|
                     CHUNK = ( LWORK-M*M-M ) / M
 | 
						|
                     LDWRKR = M
 | 
						|
                  END IF
 | 
						|
                  ITAU = IR + LDWRKR*M
 | 
						|
                  IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                 Compute A=L*Q
 | 
						|
*                 (Workspace: need M*M + 2*M, prefer M*M + M + M*NB)
 | 
						|
*
 | 
						|
                  CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Copy L to WORK(IR) and zero out above it
 | 
						|
*
 | 
						|
                  CALL DLACPY( 'L', M, M, A, LDA, WORK( IR ), LDWRKR )
 | 
						|
                  CALL DLASET( 'U', M-1, M-1, ZERO, ZERO,
 | 
						|
     $                         WORK( IR+LDWRKR ), LDWRKR )
 | 
						|
*
 | 
						|
*                 Generate Q in A
 | 
						|
*                 (Workspace: need M*M + 2*M, prefer M*M + M + M*NB)
 | 
						|
*
 | 
						|
                  CALL DORGLQ( M, N, M, A, LDA, WORK( ITAU ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  IE = ITAU
 | 
						|
                  ITAUQ = IE + M
 | 
						|
                  ITAUP = ITAUQ + M
 | 
						|
                  IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                 Bidiagonalize L in WORK(IR)
 | 
						|
*                 (Workspace: need M*M + 4*M, prefer M*M + 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
                  CALL DGEBRD( M, M, WORK( IR ), LDWRKR, S, WORK( IE ),
 | 
						|
     $                         WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Generate right vectors bidiagonalizing L
 | 
						|
*                 (Workspace: need M*M + 4*M-1, prefer M*M + 3*M + (M-1)*NB)
 | 
						|
*
 | 
						|
                  CALL DORGBR( 'P', M, M, M, WORK( IR ), LDWRKR,
 | 
						|
     $                         WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                         LWORK-IWORK+1, IERR )
 | 
						|
                  IWORK = IE + M
 | 
						|
*
 | 
						|
*                 Perform bidiagonal QR iteration, computing right
 | 
						|
*                 singular vectors of L in WORK(IR)
 | 
						|
*                 (Workspace: need M*M + BDSPAC)
 | 
						|
*
 | 
						|
                  CALL DBDSQR( 'U', M, M, 0, 0, S, WORK( IE ),
 | 
						|
     $                         WORK( IR ), LDWRKR, DUM, 1, DUM, 1,
 | 
						|
     $                         WORK( IWORK ), INFO )
 | 
						|
                  IU = IE + M
 | 
						|
*
 | 
						|
*                 Multiply right singular vectors of L in WORK(IR) by Q
 | 
						|
*                 in A, storing result in WORK(IU) and copying to A
 | 
						|
*                 (Workspace: need M*M + 2*M, prefer M*M + M*N + M)
 | 
						|
*
 | 
						|
                  DO 30 I = 1, N, CHUNK
 | 
						|
                     BLK = MIN( N-I+1, CHUNK )
 | 
						|
                     CALL DGEMM( 'N', 'N', M, BLK, M, ONE, WORK( IR ),
 | 
						|
     $                           LDWRKR, A( 1, I ), LDA, ZERO,
 | 
						|
     $                           WORK( IU ), LDWRKU )
 | 
						|
                     CALL DLACPY( 'F', M, BLK, WORK( IU ), LDWRKU,
 | 
						|
     $                            A( 1, I ), LDA )
 | 
						|
   30             CONTINUE
 | 
						|
*
 | 
						|
               ELSE
 | 
						|
*
 | 
						|
*                 Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                  IE = 1
 | 
						|
                  ITAUQ = IE + M
 | 
						|
                  ITAUP = ITAUQ + M
 | 
						|
                  IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                 Bidiagonalize A
 | 
						|
*                 (Workspace: need 3*M + N, prefer 3*M + (M + N)*NB)
 | 
						|
*
 | 
						|
                  CALL DGEBRD( M, N, A, LDA, S, WORK( IE ),
 | 
						|
     $                         WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Generate right vectors bidiagonalizing A
 | 
						|
*                 (Workspace: need 4*M, prefer 3*M + M*NB)
 | 
						|
*
 | 
						|
                  CALL DORGBR( 'P', M, N, M, A, LDA, WORK( ITAUP ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  IWORK = IE + M
 | 
						|
*
 | 
						|
*                 Perform bidiagonal QR iteration, computing right
 | 
						|
*                 singular vectors of A in A
 | 
						|
*                 (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                  CALL DBDSQR( 'L', M, N, 0, 0, S, WORK( IE ), A, LDA,
 | 
						|
     $                         DUM, 1, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
               END IF
 | 
						|
*
 | 
						|
            ELSE IF( WNTVO .AND. WNTUAS ) THEN
 | 
						|
*
 | 
						|
*              Path 3t(N much larger than M, JOBU='S' or 'A', JOBVT='O')
 | 
						|
*              M right singular vectors to be overwritten on A and
 | 
						|
*              M left singular vectors to be computed in U
 | 
						|
*
 | 
						|
               IF( LWORK.GE.M*M+MAX( 4*M, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                 Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                  IR = 1
 | 
						|
                  IF( LWORK.GE.MAX( WRKBL, LDA*N + M ) + LDA*M ) THEN
 | 
						|
*
 | 
						|
*                    WORK(IU) is LDA by N and WORK(IR) is LDA by M
 | 
						|
*
 | 
						|
                     LDWRKU = LDA
 | 
						|
                     CHUNK = N
 | 
						|
                     LDWRKR = LDA
 | 
						|
                  ELSE IF( LWORK.GE.MAX( WRKBL, LDA*N + M ) + M*M ) THEN
 | 
						|
*
 | 
						|
*                    WORK(IU) is LDA by N and WORK(IR) is M by M
 | 
						|
*
 | 
						|
                     LDWRKU = LDA
 | 
						|
                     CHUNK = N
 | 
						|
                     LDWRKR = M
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    WORK(IU) is M by CHUNK and WORK(IR) is M by M
 | 
						|
*
 | 
						|
                     LDWRKU = M
 | 
						|
                     CHUNK = ( LWORK-M*M-M ) / M
 | 
						|
                     LDWRKR = M
 | 
						|
                  END IF
 | 
						|
                  ITAU = IR + LDWRKR*M
 | 
						|
                  IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                 Compute A=L*Q
 | 
						|
*                 (Workspace: need M*M + 2*M, prefer M*M + M + M*NB)
 | 
						|
*
 | 
						|
                  CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Copy L to U, zeroing about above it
 | 
						|
*
 | 
						|
                  CALL DLACPY( 'L', M, M, A, LDA, U, LDU )
 | 
						|
                  CALL DLASET( 'U', M-1, M-1, ZERO, ZERO, U( 1, 2 ),
 | 
						|
     $                         LDU )
 | 
						|
*
 | 
						|
*                 Generate Q in A
 | 
						|
*                 (Workspace: need M*M + 2*M, prefer M*M + M + M*NB)
 | 
						|
*
 | 
						|
                  CALL DORGLQ( M, N, M, A, LDA, WORK( ITAU ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  IE = ITAU
 | 
						|
                  ITAUQ = IE + M
 | 
						|
                  ITAUP = ITAUQ + M
 | 
						|
                  IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                 Bidiagonalize L in U, copying result to WORK(IR)
 | 
						|
*                 (Workspace: need M*M + 4*M, prefer M*M + 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
                  CALL DGEBRD( M, M, U, LDU, S, WORK( IE ),
 | 
						|
     $                         WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  CALL DLACPY( 'U', M, M, U, LDU, WORK( IR ), LDWRKR )
 | 
						|
*
 | 
						|
*                 Generate right vectors bidiagonalizing L in WORK(IR)
 | 
						|
*                 (Workspace: need M*M + 4*M-1, prefer M*M + 3*M + (M-1)*NB)
 | 
						|
*
 | 
						|
                  CALL DORGBR( 'P', M, M, M, WORK( IR ), LDWRKR,
 | 
						|
     $                         WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                         LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Generate left vectors bidiagonalizing L in U
 | 
						|
*                 (Workspace: need M*M + 4*M, prefer M*M + 3*M + M*NB)
 | 
						|
*
 | 
						|
                  CALL DORGBR( 'Q', M, M, M, U, LDU, WORK( ITAUQ ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  IWORK = IE + M
 | 
						|
*
 | 
						|
*                 Perform bidiagonal QR iteration, computing left
 | 
						|
*                 singular vectors of L in U, and computing right
 | 
						|
*                 singular vectors of L in WORK(IR)
 | 
						|
*                 (Workspace: need M*M + BDSPAC)
 | 
						|
*
 | 
						|
                  CALL DBDSQR( 'U', M, M, M, 0, S, WORK( IE ),
 | 
						|
     $                         WORK( IR ), LDWRKR, U, LDU, DUM, 1,
 | 
						|
     $                         WORK( IWORK ), INFO )
 | 
						|
                  IU = IE + M
 | 
						|
*
 | 
						|
*                 Multiply right singular vectors of L in WORK(IR) by Q
 | 
						|
*                 in A, storing result in WORK(IU) and copying to A
 | 
						|
*                 (Workspace: need M*M + 2*M, prefer M*M + M*N + M))
 | 
						|
*
 | 
						|
                  DO 40 I = 1, N, CHUNK
 | 
						|
                     BLK = MIN( N-I+1, CHUNK )
 | 
						|
                     CALL DGEMM( 'N', 'N', M, BLK, M, ONE, WORK( IR ),
 | 
						|
     $                           LDWRKR, A( 1, I ), LDA, ZERO,
 | 
						|
     $                           WORK( IU ), LDWRKU )
 | 
						|
                     CALL DLACPY( 'F', M, BLK, WORK( IU ), LDWRKU,
 | 
						|
     $                            A( 1, I ), LDA )
 | 
						|
   40             CONTINUE
 | 
						|
*
 | 
						|
               ELSE
 | 
						|
*
 | 
						|
*                 Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                  ITAU = 1
 | 
						|
                  IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                 Compute A=L*Q
 | 
						|
*                 (Workspace: need 2*M, prefer M + M*NB)
 | 
						|
*
 | 
						|
                  CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Copy L to U, zeroing out above it
 | 
						|
*
 | 
						|
                  CALL DLACPY( 'L', M, M, A, LDA, U, LDU )
 | 
						|
                  CALL DLASET( 'U', M-1, M-1, ZERO, ZERO, U( 1, 2 ),
 | 
						|
     $                         LDU )
 | 
						|
*
 | 
						|
*                 Generate Q in A
 | 
						|
*                 (Workspace: need 2*M, prefer M + M*NB)
 | 
						|
*
 | 
						|
                  CALL DORGLQ( M, N, M, A, LDA, WORK( ITAU ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  IE = ITAU
 | 
						|
                  ITAUQ = IE + M
 | 
						|
                  ITAUP = ITAUQ + M
 | 
						|
                  IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                 Bidiagonalize L in U
 | 
						|
*                 (Workspace: need 4*M, prefer 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
                  CALL DGEBRD( M, M, U, LDU, S, WORK( IE ),
 | 
						|
     $                         WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Multiply right vectors bidiagonalizing L by Q in A
 | 
						|
*                 (Workspace: need 3*M + N, prefer 3*M + N*NB)
 | 
						|
*
 | 
						|
                  CALL DORMBR( 'P', 'L', 'T', M, N, M, U, LDU,
 | 
						|
     $                         WORK( ITAUP ), A, LDA, WORK( IWORK ),
 | 
						|
     $                         LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                 Generate left vectors bidiagonalizing L in U
 | 
						|
*                 (Workspace: need 4*M, prefer 3*M + M*NB)
 | 
						|
*
 | 
						|
                  CALL DORGBR( 'Q', M, M, M, U, LDU, WORK( ITAUQ ),
 | 
						|
     $                         WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                  IWORK = IE + M
 | 
						|
*
 | 
						|
*                 Perform bidiagonal QR iteration, computing left
 | 
						|
*                 singular vectors of A in U and computing right
 | 
						|
*                 singular vectors of A in A
 | 
						|
*                 (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                  CALL DBDSQR( 'U', M, N, M, 0, S, WORK( IE ), A, LDA,
 | 
						|
     $                         U, LDU, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
               END IF
 | 
						|
*
 | 
						|
            ELSE IF( WNTVS ) THEN
 | 
						|
*
 | 
						|
               IF( WNTUN ) THEN
 | 
						|
*
 | 
						|
*                 Path 4t(N much larger than M, JOBU='N', JOBVT='S')
 | 
						|
*                 M right singular vectors to be computed in VT and
 | 
						|
*                 no left singular vectors to be computed
 | 
						|
*
 | 
						|
                  IF( LWORK.GE.M*M+MAX( 4*M, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                    Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     IR = 1
 | 
						|
                     IF( LWORK.GE.WRKBL+LDA*M ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IR) is LDA by M
 | 
						|
*
 | 
						|
                        LDWRKR = LDA
 | 
						|
                     ELSE
 | 
						|
*
 | 
						|
*                       WORK(IR) is M by M
 | 
						|
*
 | 
						|
                        LDWRKR = M
 | 
						|
                     END IF
 | 
						|
                     ITAU = IR + LDWRKR*M
 | 
						|
                     IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                    Compute A=L*Q
 | 
						|
*                    (Workspace: need M*M + 2*M, prefer M*M + M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy L to WORK(IR), zeroing out above it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'L', M, M, A, LDA, WORK( IR ),
 | 
						|
     $                            LDWRKR )
 | 
						|
                     CALL DLASET( 'U', M-1, M-1, ZERO, ZERO,
 | 
						|
     $                            WORK( IR+LDWRKR ), LDWRKR )
 | 
						|
*
 | 
						|
*                    Generate Q in A
 | 
						|
*                    (Workspace: need M*M + 2*M, prefer M*M + M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGLQ( M, N, M, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + M
 | 
						|
                     ITAUP = ITAUQ + M
 | 
						|
                     IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                    Bidiagonalize L in WORK(IR)
 | 
						|
*                    (Workspace: need M*M + 4*M, prefer M*M + 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( M, M, WORK( IR ), LDWRKR, S,
 | 
						|
     $                            WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate right vectors bidiagonalizing L in
 | 
						|
*                    WORK(IR)
 | 
						|
*                    (Workspace: need M*M + 4*M, prefer M*M + 3*M + (M-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', M, M, M, WORK( IR ), LDWRKR,
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + M
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing right
 | 
						|
*                    singular vectors of L in WORK(IR)
 | 
						|
*                    (Workspace: need M*M + BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', M, M, 0, 0, S, WORK( IE ),
 | 
						|
     $                            WORK( IR ), LDWRKR, DUM, 1, DUM, 1,
 | 
						|
     $                            WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*                    Multiply right singular vectors of L in WORK(IR) by
 | 
						|
*                    Q in A, storing result in VT
 | 
						|
*                    (Workspace: need M*M)
 | 
						|
*
 | 
						|
                     CALL DGEMM( 'N', 'N', M, N, M, ONE, WORK( IR ),
 | 
						|
     $                           LDWRKR, A, LDA, ZERO, VT, LDVT )
 | 
						|
*
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     ITAU = 1
 | 
						|
                     IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                    Compute A=L*Q
 | 
						|
*                    (Workspace: need 2*M, prefer M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy result to VT
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'U', M, N, A, LDA, VT, LDVT )
 | 
						|
*
 | 
						|
*                    Generate Q in VT
 | 
						|
*                    (Workspace: need 2*M, prefer M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGLQ( M, N, M, VT, LDVT, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + M
 | 
						|
                     ITAUP = ITAUQ + M
 | 
						|
                     IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                    Zero out above L in A
 | 
						|
*
 | 
						|
                     CALL DLASET( 'U', M-1, M-1, ZERO, ZERO, A( 1, 2 ),
 | 
						|
     $                            LDA )
 | 
						|
*
 | 
						|
*                    Bidiagonalize L in A
 | 
						|
*                    (Workspace: need 4*M, prefer 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( M, M, A, LDA, S, WORK( IE ),
 | 
						|
     $                            WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Multiply right vectors bidiagonalizing L by Q in VT
 | 
						|
*                    (Workspace: need 3*M + N, prefer 3*M + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORMBR( 'P', 'L', 'T', M, N, M, A, LDA,
 | 
						|
     $                            WORK( ITAUP ), VT, LDVT,
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + M
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing right
 | 
						|
*                    singular vectors of A in VT
 | 
						|
*                    (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', M, N, 0, 0, S, WORK( IE ), VT,
 | 
						|
     $                            LDVT, DUM, 1, DUM, 1, WORK( IWORK ),
 | 
						|
     $                            INFO )
 | 
						|
*
 | 
						|
                  END IF
 | 
						|
*
 | 
						|
               ELSE IF( WNTUO ) THEN
 | 
						|
*
 | 
						|
*                 Path 5t(N much larger than M, JOBU='O', JOBVT='S')
 | 
						|
*                 M right singular vectors to be computed in VT and
 | 
						|
*                 M left singular vectors to be overwritten on A
 | 
						|
*
 | 
						|
                  IF( LWORK.GE.2*M*M+MAX( 4*M, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                    Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     IU = 1
 | 
						|
                     IF( LWORK.GE.WRKBL+2*LDA*M ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IU) is LDA by M and WORK(IR) is LDA by M
 | 
						|
*
 | 
						|
                        LDWRKU = LDA
 | 
						|
                        IR = IU + LDWRKU*M
 | 
						|
                        LDWRKR = LDA
 | 
						|
                     ELSE IF( LWORK.GE.WRKBL+( LDA + M )*M ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IU) is LDA by M and WORK(IR) is M by M
 | 
						|
*
 | 
						|
                        LDWRKU = LDA
 | 
						|
                        IR = IU + LDWRKU*M
 | 
						|
                        LDWRKR = M
 | 
						|
                     ELSE
 | 
						|
*
 | 
						|
*                       WORK(IU) is M by M and WORK(IR) is M by M
 | 
						|
*
 | 
						|
                        LDWRKU = M
 | 
						|
                        IR = IU + LDWRKU*M
 | 
						|
                        LDWRKR = M
 | 
						|
                     END IF
 | 
						|
                     ITAU = IR + LDWRKR*M
 | 
						|
                     IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                    Compute A=L*Q
 | 
						|
*                    (Workspace: need 2*M*M + 2*M, prefer 2*M*M + M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy L to WORK(IU), zeroing out below it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'L', M, M, A, LDA, WORK( IU ),
 | 
						|
     $                            LDWRKU )
 | 
						|
                     CALL DLASET( 'U', M-1, M-1, ZERO, ZERO,
 | 
						|
     $                            WORK( IU+LDWRKU ), LDWRKU )
 | 
						|
*
 | 
						|
*                    Generate Q in A
 | 
						|
*                    (Workspace: need 2*M*M + 2*M, prefer 2*M*M + M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGLQ( M, N, M, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + M
 | 
						|
                     ITAUP = ITAUQ + M
 | 
						|
                     IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                    Bidiagonalize L in WORK(IU), copying result to
 | 
						|
*                    WORK(IR)
 | 
						|
*                    (Workspace: need 2*M*M + 4*M,
 | 
						|
*                                prefer 2*M*M+3*M+2*M*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( M, M, WORK( IU ), LDWRKU, S,
 | 
						|
     $                            WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'L', M, M, WORK( IU ), LDWRKU,
 | 
						|
     $                            WORK( IR ), LDWRKR )
 | 
						|
*
 | 
						|
*                    Generate right bidiagonalizing vectors in WORK(IU)
 | 
						|
*                    (Workspace: need 2*M*M + 4*M-1,
 | 
						|
*                                prefer 2*M*M+3*M+(M-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', M, M, M, WORK( IU ), LDWRKU,
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate left bidiagonalizing vectors in WORK(IR)
 | 
						|
*                    (Workspace: need 2*M*M + 4*M, prefer 2*M*M + 3*M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', M, M, M, WORK( IR ), LDWRKR,
 | 
						|
     $                            WORK( ITAUQ ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + M
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of L in WORK(IR) and computing
 | 
						|
*                    right singular vectors of L in WORK(IU)
 | 
						|
*                    (Workspace: need 2*M*M + BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', M, M, M, 0, S, WORK( IE ),
 | 
						|
     $                            WORK( IU ), LDWRKU, WORK( IR ),
 | 
						|
     $                            LDWRKR, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*                    Multiply right singular vectors of L in WORK(IU) by
 | 
						|
*                    Q in A, storing result in VT
 | 
						|
*                    (Workspace: need M*M)
 | 
						|
*
 | 
						|
                     CALL DGEMM( 'N', 'N', M, N, M, ONE, WORK( IU ),
 | 
						|
     $                           LDWRKU, A, LDA, ZERO, VT, LDVT )
 | 
						|
*
 | 
						|
*                    Copy left singular vectors of L to A
 | 
						|
*                    (Workspace: need M*M)
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'F', M, M, WORK( IR ), LDWRKR, A,
 | 
						|
     $                            LDA )
 | 
						|
*
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     ITAU = 1
 | 
						|
                     IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                    Compute A=L*Q, copying result to VT
 | 
						|
*                    (Workspace: need 2*M, prefer M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'U', M, N, A, LDA, VT, LDVT )
 | 
						|
*
 | 
						|
*                    Generate Q in VT
 | 
						|
*                    (Workspace: need 2*M, prefer M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGLQ( M, N, M, VT, LDVT, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + M
 | 
						|
                     ITAUP = ITAUQ + M
 | 
						|
                     IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                    Zero out above L in A
 | 
						|
*
 | 
						|
                     CALL DLASET( 'U', M-1, M-1, ZERO, ZERO, A( 1, 2 ),
 | 
						|
     $                            LDA )
 | 
						|
*
 | 
						|
*                    Bidiagonalize L in A
 | 
						|
*                    (Workspace: need 4*M, prefer 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( M, M, A, LDA, S, WORK( IE ),
 | 
						|
     $                            WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Multiply right vectors bidiagonalizing L by Q in VT
 | 
						|
*                    (Workspace: need 3*M + N, prefer 3*M + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORMBR( 'P', 'L', 'T', M, N, M, A, LDA,
 | 
						|
     $                            WORK( ITAUP ), VT, LDVT,
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate left bidiagonalizing vectors of L in A
 | 
						|
*                    (Workspace: need 4*M, prefer 3*M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', M, M, M, A, LDA, WORK( ITAUQ ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + M
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, compute left
 | 
						|
*                    singular vectors of A in A and compute right
 | 
						|
*                    singular vectors of A in VT
 | 
						|
*                    (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', M, N, M, 0, S, WORK( IE ), VT,
 | 
						|
     $                            LDVT, A, LDA, DUM, 1, WORK( IWORK ),
 | 
						|
     $                            INFO )
 | 
						|
*
 | 
						|
                  END IF
 | 
						|
*
 | 
						|
               ELSE IF( WNTUAS ) THEN
 | 
						|
*
 | 
						|
*                 Path 6t(N much larger than M, JOBU='S' or 'A',
 | 
						|
*                         JOBVT='S')
 | 
						|
*                 M right singular vectors to be computed in VT and
 | 
						|
*                 M left singular vectors to be computed in U
 | 
						|
*
 | 
						|
                  IF( LWORK.GE.M*M+MAX( 4*M, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                    Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     IU = 1
 | 
						|
                     IF( LWORK.GE.WRKBL+LDA*M ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IU) is LDA by N
 | 
						|
*
 | 
						|
                        LDWRKU = LDA
 | 
						|
                     ELSE
 | 
						|
*
 | 
						|
*                       WORK(IU) is LDA by M
 | 
						|
*
 | 
						|
                        LDWRKU = M
 | 
						|
                     END IF
 | 
						|
                     ITAU = IU + LDWRKU*M
 | 
						|
                     IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                    Compute A=L*Q
 | 
						|
*                    (Workspace: need M*M + 2*M, prefer M*M + M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy L to WORK(IU), zeroing out above it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'L', M, M, A, LDA, WORK( IU ),
 | 
						|
     $                            LDWRKU )
 | 
						|
                     CALL DLASET( 'U', M-1, M-1, ZERO, ZERO,
 | 
						|
     $                            WORK( IU+LDWRKU ), LDWRKU )
 | 
						|
*
 | 
						|
*                    Generate Q in A
 | 
						|
*                    (Workspace: need M*M + 2*M, prefer M*M + M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGLQ( M, N, M, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + M
 | 
						|
                     ITAUP = ITAUQ + M
 | 
						|
                     IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                    Bidiagonalize L in WORK(IU), copying result to U
 | 
						|
*                    (Workspace: need M*M + 4*M, prefer M*M + 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( M, M, WORK( IU ), LDWRKU, S,
 | 
						|
     $                            WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'L', M, M, WORK( IU ), LDWRKU, U,
 | 
						|
     $                            LDU )
 | 
						|
*
 | 
						|
*                    Generate right bidiagonalizing vectors in WORK(IU)
 | 
						|
*                    (Workspace: need M*M + 4*M-1,
 | 
						|
*                                prefer M*M+3*M+(M-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', M, M, M, WORK( IU ), LDWRKU,
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate left bidiagonalizing vectors in U
 | 
						|
*                    (Workspace: need M*M + 4*M, prefer M*M + 3*M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', M, M, M, U, LDU, WORK( ITAUQ ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + M
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of L in U and computing right
 | 
						|
*                    singular vectors of L in WORK(IU)
 | 
						|
*                    (Workspace: need M*M + BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', M, M, M, 0, S, WORK( IE ),
 | 
						|
     $                            WORK( IU ), LDWRKU, U, LDU, DUM, 1,
 | 
						|
     $                            WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*                    Multiply right singular vectors of L in WORK(IU) by
 | 
						|
*                    Q in A, storing result in VT
 | 
						|
*                    (Workspace: need M*M)
 | 
						|
*
 | 
						|
                     CALL DGEMM( 'N', 'N', M, N, M, ONE, WORK( IU ),
 | 
						|
     $                           LDWRKU, A, LDA, ZERO, VT, LDVT )
 | 
						|
*
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     ITAU = 1
 | 
						|
                     IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                    Compute A=L*Q, copying result to VT
 | 
						|
*                    (Workspace: need 2*M, prefer M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'U', M, N, A, LDA, VT, LDVT )
 | 
						|
*
 | 
						|
*                    Generate Q in VT
 | 
						|
*                    (Workspace: need 2*M, prefer M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGLQ( M, N, M, VT, LDVT, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy L to U, zeroing out above it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'L', M, M, A, LDA, U, LDU )
 | 
						|
                     CALL DLASET( 'U', M-1, M-1, ZERO, ZERO, U( 1, 2 ),
 | 
						|
     $                            LDU )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + M
 | 
						|
                     ITAUP = ITAUQ + M
 | 
						|
                     IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                    Bidiagonalize L in U
 | 
						|
*                    (Workspace: need 4*M, prefer 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( M, M, U, LDU, S, WORK( IE ),
 | 
						|
     $                            WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Multiply right bidiagonalizing vectors in U by Q
 | 
						|
*                    in VT
 | 
						|
*                    (Workspace: need 3*M + N, prefer 3*M + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORMBR( 'P', 'L', 'T', M, N, M, U, LDU,
 | 
						|
     $                            WORK( ITAUP ), VT, LDVT,
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate left bidiagonalizing vectors in U
 | 
						|
*                    (Workspace: need 4*M, prefer 3*M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', M, M, M, U, LDU, WORK( ITAUQ ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + M
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of A in U and computing right
 | 
						|
*                    singular vectors of A in VT
 | 
						|
*                    (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', M, N, M, 0, S, WORK( IE ), VT,
 | 
						|
     $                            LDVT, U, LDU, DUM, 1, WORK( IWORK ),
 | 
						|
     $                            INFO )
 | 
						|
*
 | 
						|
                  END IF
 | 
						|
*
 | 
						|
               END IF
 | 
						|
*
 | 
						|
            ELSE IF( WNTVA ) THEN
 | 
						|
*
 | 
						|
               IF( WNTUN ) THEN
 | 
						|
*
 | 
						|
*                 Path 7t(N much larger than M, JOBU='N', JOBVT='A')
 | 
						|
*                 N right singular vectors to be computed in VT and
 | 
						|
*                 no left singular vectors to be computed
 | 
						|
*
 | 
						|
                  IF( LWORK.GE.M*M+MAX( N + M, 4*M, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                    Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     IR = 1
 | 
						|
                     IF( LWORK.GE.WRKBL+LDA*M ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IR) is LDA by M
 | 
						|
*
 | 
						|
                        LDWRKR = LDA
 | 
						|
                     ELSE
 | 
						|
*
 | 
						|
*                       WORK(IR) is M by M
 | 
						|
*
 | 
						|
                        LDWRKR = M
 | 
						|
                     END IF
 | 
						|
                     ITAU = IR + LDWRKR*M
 | 
						|
                     IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                    Compute A=L*Q, copying result to VT
 | 
						|
*                    (Workspace: need M*M + 2*M, prefer M*M + M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'U', M, N, A, LDA, VT, LDVT )
 | 
						|
*
 | 
						|
*                    Copy L to WORK(IR), zeroing out above it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'L', M, M, A, LDA, WORK( IR ),
 | 
						|
     $                            LDWRKR )
 | 
						|
                     CALL DLASET( 'U', M-1, M-1, ZERO, ZERO,
 | 
						|
     $                            WORK( IR+LDWRKR ), LDWRKR )
 | 
						|
*
 | 
						|
*                    Generate Q in VT
 | 
						|
*                    (Workspace: need M*M + M + N, prefer M*M + M + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGLQ( N, N, M, VT, LDVT, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + M
 | 
						|
                     ITAUP = ITAUQ + M
 | 
						|
                     IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                    Bidiagonalize L in WORK(IR)
 | 
						|
*                    (Workspace: need M*M + 4*M, prefer M*M + 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( M, M, WORK( IR ), LDWRKR, S,
 | 
						|
     $                            WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate right bidiagonalizing vectors in WORK(IR)
 | 
						|
*                    (Workspace: need M*M + 4*M-1,
 | 
						|
*                                prefer M*M+3*M+(M-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', M, M, M, WORK( IR ), LDWRKR,
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + M
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing right
 | 
						|
*                    singular vectors of L in WORK(IR)
 | 
						|
*                    (Workspace: need M*M + BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', M, M, 0, 0, S, WORK( IE ),
 | 
						|
     $                            WORK( IR ), LDWRKR, DUM, 1, DUM, 1,
 | 
						|
     $                            WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*                    Multiply right singular vectors of L in WORK(IR) by
 | 
						|
*                    Q in VT, storing result in A
 | 
						|
*                    (Workspace: need M*M)
 | 
						|
*
 | 
						|
                     CALL DGEMM( 'N', 'N', M, N, M, ONE, WORK( IR ),
 | 
						|
     $                           LDWRKR, VT, LDVT, ZERO, A, LDA )
 | 
						|
*
 | 
						|
*                    Copy right singular vectors of A from A to VT
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'F', M, N, A, LDA, VT, LDVT )
 | 
						|
*
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     ITAU = 1
 | 
						|
                     IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                    Compute A=L*Q, copying result to VT
 | 
						|
*                    (Workspace: need 2*M, prefer M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'U', M, N, A, LDA, VT, LDVT )
 | 
						|
*
 | 
						|
*                    Generate Q in VT
 | 
						|
*                    (Workspace: need M + N, prefer M + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGLQ( N, N, M, VT, LDVT, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + M
 | 
						|
                     ITAUP = ITAUQ + M
 | 
						|
                     IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                    Zero out above L in A
 | 
						|
*
 | 
						|
                     CALL DLASET( 'U', M-1, M-1, ZERO, ZERO, A( 1, 2 ),
 | 
						|
     $                            LDA )
 | 
						|
*
 | 
						|
*                    Bidiagonalize L in A
 | 
						|
*                    (Workspace: need 4*M, prefer 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( M, M, A, LDA, S, WORK( IE ),
 | 
						|
     $                            WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Multiply right bidiagonalizing vectors in A by Q
 | 
						|
*                    in VT
 | 
						|
*                    (Workspace: need 3*M + N, prefer 3*M + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORMBR( 'P', 'L', 'T', M, N, M, A, LDA,
 | 
						|
     $                            WORK( ITAUP ), VT, LDVT,
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + M
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing right
 | 
						|
*                    singular vectors of A in VT
 | 
						|
*                    (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', M, N, 0, 0, S, WORK( IE ), VT,
 | 
						|
     $                            LDVT, DUM, 1, DUM, 1, WORK( IWORK ),
 | 
						|
     $                            INFO )
 | 
						|
*
 | 
						|
                  END IF
 | 
						|
*
 | 
						|
               ELSE IF( WNTUO ) THEN
 | 
						|
*
 | 
						|
*                 Path 8t(N much larger than M, JOBU='O', JOBVT='A')
 | 
						|
*                 N right singular vectors to be computed in VT and
 | 
						|
*                 M left singular vectors to be overwritten on A
 | 
						|
*
 | 
						|
                  IF( LWORK.GE.2*M*M+MAX( N + M, 4*M, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                    Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     IU = 1
 | 
						|
                     IF( LWORK.GE.WRKBL+2*LDA*M ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IU) is LDA by M and WORK(IR) is LDA by M
 | 
						|
*
 | 
						|
                        LDWRKU = LDA
 | 
						|
                        IR = IU + LDWRKU*M
 | 
						|
                        LDWRKR = LDA
 | 
						|
                     ELSE IF( LWORK.GE.WRKBL+( LDA + M )*M ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IU) is LDA by M and WORK(IR) is M by M
 | 
						|
*
 | 
						|
                        LDWRKU = LDA
 | 
						|
                        IR = IU + LDWRKU*M
 | 
						|
                        LDWRKR = M
 | 
						|
                     ELSE
 | 
						|
*
 | 
						|
*                       WORK(IU) is M by M and WORK(IR) is M by M
 | 
						|
*
 | 
						|
                        LDWRKU = M
 | 
						|
                        IR = IU + LDWRKU*M
 | 
						|
                        LDWRKR = M
 | 
						|
                     END IF
 | 
						|
                     ITAU = IR + LDWRKR*M
 | 
						|
                     IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                    Compute A=L*Q, copying result to VT
 | 
						|
*                    (Workspace: need 2*M*M + 2*M, prefer 2*M*M + M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'U', M, N, A, LDA, VT, LDVT )
 | 
						|
*
 | 
						|
*                    Generate Q in VT
 | 
						|
*                    (Workspace: need 2*M*M + M + N, prefer 2*M*M + M + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGLQ( N, N, M, VT, LDVT, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy L to WORK(IU), zeroing out above it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'L', M, M, A, LDA, WORK( IU ),
 | 
						|
     $                            LDWRKU )
 | 
						|
                     CALL DLASET( 'U', M-1, M-1, ZERO, ZERO,
 | 
						|
     $                            WORK( IU+LDWRKU ), LDWRKU )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + M
 | 
						|
                     ITAUP = ITAUQ + M
 | 
						|
                     IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                    Bidiagonalize L in WORK(IU), copying result to
 | 
						|
*                    WORK(IR)
 | 
						|
*                    (Workspace: need 2*M*M + 4*M,
 | 
						|
*                                prefer 2*M*M+3*M+2*M*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( M, M, WORK( IU ), LDWRKU, S,
 | 
						|
     $                            WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'L', M, M, WORK( IU ), LDWRKU,
 | 
						|
     $                            WORK( IR ), LDWRKR )
 | 
						|
*
 | 
						|
*                    Generate right bidiagonalizing vectors in WORK(IU)
 | 
						|
*                    (Workspace: need 2*M*M + 4*M-1,
 | 
						|
*                                prefer 2*M*M+3*M+(M-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', M, M, M, WORK( IU ), LDWRKU,
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate left bidiagonalizing vectors in WORK(IR)
 | 
						|
*                    (Workspace: need 2*M*M + 4*M, prefer 2*M*M + 3*M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', M, M, M, WORK( IR ), LDWRKR,
 | 
						|
     $                            WORK( ITAUQ ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + M
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of L in WORK(IR) and computing
 | 
						|
*                    right singular vectors of L in WORK(IU)
 | 
						|
*                    (Workspace: need 2*M*M + BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', M, M, M, 0, S, WORK( IE ),
 | 
						|
     $                            WORK( IU ), LDWRKU, WORK( IR ),
 | 
						|
     $                            LDWRKR, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*                    Multiply right singular vectors of L in WORK(IU) by
 | 
						|
*                    Q in VT, storing result in A
 | 
						|
*                    (Workspace: need M*M)
 | 
						|
*
 | 
						|
                     CALL DGEMM( 'N', 'N', M, N, M, ONE, WORK( IU ),
 | 
						|
     $                           LDWRKU, VT, LDVT, ZERO, A, LDA )
 | 
						|
*
 | 
						|
*                    Copy right singular vectors of A from A to VT
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'F', M, N, A, LDA, VT, LDVT )
 | 
						|
*
 | 
						|
*                    Copy left singular vectors of A from WORK(IR) to A
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'F', M, M, WORK( IR ), LDWRKR, A,
 | 
						|
     $                            LDA )
 | 
						|
*
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     ITAU = 1
 | 
						|
                     IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                    Compute A=L*Q, copying result to VT
 | 
						|
*                    (Workspace: need 2*M, prefer M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'U', M, N, A, LDA, VT, LDVT )
 | 
						|
*
 | 
						|
*                    Generate Q in VT
 | 
						|
*                    (Workspace: need M + N, prefer M + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGLQ( N, N, M, VT, LDVT, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + M
 | 
						|
                     ITAUP = ITAUQ + M
 | 
						|
                     IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                    Zero out above L in A
 | 
						|
*
 | 
						|
                     CALL DLASET( 'U', M-1, M-1, ZERO, ZERO, A( 1, 2 ),
 | 
						|
     $                            LDA )
 | 
						|
*
 | 
						|
*                    Bidiagonalize L in A
 | 
						|
*                    (Workspace: need 4*M, prefer 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( M, M, A, LDA, S, WORK( IE ),
 | 
						|
     $                            WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Multiply right bidiagonalizing vectors in A by Q
 | 
						|
*                    in VT
 | 
						|
*                    (Workspace: need 3*M + N, prefer 3*M + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORMBR( 'P', 'L', 'T', M, N, M, A, LDA,
 | 
						|
     $                            WORK( ITAUP ), VT, LDVT,
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate left bidiagonalizing vectors in A
 | 
						|
*                    (Workspace: need 4*M, prefer 3*M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', M, M, M, A, LDA, WORK( ITAUQ ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + M
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of A in A and computing right
 | 
						|
*                    singular vectors of A in VT
 | 
						|
*                    (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', M, N, M, 0, S, WORK( IE ), VT,
 | 
						|
     $                            LDVT, A, LDA, DUM, 1, WORK( IWORK ),
 | 
						|
     $                            INFO )
 | 
						|
*
 | 
						|
                  END IF
 | 
						|
*
 | 
						|
               ELSE IF( WNTUAS ) THEN
 | 
						|
*
 | 
						|
*                 Path 9t(N much larger than M, JOBU='S' or 'A',
 | 
						|
*                         JOBVT='A')
 | 
						|
*                 N right singular vectors to be computed in VT and
 | 
						|
*                 M left singular vectors to be computed in U
 | 
						|
*
 | 
						|
                  IF( LWORK.GE.M*M+MAX( N + M, 4*M, BDSPAC ) ) THEN
 | 
						|
*
 | 
						|
*                    Sufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     IU = 1
 | 
						|
                     IF( LWORK.GE.WRKBL+LDA*M ) THEN
 | 
						|
*
 | 
						|
*                       WORK(IU) is LDA by M
 | 
						|
*
 | 
						|
                        LDWRKU = LDA
 | 
						|
                     ELSE
 | 
						|
*
 | 
						|
*                       WORK(IU) is M by M
 | 
						|
*
 | 
						|
                        LDWRKU = M
 | 
						|
                     END IF
 | 
						|
                     ITAU = IU + LDWRKU*M
 | 
						|
                     IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                    Compute A=L*Q, copying result to VT
 | 
						|
*                    (Workspace: need M*M + 2*M, prefer M*M + M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'U', M, N, A, LDA, VT, LDVT )
 | 
						|
*
 | 
						|
*                    Generate Q in VT
 | 
						|
*                    (Workspace: need M*M + M + N, prefer M*M + M + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGLQ( N, N, M, VT, LDVT, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy L to WORK(IU), zeroing out above it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'L', M, M, A, LDA, WORK( IU ),
 | 
						|
     $                            LDWRKU )
 | 
						|
                     CALL DLASET( 'U', M-1, M-1, ZERO, ZERO,
 | 
						|
     $                            WORK( IU+LDWRKU ), LDWRKU )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + M
 | 
						|
                     ITAUP = ITAUQ + M
 | 
						|
                     IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                    Bidiagonalize L in WORK(IU), copying result to U
 | 
						|
*                    (Workspace: need M*M + 4*M, prefer M*M + 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( M, M, WORK( IU ), LDWRKU, S,
 | 
						|
     $                            WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'L', M, M, WORK( IU ), LDWRKU, U,
 | 
						|
     $                            LDU )
 | 
						|
*
 | 
						|
*                    Generate right bidiagonalizing vectors in WORK(IU)
 | 
						|
*                    (Workspace: need M*M + 4*M, prefer M*M + 3*M + (M-1)*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'P', M, M, M, WORK( IU ), LDWRKU,
 | 
						|
     $                            WORK( ITAUP ), WORK( IWORK ),
 | 
						|
     $                            LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate left bidiagonalizing vectors in U
 | 
						|
*                    (Workspace: need M*M + 4*M, prefer M*M + 3*M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', M, M, M, U, LDU, WORK( ITAUQ ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + M
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of L in U and computing right
 | 
						|
*                    singular vectors of L in WORK(IU)
 | 
						|
*                    (Workspace: need M*M + BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', M, M, M, 0, S, WORK( IE ),
 | 
						|
     $                            WORK( IU ), LDWRKU, U, LDU, DUM, 1,
 | 
						|
     $                            WORK( IWORK ), INFO )
 | 
						|
*
 | 
						|
*                    Multiply right singular vectors of L in WORK(IU) by
 | 
						|
*                    Q in VT, storing result in A
 | 
						|
*                    (Workspace: need M*M)
 | 
						|
*
 | 
						|
                     CALL DGEMM( 'N', 'N', M, N, M, ONE, WORK( IU ),
 | 
						|
     $                           LDWRKU, VT, LDVT, ZERO, A, LDA )
 | 
						|
*
 | 
						|
*                    Copy right singular vectors of A from A to VT
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'F', M, N, A, LDA, VT, LDVT )
 | 
						|
*
 | 
						|
                  ELSE
 | 
						|
*
 | 
						|
*                    Insufficient workspace for a fast algorithm
 | 
						|
*
 | 
						|
                     ITAU = 1
 | 
						|
                     IWORK = ITAU + M
 | 
						|
*
 | 
						|
*                    Compute A=L*Q, copying result to VT
 | 
						|
*                    (Workspace: need 2*M, prefer M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DGELQF( M, N, A, LDA, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     CALL DLACPY( 'U', M, N, A, LDA, VT, LDVT )
 | 
						|
*
 | 
						|
*                    Generate Q in VT
 | 
						|
*                    (Workspace: need M + N, prefer M + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORGLQ( N, N, M, VT, LDVT, WORK( ITAU ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Copy L to U, zeroing out above it
 | 
						|
*
 | 
						|
                     CALL DLACPY( 'L', M, M, A, LDA, U, LDU )
 | 
						|
                     CALL DLASET( 'U', M-1, M-1, ZERO, ZERO, U( 1, 2 ),
 | 
						|
     $                            LDU )
 | 
						|
                     IE = ITAU
 | 
						|
                     ITAUQ = IE + M
 | 
						|
                     ITAUP = ITAUQ + M
 | 
						|
                     IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*                    Bidiagonalize L in U
 | 
						|
*                    (Workspace: need 4*M, prefer 3*M + 2*M*NB)
 | 
						|
*
 | 
						|
                     CALL DGEBRD( M, M, U, LDU, S, WORK( IE ),
 | 
						|
     $                            WORK( ITAUQ ), WORK( ITAUP ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Multiply right bidiagonalizing vectors in U by Q
 | 
						|
*                    in VT
 | 
						|
*                    (Workspace: need 3*M + N, prefer 3*M + N*NB)
 | 
						|
*
 | 
						|
                     CALL DORMBR( 'P', 'L', 'T', M, N, M, U, LDU,
 | 
						|
     $                            WORK( ITAUP ), VT, LDVT,
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
*
 | 
						|
*                    Generate left bidiagonalizing vectors in U
 | 
						|
*                    (Workspace: need 4*M, prefer 3*M + M*NB)
 | 
						|
*
 | 
						|
                     CALL DORGBR( 'Q', M, M, M, U, LDU, WORK( ITAUQ ),
 | 
						|
     $                            WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
                     IWORK = IE + M
 | 
						|
*
 | 
						|
*                    Perform bidiagonal QR iteration, computing left
 | 
						|
*                    singular vectors of A in U and computing right
 | 
						|
*                    singular vectors of A in VT
 | 
						|
*                    (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
                     CALL DBDSQR( 'U', M, N, M, 0, S, WORK( IE ), VT,
 | 
						|
     $                            LDVT, U, LDU, DUM, 1, WORK( IWORK ),
 | 
						|
     $                            INFO )
 | 
						|
*
 | 
						|
                  END IF
 | 
						|
*
 | 
						|
               END IF
 | 
						|
*
 | 
						|
            END IF
 | 
						|
*
 | 
						|
         ELSE
 | 
						|
*
 | 
						|
*           N .LT. MNTHR
 | 
						|
*
 | 
						|
*           Path 10t(N greater than M, but not much larger)
 | 
						|
*           Reduce to bidiagonal form without LQ decomposition
 | 
						|
*
 | 
						|
            IE = 1
 | 
						|
            ITAUQ = IE + M
 | 
						|
            ITAUP = ITAUQ + M
 | 
						|
            IWORK = ITAUP + M
 | 
						|
*
 | 
						|
*           Bidiagonalize A
 | 
						|
*           (Workspace: need 3*M + N, prefer 3*M + (M + N)*NB)
 | 
						|
*
 | 
						|
            CALL DGEBRD( M, N, A, LDA, S, WORK( IE ), WORK( ITAUQ ),
 | 
						|
     $                   WORK( ITAUP ), WORK( IWORK ), LWORK-IWORK+1,
 | 
						|
     $                   IERR )
 | 
						|
            IF( WNTUAS ) THEN
 | 
						|
*
 | 
						|
*              If left singular vectors desired in U, copy result to U
 | 
						|
*              and generate left bidiagonalizing vectors in U
 | 
						|
*              (Workspace: need 4*M-1, prefer 3*M + (M-1)*NB)
 | 
						|
*
 | 
						|
               CALL DLACPY( 'L', M, M, A, LDA, U, LDU )
 | 
						|
               CALL DORGBR( 'Q', M, M, N, U, LDU, WORK( ITAUQ ),
 | 
						|
     $                      WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
            END IF
 | 
						|
            IF( WNTVAS ) THEN
 | 
						|
*
 | 
						|
*              If right singular vectors desired in VT, copy result to
 | 
						|
*              VT and generate right bidiagonalizing vectors in VT
 | 
						|
*              (Workspace: need 3*M + NRVT, prefer 3*M + NRVT*NB)
 | 
						|
*
 | 
						|
               CALL DLACPY( 'U', M, N, A, LDA, VT, LDVT )
 | 
						|
               IF( WNTVA )
 | 
						|
     $            NRVT = N
 | 
						|
               IF( WNTVS )
 | 
						|
     $            NRVT = M
 | 
						|
               CALL DORGBR( 'P', NRVT, N, M, VT, LDVT, WORK( ITAUP ),
 | 
						|
     $                      WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
            END IF
 | 
						|
            IF( WNTUO ) THEN
 | 
						|
*
 | 
						|
*              If left singular vectors desired in A, generate left
 | 
						|
*              bidiagonalizing vectors in A
 | 
						|
*              (Workspace: need 4*M-1, prefer 3*M + (M-1)*NB)
 | 
						|
*
 | 
						|
               CALL DORGBR( 'Q', M, M, N, A, LDA, WORK( ITAUQ ),
 | 
						|
     $                      WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
            END IF
 | 
						|
            IF( WNTVO ) THEN
 | 
						|
*
 | 
						|
*              If right singular vectors desired in A, generate right
 | 
						|
*              bidiagonalizing vectors in A
 | 
						|
*              (Workspace: need 4*M, prefer 3*M + M*NB)
 | 
						|
*
 | 
						|
               CALL DORGBR( 'P', M, N, M, A, LDA, WORK( ITAUP ),
 | 
						|
     $                      WORK( IWORK ), LWORK-IWORK+1, IERR )
 | 
						|
            END IF
 | 
						|
            IWORK = IE + M
 | 
						|
            IF( WNTUAS .OR. WNTUO )
 | 
						|
     $         NRU = M
 | 
						|
            IF( WNTUN )
 | 
						|
     $         NRU = 0
 | 
						|
            IF( WNTVAS .OR. WNTVO )
 | 
						|
     $         NCVT = N
 | 
						|
            IF( WNTVN )
 | 
						|
     $         NCVT = 0
 | 
						|
            IF( ( .NOT.WNTUO ) .AND. ( .NOT.WNTVO ) ) THEN
 | 
						|
*
 | 
						|
*              Perform bidiagonal QR iteration, if desired, computing
 | 
						|
*              left singular vectors in U and computing right singular
 | 
						|
*              vectors in VT
 | 
						|
*              (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
               CALL DBDSQR( 'L', M, NCVT, NRU, 0, S, WORK( IE ), VT,
 | 
						|
     $                      LDVT, U, LDU, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
            ELSE IF( ( .NOT.WNTUO ) .AND. WNTVO ) THEN
 | 
						|
*
 | 
						|
*              Perform bidiagonal QR iteration, if desired, computing
 | 
						|
*              left singular vectors in U and computing right singular
 | 
						|
*              vectors in A
 | 
						|
*              (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
               CALL DBDSQR( 'L', M, NCVT, NRU, 0, S, WORK( IE ), A, LDA,
 | 
						|
     $                      U, LDU, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
            ELSE
 | 
						|
*
 | 
						|
*              Perform bidiagonal QR iteration, if desired, computing
 | 
						|
*              left singular vectors in A and computing right singular
 | 
						|
*              vectors in VT
 | 
						|
*              (Workspace: need BDSPAC)
 | 
						|
*
 | 
						|
               CALL DBDSQR( 'L', M, NCVT, NRU, 0, S, WORK( IE ), VT,
 | 
						|
     $                      LDVT, A, LDA, DUM, 1, WORK( IWORK ), INFO )
 | 
						|
            END IF
 | 
						|
*
 | 
						|
         END IF
 | 
						|
*
 | 
						|
      END IF
 | 
						|
*
 | 
						|
*     If DBDSQR failed to converge, copy unconverged superdiagonals
 | 
						|
*     to WORK( 2:MINMN )
 | 
						|
*
 | 
						|
      IF( INFO.NE.0 ) THEN
 | 
						|
         IF( IE.GT.2 ) THEN
 | 
						|
            DO 50 I = 1, MINMN - 1
 | 
						|
               WORK( I+1 ) = WORK( I+IE-1 )
 | 
						|
   50       CONTINUE
 | 
						|
         END IF
 | 
						|
         IF( IE.LT.2 ) THEN
 | 
						|
            DO 60 I = MINMN - 1, 1, -1
 | 
						|
               WORK( I+1 ) = WORK( I+IE-1 )
 | 
						|
   60       CONTINUE
 | 
						|
         END IF
 | 
						|
      END IF
 | 
						|
*
 | 
						|
*     Undo scaling if necessary
 | 
						|
*
 | 
						|
      IF( ISCL.EQ.1 ) THEN
 | 
						|
         IF( ANRM.GT.BIGNUM )
 | 
						|
     $      CALL DLASCL( 'G', 0, 0, BIGNUM, ANRM, MINMN, 1, S, MINMN,
 | 
						|
     $                   IERR )
 | 
						|
         IF( INFO.NE.0 .AND. ANRM.GT.BIGNUM )
 | 
						|
     $      CALL DLASCL( 'G', 0, 0, BIGNUM, ANRM, MINMN-1, 1, WORK( 2 ),
 | 
						|
     $                   MINMN, IERR )
 | 
						|
         IF( ANRM.LT.SMLNUM )
 | 
						|
     $      CALL DLASCL( 'G', 0, 0, SMLNUM, ANRM, MINMN, 1, S, MINMN,
 | 
						|
     $                   IERR )
 | 
						|
         IF( INFO.NE.0 .AND. ANRM.LT.SMLNUM )
 | 
						|
     $      CALL DLASCL( 'G', 0, 0, SMLNUM, ANRM, MINMN-1, 1, WORK( 2 ),
 | 
						|
     $                   MINMN, IERR )
 | 
						|
      END IF
 | 
						|
*
 | 
						|
*     Return optimal workspace in WORK(1)
 | 
						|
*
 | 
						|
      WORK( 1 ) = MAXWRK
 | 
						|
*
 | 
						|
      RETURN
 | 
						|
*
 | 
						|
*     End of DGESVD
 | 
						|
*
 | 
						|
      END
 |