cgesdd_8f_source.html

*> \brief \b CGESDD

*

*  =========== DOCUMENTATION ===========

*

* Online html documentation available at

*            http://www.netlib.org/lapack/explore-html/

*

*> \htmlonly

*> Download CGESDD + dependencies

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/cgesdd.f">

*> [TGZ]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/cgesdd.f">

*> [ZIP]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/cgesdd.f">

*> [TXT]</a>

*> \endhtmlonly

*

*  Definition:

*  ===========

*

*       SUBROUTINE CGESDD( JOBZ, M, N, A, LDA, S, U, LDU, VT, LDVT,

*                          WORK, LWORK, RWORK, IWORK, INFO )

*

*       .. Scalar Arguments ..

*       CHARACTER          JOBZ

*       INTEGER            INFO, LDA, LDU, LDVT, LWORK, M, N

*       ..

*       .. Array Arguments ..

*       INTEGER            IWORK( * )

*       REAL               RWORK( * ), S( * )

*       COMPLEX            A( LDA, * ), U( LDU, * ), VT( LDVT, * ),

*      $                   WORK( * )

*       ..

*

*

*> \par Purpose:

*  =============

*>

*> \verbatim

*>

*> CGESDD computes the singular value decomposition (SVD) of a complex

*> M-by-N matrix A, optionally computing the left and/or right singular

*> vectors, by using a divide-and-conquer method. The SVD is written

*>

*>      A = U * SIGMA * conjugate-transpose(V)

*>

*> where SIGMA is an M-by-N matrix which is zero except for its

*> min(m,n) diagonal elements, U is an M-by-M unitary matrix, and

*> V is an N-by-N unitary matrix.  The diagonal elements of SIGMA

*> are the singular values of A; they are real and non-negative, and

*> are returned in descending order.  The first min(m,n) columns of

*> U and V are the left and right singular vectors of A.

*>

*> Note that the routine returns VT = V**H, not V.

*>

*> The divide and conquer algorithm makes very mild assumptions about

*> floating point arithmetic. It will work on machines with a guard

*> digit in add/subtract, or on those binary machines without guard

*> digits which subtract like the Cray X-MP, Cray Y-MP, Cray C-90, or

*> Cray-2. It could conceivably fail on hexadecimal or decimal machines

*> without guard digits, but we know of none.

*> \endverbatim

*

*  Arguments:

*  ==========

*

*> \param[in] JOBZ

*> \verbatim

*>          JOBZ is CHARACTER*1

*>          Specifies options for computing all or part of the matrices
*>          U and V**H:

*>          = 'A':  all M columns of U and all N rows of V**H are

*>                  returned in the arrays U and VT;

*>          = 'S':  the first min(M,N) columns of U and the first

*>                  min(M,N) rows of V**H are returned in the arrays U

*>                  and VT;

*>          = 'O':  If M >= N, the first N columns of U are overwritten

*>                  in the array A and all rows of V**H are returned in

*>                  the array VT;

*>                  otherwise, all columns of U are returned in the

*>                  array U and the first M rows of V**H are overwritten

*>                  in the array A;

*>          = 'N':  no columns of U or rows of V**H are computed.

*> \endverbatim

*>

*> \param[in] M

*> \verbatim

*>          M is INTEGER

*>          The number of rows of the input matrix A.  M >= 0.

*> \endverbatim

*>

*> \param[in] N

*> \verbatim

*>          N is INTEGER

*>          The number of columns of the input matrix A.  N >= 0.

*> \endverbatim

*>

*> \param[in,out] A

*> \verbatim

*>          A is COMPLEX array, dimension (LDA,N)

*>          On entry, the M-by-N matrix A.

*>          On exit,

*>          if JOBZ = 'O',  A is overwritten with the first N columns

*>                          of U (the left singular vectors, stored

*>                          columnwise) if M >= N;

*>                          A is overwritten with the first M rows

*>                          of V**H (the right singular vectors, stored

*>                          rowwise) otherwise.

*>          if JOBZ .ne. 'O', the contents of A are destroyed.

*> \endverbatim

*>

*> \param[in] LDA

*> \verbatim

*>          LDA is INTEGER

*>          The leading dimension of the array A.  LDA >= max(1,M).

*> \endverbatim

*>

*> \param[out] S

*> \verbatim

*>          S is REAL array, dimension (min(M,N))

*>          The singular values of A, sorted so that S(i) >= S(i+1).

*> \endverbatim

*>

*> \param[out] U

*> \verbatim

*>          U is COMPLEX array, dimension (LDU,UCOL)

*>          UCOL = M if JOBZ = 'A' or JOBZ = 'O' and M < N;

*>          UCOL = min(M,N) if JOBZ = 'S'.

*>          If JOBZ = 'A' or JOBZ = 'O' and M < N, U contains the M-by-M

*>          unitary matrix U;

*>          if JOBZ = 'S', U contains the first min(M,N) columns of U

*>          (the left singular vectors, stored columnwise);

*>          if JOBZ = 'O' and M >= N, or JOBZ = 'N', U is not referenced.

*> \endverbatim

*>

*> \param[in] LDU

*> \verbatim

*>          LDU is INTEGER

*>          The leading dimension of the array U.  LDU >= 1;

*>          if JOBZ = 'S' or 'A' or JOBZ = 'O' and M < N, LDU >= M.

*> \endverbatim

*>

*> \param[out] VT

*> \verbatim

*>          VT is COMPLEX array, dimension (LDVT,N)

*>          If JOBZ = 'A' or JOBZ = 'O' and M >= N, VT contains the

*>          N-by-N unitary matrix V**H;

*>          if JOBZ = 'S', VT contains the first min(M,N) rows of

*>          V**H (the right singular vectors, stored rowwise);

*>          if JOBZ = 'O' and M < N, or JOBZ = 'N', VT is not referenced.

*> \endverbatim

*>

*> \param[in] LDVT

*> \verbatim

*>          LDVT is INTEGER

*>          The leading dimension of the array VT.  LDVT >= 1;

*>          if JOBZ = 'A' or JOBZ = 'O' and M >= N, LDVT >= N;

*>          if JOBZ = 'S', LDVT >= min(M,N).

*> \endverbatim

*>

*> \param[out] WORK

*> \verbatim

*>          WORK is COMPLEX array, dimension (MAX(1,LWORK))

*>          On exit, if INFO = 0, WORK(1) returns the optimal LWORK.

*> \endverbatim

*>

*> \param[in] LWORK

*> \verbatim

*>          LWORK is INTEGER

*>          The dimension of the array WORK. LWORK >= 1.

*>          If LWORK = -1, a workspace query is assumed.  The optimal

*>          size for the WORK array is calculated and stored in WORK(1),

*>          and no other work except argument checking is performed.

*>

*>          Let mx = max(M,N) and mn = min(M,N).

*>          If JOBZ = 'N', LWORK >= 2*mn + mx.

*>          If JOBZ = 'O', LWORK >= 2*mn*mn + 2*mn + mx.

*>          If JOBZ = 'S', LWORK >=   mn*mn + 3*mn.

*>          If JOBZ = 'A', LWORK >=   mn*mn + 2*mn + mx.

*>          These are not tight minimums in all cases; see comments inside code.

*>          For good performance, LWORK should generally be larger;

*>          a query is recommended.

*> \endverbatim

*>

*> \param[out] RWORK

*> \verbatim

*>          RWORK is REAL array, dimension (MAX(1,LRWORK))

*>          Let mx = max(M,N) and mn = min(M,N).

*>          If JOBZ = 'N',    LRWORK >= 5*mn (LAPACK <= 3.6 needs 7*mn);

*>          else if mx >> mn, LRWORK >= 5*mn*mn + 5*mn;

*>          else              LRWORK >= max( 5*mn*mn + 5*mn,

*>                                           2*mx*mn + 2*mn*mn + mn ).

*> \endverbatim

*>

*> \param[out] IWORK

*> \verbatim

*>          IWORK is INTEGER array, dimension (8*min(M,N))

*> \endverbatim

*>

*> \param[out] INFO

*> \verbatim

*>          INFO is INTEGER

*>          <  0:  if INFO = -i, the i-th argument had an illegal value.

*>          = -4:  if A had a NaN entry.

*>          >  0:  The updating process of SBDSDC did not converge.

*>          =  0:  successful exit.

*> \endverbatim

*

*  Authors:

*  ========

*

*> \author Univ. of Tennessee

*> \author Univ. of California Berkeley

*> \author Univ. of Colorado Denver

*> \author NAG Ltd.

*

*> \ingroup complexGEsing

*

*> \par Contributors:

*  ==================

*>

*>     Ming Gu and Huan Ren, Computer Science Division, University of

*>     California at Berkeley, USA

*>

*  =====================================================================


      SUBROUTINE cgesdd( JOBZ, M, N, A, LDA, S, U, LDU, VT, LDVT,

     $                   WORK, LWORK, RWORK, IWORK, INFO )

      implicit none

*

*  -- LAPACK driver routine --

*  -- LAPACK is a software package provided by Univ. of Tennessee,    --

*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd.  --

*

*     .. Scalar Arguments ..

      CHARACTER          JOBZ

      INTEGER            INFO, LDA, LDU, LDVT, LWORK, M, N

*     ..

*     .. Array Arguments ..

      INTEGER            IWORK( * )

      REAL               RWORK( * ), S( * )

      COMPLEX            A( LDA, * ), U( LDU, * ), VT( LDVT, * ),

     $                   work( * )

*     ..

*

*  =====================================================================

*

*     .. Parameters ..

      COMPLEX            CZERO, CONE

      parameter( czero = ( 0.0e+0, 0.0e+0 ),

     $                   cone = ( 1.0e+0, 0.0e+0 ) )

      REAL               ZERO, ONE

      parameter( zero = 0.0e+0, one = 1.0e+0 )

*     ..

*     .. Local Scalars ..

      LOGICAL            LQUERY, WNTQA, WNTQAS, WNTQN, WNTQO, WNTQS

      INTEGER            BLK, CHUNK, I, IE, IERR, IL, IR, IRU, IRVT,

     $                   iscl, itau, itaup, itauq, iu, ivt, ldwkvt,

     $                   ldwrkl, ldwrkr, ldwrku, maxwrk, minmn, minwrk,

     $                   mnthr1, mnthr2, nrwork, nwork, wrkbl

      INTEGER            LWORK_CGEBRD_MN, LWORK_CGEBRD_MM,

     $                   lwork_cgebrd_nn, lwork_cgelqf_mn,

     $                   lwork_cgeqrf_mn,

     $                   lwork_cungbr_p_mn, lwork_cungbr_p_nn,

     $                   lwork_cungbr_q_mn, lwork_cungbr_q_mm,

     $                   lwork_cunglq_mn, lwork_cunglq_nn,

     $                   lwork_cungqr_mm, lwork_cungqr_mn,

     $                   lwork_cunmbr_prc_mm, lwork_cunmbr_qln_mm,

     $                   lwork_cunmbr_prc_mn, lwork_cunmbr_qln_mn,

     $                   lwork_cunmbr_prc_nn, lwork_cunmbr_qln_nn

      REAL   ANRM, BIGNUM, EPS, SMLNUM

*     ..

*     .. Local Arrays ..

      INTEGER            IDUM( 1 )

      REAL               DUM( 1 )

      COMPLEX            CDUM( 1 )

*     ..

*     .. External Subroutines ..

      EXTERNAL           cgebrd, cgelqf, cgemm, cgeqrf, clacp2, clacpy,

     $                   clacrm, clarcm, clascl, claset, cungbr, cunglq,

     $                   cungqr, cunmbr, sbdsdc, slascl, xerbla

*     ..

*     .. External Functions ..

      LOGICAL            LSAME, SISNAN

      REAL               SLAMCH, CLANGE, SROUNDUP_LWORK

      EXTERNAL           lsame, slamch, clange, sisnan,

     $                   sroundup_lwork

*     ..

*     .. Intrinsic Functions ..

      INTRINSIC          int, max, min, sqrt

*     ..

*     .. Executable Statements ..

*

*     Test the input arguments

*

      info   = 0

      minmn  = min( m, n )

      mnthr1 = int( minmn*17.0e0 / 9.0e0 )

      mnthr2 = int( minmn*5.0e0 / 3.0e0 )

      wntqa  = lsame( jobz, 'A' )

      wntqs  = lsame( jobz, 'S' )

      wntqas = wntqa .OR. wntqs

      wntqo  = lsame( jobz, 'O' )

      wntqn  = lsame( jobz, 'N' )

      lquery = ( lwork.EQ.-1 )

      minwrk = 1

      maxwrk = 1

*

      IF( .NOT.( wntqa .OR. wntqs .OR. wntqo .OR. wntqn ) ) THEN

         info = -1

      ELSE IF( m.LT.0 ) THEN

         info = -2

      ELSE IF( n.LT.0 ) THEN

         info = -3

      ELSE IF( lda.LT.max( 1, m ) ) THEN

         info = -5

      ELSE IF( ldu.LT.1 .OR. ( wntqas .AND. ldu.LT.m ) .OR.

     $         ( wntqo .AND. m.LT.n .AND. ldu.LT.m ) ) THEN

         info = -8

      ELSE IF( ldvt.LT.1 .OR. ( wntqa .AND. ldvt.LT.n ) .OR.

     $         ( wntqs .AND. ldvt.LT.minmn ) .OR.

     $         ( wntqo .AND. m.GE.n .AND. ldvt.LT.n ) ) THEN

         info = -10

      END IF

*

*     Compute workspace

*       Note: Comments in the code beginning "Workspace:" describe the

*       minimal amount of workspace allocated at that point in the code,

*       as well as the preferred amount for good performance.

*       CWorkspace refers to complex workspace, and RWorkspace to

*       real workspace. NB refers to the optimal block size for the

*       immediately following subroutine, as returned by ILAENV.

*

      IF( info.EQ.0 ) THEN

         minwrk = 1

         maxwrk = 1

         IF( m.GE.n .AND. minmn.GT.0 ) THEN

*

*           There is no complex work space needed for bidiagonal SVD

*           The real work space needed for bidiagonal SVD (sbdsdc) is

*           BDSPAC = 3*N*N + 4*N for singular values and vectors;

*           BDSPAC = 4*N         for singular values only;

*           not including e, RU, and RVT matrices.

*

*           Compute space preferred for each routine

            CALL cgebrd( m, n, cdum(1), m, dum(1), dum(1), cdum(1),

     $                   cdum(1), cdum(1), -1, ierr )

            lwork_cgebrd_mn = int( cdum(1) )

*

            CALL cgebrd( n, n, cdum(1), n, dum(1), dum(1), cdum(1),

     $                   cdum(1), cdum(1), -1, ierr )

            lwork_cgebrd_nn = int( cdum(1) )

*

            CALL cgeqrf( m, n, cdum(1), m, cdum(1), cdum(1), -1, ierr )

            lwork_cgeqrf_mn = int( cdum(1) )

*

            CALL cungbr( 'P', n, n, n, cdum(1), n, cdum(1), cdum(1),

     $                   -1, ierr )

            lwork_cungbr_p_nn = int( cdum(1) )

*

            CALL cungbr( 'Q', m, m, n, cdum(1), m, cdum(1), cdum(1),

     $                   -1, ierr )

            lwork_cungbr_q_mm = int( cdum(1) )

*

            CALL cungbr( 'Q', m, n, n, cdum(1), m, cdum(1), cdum(1),

     $                   -1, ierr )

            lwork_cungbr_q_mn = int( cdum(1) )

*

            CALL cungqr( m, m, n, cdum(1), m, cdum(1), cdum(1),

     $                   -1, ierr )

            lwork_cungqr_mm = int( cdum(1) )

*

            CALL cungqr( m, n, n, cdum(1), m, cdum(1), cdum(1),

     $                   -1, ierr )

            lwork_cungqr_mn = int( cdum(1) )

*

            CALL cunmbr( 'P', 'R', 'C', n, n, n, cdum(1), n, cdum(1),

     $                   cdum(1), n, cdum(1), -1, ierr )

            lwork_cunmbr_prc_nn = int( cdum(1) )

*

            CALL cunmbr( 'Q', 'L', 'N', m, m, n, cdum(1), m, cdum(1),

     $                   cdum(1), m, cdum(1), -1, ierr )

            lwork_cunmbr_qln_mm = int( cdum(1) )

*

            CALL cunmbr( 'Q', 'L', 'N', m, n, n, cdum(1), m, cdum(1),

     $                   cdum(1), m, cdum(1), -1, ierr )

            lwork_cunmbr_qln_mn = int( cdum(1) )

*

            CALL cunmbr( 'Q', 'L', 'N', n, n, n, cdum(1), n, cdum(1),

     $                   cdum(1), n, cdum(1), -1, ierr )

            lwork_cunmbr_qln_nn = int( cdum(1) )

*

            IF( m.GE.mnthr1 ) THEN

               IF( wntqn ) THEN

*

*                 Path 1 (M >> N, JOBZ='N')

*

                  maxwrk = n + lwork_cgeqrf_mn

                  maxwrk = max( maxwrk, 2*n + lwork_cgebrd_nn )

                  minwrk = 3*n

               ELSE IF( wntqo ) THEN

*

*                 Path 2 (M >> N, JOBZ='O')

*

                  wrkbl = n + lwork_cgeqrf_mn

                  wrkbl = max( wrkbl,   n + lwork_cungqr_mn )

                  wrkbl = max( wrkbl, 2*n + lwork_cgebrd_nn )

                  wrkbl = max( wrkbl, 2*n + lwork_cunmbr_qln_nn )

                  wrkbl = max( wrkbl, 2*n + lwork_cunmbr_prc_nn )

                  maxwrk = m*n + n*n + wrkbl

                  minwrk = 2*n*n + 3*n

               ELSE IF( wntqs ) THEN

*

*                 Path 3 (M >> N, JOBZ='S')

*

                  wrkbl = n + lwork_cgeqrf_mn

                  wrkbl = max( wrkbl,   n + lwork_cungqr_mn )

                  wrkbl = max( wrkbl, 2*n + lwork_cgebrd_nn )

                  wrkbl = max( wrkbl, 2*n + lwork_cunmbr_qln_nn )

                  wrkbl = max( wrkbl, 2*n + lwork_cunmbr_prc_nn )

                  maxwrk = n*n + wrkbl

                  minwrk = n*n + 3*n

               ELSE IF( wntqa ) THEN

*

*                 Path 4 (M >> N, JOBZ='A')

*

                  wrkbl = n + lwork_cgeqrf_mn

                  wrkbl = max( wrkbl,   n + lwork_cungqr_mm )

                  wrkbl = max( wrkbl, 2*n + lwork_cgebrd_nn )

                  wrkbl = max( wrkbl, 2*n + lwork_cunmbr_qln_nn )

                  wrkbl = max( wrkbl, 2*n + lwork_cunmbr_prc_nn )

                  maxwrk = n*n + wrkbl

                  minwrk = n*n + max( 3*n, n + m )

               END IF

            ELSE IF( m.GE.mnthr2 ) THEN

*

*              Path 5 (M >> N, but not as much as MNTHR1)

*

               maxwrk = 2*n + lwork_cgebrd_mn

               minwrk = 2*n + m

               IF( wntqo ) THEN

*                 Path 5o (M >> N, JOBZ='O')

                  maxwrk = max( maxwrk, 2*n + lwork_cungbr_p_nn )

                  maxwrk = max( maxwrk, 2*n + lwork_cungbr_q_mn )

                  maxwrk = maxwrk + m*n

                  minwrk = minwrk + n*n

               ELSE IF( wntqs ) THEN

*                 Path 5s (M >> N, JOBZ='S')

                  maxwrk = max( maxwrk, 2*n + lwork_cungbr_p_nn )

                  maxwrk = max( maxwrk, 2*n + lwork_cungbr_q_mn )

               ELSE IF( wntqa ) THEN

*                 Path 5a (M >> N, JOBZ='A')

                  maxwrk = max( maxwrk, 2*n + lwork_cungbr_p_nn )

                  maxwrk = max( maxwrk, 2*n + lwork_cungbr_q_mm )

               END IF

            ELSE

*

*              Path 6 (M >= N, but not much larger)

*

               maxwrk = 2*n + lwork_cgebrd_mn

               minwrk = 2*n + m

               IF( wntqo ) THEN

*                 Path 6o (M >= N, JOBZ='O')

                  maxwrk = max( maxwrk, 2*n + lwork_cunmbr_prc_nn )

                  maxwrk = max( maxwrk, 2*n + lwork_cunmbr_qln_mn )

                  maxwrk = maxwrk + m*n

                  minwrk = minwrk + n*n

               ELSE IF( wntqs ) THEN

*                 Path 6s (M >= N, JOBZ='S')

                  maxwrk = max( maxwrk, 2*n + lwork_cunmbr_qln_mn )

                  maxwrk = max( maxwrk, 2*n + lwork_cunmbr_prc_nn )

               ELSE IF( wntqa ) THEN

*                 Path 6a (M >= N, JOBZ='A')

                  maxwrk = max( maxwrk, 2*n + lwork_cunmbr_qln_mm )

                  maxwrk = max( maxwrk, 2*n + lwork_cunmbr_prc_nn )

               END IF

            END IF

         ELSE IF( minmn.GT.0 ) THEN

*

*           There is no complex work space needed for bidiagonal SVD

*           The real work space needed for bidiagonal SVD (sbdsdc) is

*           BDSPAC = 3*M*M + 4*M for singular values and vectors;

*           BDSPAC = 4*M         for singular values only;

*           not including e, RU, and RVT matrices.

*

*           Compute space preferred for each routine

            CALL cgebrd( m, n, cdum(1), m, dum(1), dum(1), cdum(1),

     $                   cdum(1), cdum(1), -1, ierr )

            lwork_cgebrd_mn = int( cdum(1) )

*

            CALL cgebrd( m, m, cdum(1), m, dum(1), dum(1), cdum(1),

     $                   cdum(1), cdum(1), -1, ierr )

            lwork_cgebrd_mm = int( cdum(1) )

*

            CALL cgelqf( m, n, cdum(1), m, cdum(1), cdum(1), -1, ierr )

            lwork_cgelqf_mn = int( cdum(1) )

*

            CALL cungbr( 'P', m, n, m, cdum(1), m, cdum(1), cdum(1),

     $                   -1, ierr )

            lwork_cungbr_p_mn = int( cdum(1) )

*

            CALL cungbr( 'P', n, n, m, cdum(1), n, cdum(1), cdum(1),

     $                   -1, ierr )

            lwork_cungbr_p_nn = int( cdum(1) )

*

            CALL cungbr( 'Q', m, m, n, cdum(1), m, cdum(1), cdum(1),

     $                   -1, ierr )

            lwork_cungbr_q_mm = int( cdum(1) )

*

            CALL cunglq( m, n, m, cdum(1), m, cdum(1), cdum(1),

     $                   -1, ierr )

            lwork_cunglq_mn = int( cdum(1) )

*

            CALL cunglq( n, n, m, cdum(1), n, cdum(1), cdum(1),

     $                   -1, ierr )

            lwork_cunglq_nn = int( cdum(1) )

*

            CALL cunmbr( 'P', 'R', 'C', m, m, m, cdum(1), m, cdum(1),

     $                   cdum(1), m, cdum(1), -1, ierr )

            lwork_cunmbr_prc_mm = int( cdum(1) )

*

            CALL cunmbr( 'P', 'R', 'C', m, n, m, cdum(1), m, cdum(1),

     $                   cdum(1), m, cdum(1), -1, ierr )

            lwork_cunmbr_prc_mn = int( cdum(1) )

*

            CALL cunmbr( 'P', 'R', 'C', n, n, m, cdum(1), n, cdum(1),

     $                   cdum(1), n, cdum(1), -1, ierr )

            lwork_cunmbr_prc_nn = int( cdum(1) )

*

            CALL cunmbr( 'Q', 'L', 'N', m, m, m, cdum(1), m, cdum(1),

     $                   cdum(1), m, cdum(1), -1, ierr )

            lwork_cunmbr_qln_mm = int( cdum(1) )

*

            IF( n.GE.mnthr1 ) THEN

               IF( wntqn ) THEN

*

*                 Path 1t (N >> M, JOBZ='N')

*

                  maxwrk = m + lwork_cgelqf_mn

                  maxwrk = max( maxwrk, 2*m + lwork_cgebrd_mm )

                  minwrk = 3*m

               ELSE IF( wntqo ) THEN

*

*                 Path 2t (N >> M, JOBZ='O')

*

                  wrkbl = m + lwork_cgelqf_mn

                  wrkbl = max( wrkbl,   m + lwork_cunglq_mn )

                  wrkbl = max( wrkbl, 2*m + lwork_cgebrd_mm )

                  wrkbl = max( wrkbl, 2*m + lwork_cunmbr_qln_mm )

                  wrkbl = max( wrkbl, 2*m + lwork_cunmbr_prc_mm )

                  maxwrk = m*n + m*m + wrkbl

                  minwrk = 2*m*m + 3*m

               ELSE IF( wntqs ) THEN

*

*                 Path 3t (N >> M, JOBZ='S')

*

                  wrkbl = m + lwork_cgelqf_mn

                  wrkbl = max( wrkbl,   m + lwork_cunglq_mn )

                  wrkbl = max( wrkbl, 2*m + lwork_cgebrd_mm )

                  wrkbl = max( wrkbl, 2*m + lwork_cunmbr_qln_mm )

                  wrkbl = max( wrkbl, 2*m + lwork_cunmbr_prc_mm )

                  maxwrk = m*m + wrkbl

                  minwrk = m*m + 3*m

               ELSE IF( wntqa ) THEN

*

*                 Path 4t (N >> M, JOBZ='A')

*

                  wrkbl = m + lwork_cgelqf_mn

                  wrkbl = max( wrkbl,   m + lwork_cunglq_nn )

                  wrkbl = max( wrkbl, 2*m + lwork_cgebrd_mm )

                  wrkbl = max( wrkbl, 2*m + lwork_cunmbr_qln_mm )

                  wrkbl = max( wrkbl, 2*m + lwork_cunmbr_prc_mm )

                  maxwrk = m*m + wrkbl

                  minwrk = m*m + max( 3*m, m + n )

               END IF

            ELSE IF( n.GE.mnthr2 ) THEN

*

*              Path 5t (N >> M, but not as much as MNTHR1)

*

               maxwrk = 2*m + lwork_cgebrd_mn

               minwrk = 2*m + n

               IF( wntqo ) THEN

*                 Path 5to (N >> M, JOBZ='O')

                  maxwrk = max( maxwrk, 2*m + lwork_cungbr_q_mm )

                  maxwrk = max( maxwrk, 2*m + lwork_cungbr_p_mn )

                  maxwrk = maxwrk + m*n

                  minwrk = minwrk + m*m

               ELSE IF( wntqs ) THEN

*                 Path 5ts (N >> M, JOBZ='S')

                  maxwrk = max( maxwrk, 2*m + lwork_cungbr_q_mm )

                  maxwrk = max( maxwrk, 2*m + lwork_cungbr_p_mn )

               ELSE IF( wntqa ) THEN

*                 Path 5ta (N >> M, JOBZ='A')

                  maxwrk = max( maxwrk, 2*m + lwork_cungbr_q_mm )

                  maxwrk = max( maxwrk, 2*m + lwork_cungbr_p_nn )

               END IF

            ELSE

*

*              Path 6t (N > M, but not much larger)

*

               maxwrk = 2*m + lwork_cgebrd_mn

               minwrk = 2*m + n

               IF( wntqo ) THEN

*                 Path 6to (N > M, JOBZ='O')

                  maxwrk = max( maxwrk, 2*m + lwork_cunmbr_qln_mm )

                  maxwrk = max( maxwrk, 2*m + lwork_cunmbr_prc_mn )

                  maxwrk = maxwrk + m*n

                  minwrk = minwrk + m*m

               ELSE IF( wntqs ) THEN

*                 Path 6ts (N > M, JOBZ='S')

                  maxwrk = max( maxwrk, 2*m + lwork_cunmbr_qln_mm )

                  maxwrk = max( maxwrk, 2*m + lwork_cunmbr_prc_mn )

               ELSE IF( wntqa ) THEN

*                 Path 6ta (N > M, JOBZ='A')

                  maxwrk = max( maxwrk, 2*m + lwork_cunmbr_qln_mm )

                  maxwrk = max( maxwrk, 2*m + lwork_cunmbr_prc_nn )

               END IF

            END IF

         END IF

         maxwrk = max( maxwrk, minwrk )

      END IF

      IF( info.EQ.0 ) THEN

         work( 1 ) = sroundup_lwork( maxwrk )

         IF( lwork.LT.minwrk .AND. .NOT. lquery ) THEN

            info = -12

         END IF

      END IF

*

      IF( info.NE.0 ) THEN

         CALL xerbla( 'CGESDD', -info )

         RETURN

      ELSE IF( lquery ) THEN

         RETURN

      END IF

*

*     Quick return if possible

*

      IF( m.EQ.0 .OR. n.EQ.0 ) THEN

         RETURN

      END IF

*

*     Get machine constants

*

      eps = slamch( 'P' )

      smlnum = sqrt( slamch( 'S' ) ) / eps

      bignum = one / smlnum

*

*     Scale A if max element outside range [SMLNUM,BIGNUM]

*

      anrm = clange( 'M', m, n, a, lda, dum )

      IF( sisnan( anrm ) ) THEN

          info = -4

          RETURN

      END IF

      iscl = 0

      IF( anrm.GT.zero .AND. anrm.LT.smlnum ) THEN

         iscl = 1

         CALL clascl( 'G', 0, 0, anrm, smlnum, m, n, a, lda, ierr )

      ELSE IF( anrm.GT.bignum ) THEN

         iscl = 1

         CALL clascl( 'G', 0, 0, anrm, bignum, m, n, a, lda, ierr )

      END IF

*

      IF( m.GE.n ) THEN

*

*        A has at least as many rows as columns. If A has sufficiently

*        more rows than columns, first reduce using the QR

*        decomposition (if sufficient workspace available)

*

         IF( m.GE.mnthr1 ) THEN

*

            IF( wntqn ) THEN

*

*              Path 1 (M >> N, JOBZ='N')

*              No singular vectors to be computed

*

               itau = 1

               nwork = itau + n

*

*              Compute A=Q*R

*              CWorkspace: need   N [tau] + N    [work]

*              CWorkspace: prefer N [tau] + N*NB [work]

*              RWorkspace: need   0

*

               CALL cgeqrf( m, n, a, lda, work( itau ), work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Zero out below R

*

               CALL claset( 'L', n-1, n-1, czero, czero, a( 2, 1 ),

     $                      lda )

               ie = 1

               itauq = 1

               itaup = itauq + n

               nwork = itaup + n

*

*              Bidiagonalize R in A

*              CWorkspace: need   2*N [tauq, taup] + N      [work]

*              CWorkspace: prefer 2*N [tauq, taup] + 2*N*NB [work]

*              RWorkspace: need   N [e]

*

               CALL cgebrd( n, n, a, lda, s, rwork( ie ), work( itauq ),

     $                      work( itaup ), work( nwork ), lwork-nwork+1,

     $                      ierr )

               nrwork = ie + n

*

*              Perform bidiagonal SVD, compute singular values only

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + BDSPAC

*

               CALL sbdsdc( 'U', 'N', n, s, rwork( ie ), dum,1,dum,1,

     $                      dum, idum, rwork( nrwork ), iwork, info )

*

            ELSE IF( wntqo ) THEN

*

*              Path 2 (M >> N, JOBZ='O')

*              N left singular vectors to be overwritten on A and

*              N right singular vectors to be computed in VT

*

               iu = 1

*

*              WORK(IU) is N by N

*

               ldwrku = n

               ir = iu + ldwrku*n

               IF( lwork .GE. m*n + n*n + 3*n ) THEN

*

*                 WORK(IR) is M by N

*

                  ldwrkr = m

               ELSE

                  ldwrkr = ( lwork - n*n - 3*n ) / n

               END IF

               itau = ir + ldwrkr*n

               nwork = itau + n

*

*              Compute A=Q*R

*              CWorkspace: need   N*N [U] + N*N [R] + N [tau] + N    [work]

*              CWorkspace: prefer N*N [U] + N*N [R] + N [tau] + N*NB [work]

*              RWorkspace: need   0

*

               CALL cgeqrf( m, n, a, lda, work( itau ), work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Copy R to WORK( IR ), zeroing out below it

*

               CALL clacpy( 'U', n, n, a, lda, work( ir ), ldwrkr )

               CALL claset( 'L', n-1, n-1, czero, czero, work( ir+1 ),

     $                      ldwrkr )

*

*              Generate Q in A

*              CWorkspace: need   N*N [U] + N*N [R] + N [tau] + N    [work]

*              CWorkspace: prefer N*N [U] + N*N [R] + N [tau] + N*NB [work]

*              RWorkspace: need   0

*

               CALL cungqr( m, n, n, a, lda, work( itau ),

     $                      work( nwork ), lwork-nwork+1, ierr )

               ie = 1

               itauq = itau

               itaup = itauq + n

               nwork = itaup + n

*

*              Bidiagonalize R in WORK(IR)

*              CWorkspace: need   N*N [U] + N*N [R] + 2*N [tauq, taup] + N      [work]

*              CWorkspace: prefer N*N [U] + N*N [R] + 2*N [tauq, taup] + 2*N*NB [work]

*              RWorkspace: need   N [e]

*

               CALL cgebrd( n, n, work( ir ), ldwrkr, s, rwork( ie ),

     $                      work( itauq ), work( itaup ), work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Perform bidiagonal SVD, computing left singular vectors

*              of R in RWORK(IRU) and computing right singular vectors

*              of R in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT] + BDSPAC

*

               iru = ie + n

               irvt = iru + n*n

               nrwork = irvt + n*n

               CALL sbdsdc( 'U', 'I', n, s, rwork( ie ), rwork( iru ),

     $                      n, rwork( irvt ), n, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Copy real matrix RWORK(IRU) to complex matrix WORK(IU)

*              Overwrite WORK(IU) by the left singular vectors of R

*              CWorkspace: need   N*N [U] + N*N [R] + 2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer N*N [U] + N*N [R] + 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   0

*

               CALL clacp2( 'F', n, n, rwork( iru ), n, work( iu ),

     $                      ldwrku )

               CALL cunmbr( 'Q', 'L', 'N', n, n, n, work( ir ), ldwrkr,

     $                      work( itauq ), work( iu ), ldwrku,

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Copy real matrix RWORK(IRVT) to complex matrix VT

*              Overwrite VT by the right singular vectors of R

*              CWorkspace: need   N*N [U] + N*N [R] + 2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer N*N [U] + N*N [R] + 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   0

*

               CALL clacp2( 'F', n, n, rwork( irvt ), n, vt, ldvt )

               CALL cunmbr( 'P', 'R', 'C', n, n, n, work( ir ), ldwrkr,

     $                      work( itaup ), vt, ldvt, work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Multiply Q in A by left singular vectors of R in

*              WORK(IU), storing result in WORK(IR) and copying to A

*              CWorkspace: need   N*N [U] + N*N [R]

*              CWorkspace: prefer N*N [U] + M*N [R]

*              RWorkspace: need   0

*

               DO 10 i = 1, m, ldwrkr

                  chunk = min( m-i+1, ldwrkr )

                  CALL cgemm( 'N', 'N', chunk, n, n, cone, a( i, 1 ),

     $                        lda, work( iu ), ldwrku, czero,

     $                        work( ir ), ldwrkr )

                  CALL clacpy( 'f', CHUNK, N, WORK( IR ), LDWRKR,

     $                         A( I, 1 ), LDA )

   10          CONTINUE

*

            ELSE IF( WNTQS ) THEN

*

*              Path 3 (M >> N, JOBZ='S')

*              N left singular vectors to be computed in U and

*              N right singular vectors to be computed in VT

*

               IR = 1

*

*              WORK(IR) is N by N

*

               LDWRKR = N

               ITAU = IR + LDWRKR*N

               NWORK = ITAU + N

*

*              Compute A=Q*R

*              CWorkspace: need   N*N [R] + N [tau] + N    [work]

*              CWorkspace: prefer N*N [R] + N [tau] + N*NB [work]

*              RWorkspace: need   0

*

               CALL CGEQRF( M, N, A, LDA, WORK( ITAU ), WORK( NWORK ),

     $                      LWORK-NWORK+1, IERR )

*

*              Copy R to WORK(IR), zeroing out below it

*

               CALL CLACPY( 'u', N, N, A, LDA, WORK( IR ), LDWRKR )

               CALL CLASET( 'l', N-1, N-1, CZERO, CZERO, WORK( IR+1 ),

     $                      LDWRKR )

*

*              Generate Q in A

*              CWorkspace: need   N*N [R] + N [tau] + N    [work]

*              CWorkspace: prefer N*N [R] + N [tau] + N*NB [work]

*              RWorkspace: need   0

*

               CALL CUNGQR( M, N, N, A, LDA, WORK( ITAU ),

     $                      WORK( NWORK ), LWORK-NWORK+1, IERR )

               IE = 1

               ITAUQ = ITAU

               ITAUP = ITAUQ + N

               NWORK = ITAUP + N

*

*              Bidiagonalize R in WORK(IR)

*              CWorkspace: need   N*N [R] + 2*N [tauq, taup] + N      [work]

*              CWorkspace: prefer N*N [R] + 2*N [tauq, taup] + 2*N*NB [work]

*              RWorkspace: need   N [e]

*

               CALL CGEBRD( N, N, WORK( IR ), LDWRKR, S, RWORK( IE ),

     $                      WORK( ITAUQ ), WORK( ITAUP ), WORK( NWORK ),

     $                      LWORK-NWORK+1, IERR )

*

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT] + BDSPAC

*

               IRU = IE + N

               IRVT = IRU + N*N

               NRWORK = IRVT + N*N

               CALL SBDSDC( 'u', 'i', N, S, RWORK( IE ), RWORK( IRU ),

     $                      N, RWORK( IRVT ), N, DUM, IDUM,

     $                      RWORK( NRWORK ), IWORK, INFO )

*

*              Copy real matrix RWORK(IRU) to complex matrix U

*              Overwrite U by left singular vectors of R

*              CWorkspace: need   N*N [R] + 2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer N*N [R] + 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   0

*

               CALL CLACP2( 'f', N, N, RWORK( IRU ), N, U, LDU )

               CALL CUNMBR( 'q', 'l', 'n', N, N, N, WORK( IR ), LDWRKR,

     $                      WORK( ITAUQ ), U, LDU, WORK( NWORK ),

     $                      LWORK-NWORK+1, IERR )

*

*              Copy real matrix RWORK(IRVT) to complex matrix VT

*              Overwrite VT by right singular vectors of R

*              CWorkspace: need   N*N [R] + 2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer N*N [R] + 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   0

*

               CALL CLACP2( 'f', N, N, RWORK( IRVT ), N, VT, LDVT )

               CALL CUNMBR( 'p', 'r', 'c', N, N, N, WORK( IR ), LDWRKR,

     $                      WORK( ITAUP ), VT, LDVT, WORK( NWORK ),

     $                      LWORK-NWORK+1, IERR )

*

*              Multiply Q in A by left singular vectors of R in

*              WORK(IR), storing result in U

*              CWorkspace: need   N*N [R]

*              RWorkspace: need   0

*

               CALL CLACPY( 'f', N, N, U, LDU, WORK( IR ), LDWRKR )

               CALL CGEMM( 'n', 'n', M, N, N, CONE, A, LDA, WORK( IR ),

     $                     LDWRKR, CZERO, U, LDU )

*

            ELSE IF( WNTQA ) THEN

*

*              Path 4 (M >> N, JOBZ='A')

*              M left singular vectors to be computed in U and

*              N right singular vectors to be computed in VT

*

               IU = 1

*

*              WORK(IU) is N by N

*

               LDWRKU = N

               ITAU = IU + LDWRKU*N

               NWORK = ITAU + N

*

*              Compute A=Q*R, copying result to U

*              CWorkspace: need   N*N [U] + N [tau] + N    [work]

*              CWorkspace: prefer N*N [U] + N [tau] + N*NB [work]

*              RWorkspace: need   0

*

               CALL CGEQRF( M, N, A, LDA, WORK( ITAU ), WORK( NWORK ),

     $                      LWORK-NWORK+1, IERR )

               CALL CLACPY( 'l', M, N, A, LDA, U, LDU )

*

*              Generate Q in U

*              CWorkspace: need   N*N [U] + N [tau] + M    [work]

*              CWorkspace: prefer N*N [U] + N [tau] + M*NB [work]

*              RWorkspace: need   0

*

               CALL CUNGQR( M, M, N, U, LDU, WORK( ITAU ),

     $                      WORK( NWORK ), LWORK-NWORK+1, IERR )

*

*              Produce R in A, zeroing out below it

*

               CALL CLASET( 'l', N-1, N-1, CZERO, CZERO, A( 2, 1 ),

     $                      LDA )

               IE = 1

               ITAUQ = ITAU

               ITAUP = ITAUQ + N

               NWORK = ITAUP + N

*

*              Bidiagonalize R in A

*              CWorkspace: need   N*N [U] + 2*N [tauq, taup] + N      [work]

*              CWorkspace: prefer N*N [U] + 2*N [tauq, taup] + 2*N*NB [work]

*              RWorkspace: need   N [e]

*

               CALL CGEBRD( N, N, A, LDA, S, RWORK( IE ), WORK( ITAUQ ),

     $                      WORK( ITAUP ), WORK( NWORK ), LWORK-NWORK+1,

     $                      IERR )

               IRU = IE + N

               IRVT = IRU + N*N

               NRWORK = IRVT + N*N

*

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT] + BDSPAC

*

               CALL SBDSDC( 'u', 'i', N, S, RWORK( IE ), RWORK( IRU ),

     $                      N, RWORK( IRVT ), N, DUM, IDUM,

     $                      RWORK( NRWORK ), IWORK, INFO )

*

*              Copy real matrix RWORK(IRU) to complex matrix WORK(IU)

*              Overwrite WORK(IU) by left singular vectors of R

*              CWorkspace: need   N*N [U] + 2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer N*N [U] + 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   0

*

               CALL CLACP2( 'f', N, N, RWORK( IRU ), N, WORK( IU ),

     $                      LDWRKU )

               CALL CUNMBR( 'q', 'l', 'n', n, n, n, a, lda,

     $                      work( itauq ), work( iu ), ldwrku,

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Copy real matrix RWORK(IRVT) to complex matrix VT

*              Overwrite VT by right singular vectors of R

*              CWorkspace: need   N*N [U] + 2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer N*N [U] + 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   0

*

               CALL clacp2( 'F', n, n, rwork( irvt ), n, vt, ldvt )

               CALL cunmbr( 'P', 'R', 'C', n, n, n, a, lda,

     $                      work( itaup ), vt, ldvt, work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Multiply Q in U by left singular vectors of R in

*              WORK(IU), storing result in A

*              CWorkspace: need   N*N [U]

*              RWorkspace: need   0

*

               CALL cgemm( 'N', 'N', m, n, n, cone, u, ldu, work( iu ),

     $                     ldwrku, czero, a, lda )

*

*              Copy left singular vectors of A from A to U

*

               CALL clacpy( 'F', m, n, a, lda, u, ldu )

*

            END IF

*

         ELSE IF( m.GE.mnthr2 ) THEN

*

*           MNTHR2 <= M < MNTHR1

*

*           Path 5 (M >> N, but not as much as MNTHR1)

*           Reduce to bidiagonal form without QR decomposition, use

*           CUNGBR and matrix multiplication to compute singular vectors

*

            ie = 1

            nrwork = ie + n

            itauq = 1

            itaup = itauq + n

            nwork = itaup + n

*

*           Bidiagonalize A

*           CWorkspace: need   2*N [tauq, taup] + M        [work]

*           CWorkspace: prefer 2*N [tauq, taup] + (M+N)*NB [work]

*           RWorkspace: need   N [e]

*

            CALL cgebrd( m, n, a, lda, s, rwork( ie ), work( itauq ),

     $                   work( itaup ), work( nwork ), lwork-nwork+1,

     $                   ierr )

            IF( wntqn ) THEN

*

*              Path 5n (M >> N, JOBZ='N')

*              Compute singular values only

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + BDSPAC

*

               CALL sbdsdc( 'U', 'N', n, s, rwork( ie ), dum, 1,dum,1,

     $                      dum, idum, rwork( nrwork ), iwork, info )

            ELSE IF( wntqo ) THEN

               iu = nwork

               iru = nrwork

               irvt = iru + n*n

               nrwork = irvt + n*n

*

*              Path 5o (M >> N, JOBZ='O')

*              Copy A to VT, generate P**H

*              CWorkspace: need   2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   0

*

               CALL clacpy( 'U', n, n, a, lda, vt, ldvt )

               CALL cungbr( 'P', n, n, n, vt, ldvt, work( itaup ),

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Generate Q in A

*              CWorkspace: need   2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   0

*

               CALL cungbr( 'Q', m, n, n, a, lda, work( itauq ),

     $                      work( nwork ), lwork-nwork+1, ierr )

*

               IF( lwork .GE. m*n + 3*n ) THEN

*

*                 WORK( IU ) is M by N

*

                  ldwrku = m

               ELSE

*

*                 WORK(IU) is LDWRKU by N

*

                  ldwrku = ( lwork - 3*n ) / n

               END IF

               nwork = iu + ldwrku*n

*

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT] + BDSPAC

*

               CALL sbdsdc( 'U', 'I', n, s, rwork( ie ), rwork( iru ),

     $                      n, rwork( irvt ), n, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Multiply real matrix RWORK(IRVT) by P**H in VT,

*              storing the result in WORK(IU), copying to VT

*              CWorkspace: need   2*N [tauq, taup] + N*N [U]

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT] + 2*N*N [rwork]

*

               CALL clarcm( n, n, rwork( irvt ), n, vt, ldvt,

     $                      work( iu ), ldwrku, rwork( nrwork ) )

               CALL clacpy( 'F', n, n, work( iu ), ldwrku, vt, ldvt )

*

*              Multiply Q in A by real matrix RWORK(IRU), storing the

*              result in WORK(IU), copying to A

*              CWorkspace: need   2*N [tauq, taup] + N*N [U]

*              CWorkspace: prefer 2*N [tauq, taup] + M*N [U]

*              RWorkspace: need   N [e] + N*N [RU] + 2*N*N [rwork]

*              RWorkspace: prefer N [e] + N*N [RU] + 2*M*N [rwork] < N + 5*N*N since M < 2*N here

*

               nrwork = irvt

               DO 20 i = 1, m, ldwrku

                  chunk = min( m-i+1, ldwrku )

                  CALL clacrm( chunk, n, a( i, 1 ), lda, rwork( iru ),

     $                         n, work( iu ), ldwrku, rwork( nrwork ) )

                  CALL clacpy( 'F', chunk, n, work( iu ), ldwrku,

     $                         a( i, 1 ), lda )

   20          CONTINUE

*

            ELSE IF( wntqs ) THEN

*

*              Path 5s (M >> N, JOBZ='S')

*              Copy A to VT, generate P**H

*              CWorkspace: need   2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   0

*

               CALL clacpy( 'U', n, n, a, lda, vt, ldvt )

               CALL cungbr( 'P', n, n, n, vt, ldvt, work( itaup ),

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Copy A to U, generate Q

*              CWorkspace: need   2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   0

*

               CALL clacpy( 'L', m, n, a, lda, u, ldu )

               CALL cungbr( 'Q', m, n, n, u, ldu, work( itauq ),

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT] + BDSPAC

*

               iru = nrwork

               irvt = iru + n*n

               nrwork = irvt + n*n

               CALL sbdsdc( 'U', 'I', n, s, rwork( ie ), rwork( iru ),

     $                      n, rwork( irvt ), n, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Multiply real matrix RWORK(IRVT) by P**H in VT,

*              storing the result in A, copying to VT

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT] + 2*N*N [rwork]

*

               CALL clarcm( n, n, rwork( irvt ), n, vt, ldvt, a, lda,

     $                      rwork( nrwork ) )

               CALL clacpy( 'F', n, n, a, lda, vt, ldvt )

*

*              Multiply Q in U by real matrix RWORK(IRU), storing the

*              result in A, copying to U

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + N*N [RU] + 2*M*N [rwork] < N + 5*N*N since M < 2*N here

*

               nrwork = irvt

               CALL clacrm( m, n, u, ldu, rwork( iru ), n, a, lda,

     $                      rwork( nrwork ) )

               CALL clacpy( 'F', m, n, a, lda, u, ldu )

            ELSE

*

*              Path 5a (M >> N, JOBZ='A')

*              Copy A to VT, generate P**H

*              CWorkspace: need   2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   0

*

               CALL clacpy( 'U', n, n, a, lda, vt, ldvt )

               CALL cungbr( 'P', n, n, n, vt, ldvt, work( itaup ),

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Copy A to U, generate Q

*              CWorkspace: need   2*N [tauq, taup] + M    [work]

*              CWorkspace: prefer 2*N [tauq, taup] + M*NB [work]

*              RWorkspace: need   0

*

               CALL clacpy( 'L', m, n, a, lda, u, ldu )

               CALL cungbr( 'Q', m, m, n, u, ldu, work( itauq ),

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT] + BDSPAC

*

               iru = nrwork

               irvt = iru + n*n

               nrwork = irvt + n*n

               CALL sbdsdc( 'U', 'I', n, s, rwork( ie ), rwork( iru ),

     $                      n, rwork( irvt ), n, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Multiply real matrix RWORK(IRVT) by P**H in VT,

*              storing the result in A, copying to VT

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT] + 2*N*N [rwork]

*

               CALL clarcm( n, n, rwork( irvt ), n, vt, ldvt, a, lda,

     $                      rwork( nrwork ) )

               CALL clacpy( 'F', n, n, a, lda, vt, ldvt )

*

*              Multiply Q in U by real matrix RWORK(IRU), storing the

*              result in A, copying to U

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + N*N [RU] + 2*M*N [rwork] < N + 5*N*N since M < 2*N here

*

               nrwork = irvt

               CALL clacrm( m, n, u, ldu, rwork( iru ), n, a, lda,

     $                      rwork( nrwork ) )

               CALL clacpy( 'F', m, n, a, lda, u, ldu )

            END IF

*

         ELSE

*

*           M .LT. MNTHR2

*

*           Path 6 (M >= N, but not much larger)

*           Reduce to bidiagonal form without QR decomposition

*           Use CUNMBR to compute singular vectors

*

            ie = 1

            nrwork = ie + n

            itauq = 1

            itaup = itauq + n

            nwork = itaup + n

*

*           Bidiagonalize A

*           CWorkspace: need   2*N [tauq, taup] + M        [work]

*           CWorkspace: prefer 2*N [tauq, taup] + (M+N)*NB [work]

*           RWorkspace: need   N [e]

*

            CALL cgebrd( m, n, a, lda, s, rwork( ie ), work( itauq ),

     $                   work( itaup ), work( nwork ), lwork-nwork+1,

     $                   ierr )

            IF( wntqn ) THEN

*

*              Path 6n (M >= N, JOBZ='N')

*              Compute singular values only

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + BDSPAC

*

               CALL sbdsdc( 'U', 'N', n, s, rwork( ie ), dum,1,dum,1,

     $                      dum, idum, rwork( nrwork ), iwork, info )

            ELSE IF( wntqo ) THEN

               iu = nwork

               iru = nrwork

               irvt = iru + n*n

               nrwork = irvt + n*n

               IF( lwork .GE. m*n + 3*n ) THEN

*

*                 WORK( IU ) is M by N

*

                  ldwrku = m

               ELSE

*

*                 WORK( IU ) is LDWRKU by N

*

                  ldwrku = ( lwork - 3*n ) / n

               END IF

               nwork = iu + ldwrku*n

*

*              Path 6o (M >= N, JOBZ='O')

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT] + BDSPAC

*

               CALL sbdsdc( 'U', 'I', n, s, rwork( ie ), rwork( iru ),

     $                      n, rwork( irvt ), n, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Copy real matrix RWORK(IRVT) to complex matrix VT

*              Overwrite VT by right singular vectors of A

*              CWorkspace: need   2*N [tauq, taup] + N*N [U] + N    [work]

*              CWorkspace: prefer 2*N [tauq, taup] + N*N [U] + N*NB [work]

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT]

*

               CALL clacp2( 'F', n, n, rwork( irvt ), n, vt, ldvt )

               CALL cunmbr( 'P', 'R', 'C', n, n, n, a, lda,

     $                      work( itaup ), vt, ldvt, work( nwork ),

     $                      lwork-nwork+1, ierr )

*

               IF( lwork .GE. m*n + 3*n ) THEN

*

*                 Path 6o-fast

*                 Copy real matrix RWORK(IRU) to complex matrix WORK(IU)

*                 Overwrite WORK(IU) by left singular vectors of A, copying

*                 to A

*                 CWorkspace: need   2*N [tauq, taup] + M*N [U] + N    [work]

*                 CWorkspace: prefer 2*N [tauq, taup] + M*N [U] + N*NB [work]

*                 RWorkspace: need   N [e] + N*N [RU]

*

                  CALL claset( 'F', m, n, czero, czero, work( iu ),

     $                         ldwrku )

                  CALL clacp2( 'F', n, n, rwork( iru ), n, work( iu ),

     $                         ldwrku )

                  CALL cunmbr( 'Q', 'L', 'N', m, n, n, a, lda,

     $                         work( itauq ), work( iu ), ldwrku,

     $                         work( nwork ), lwork-nwork+1, ierr )

                  CALL clacpy( 'F', m, n, work( iu ), ldwrku, a, lda )

               ELSE

*

*                 Path 6o-slow

*                 Generate Q in A

*                 CWorkspace: need   2*N [tauq, taup] + N*N [U] + N    [work]

*                 CWorkspace: prefer 2*N [tauq, taup] + N*N [U] + N*NB [work]

*                 RWorkspace: need   0

*

                  CALL cungbr( 'Q', m, n, n, a, lda, work( itauq ),

     $                         work( nwork ), lwork-nwork+1, ierr )

*

*                 Multiply Q in A by real matrix RWORK(IRU), storing the

*                 result in WORK(IU), copying to A

*                 CWorkspace: need   2*N [tauq, taup] + N*N [U]

*                 CWorkspace: prefer 2*N [tauq, taup] + M*N [U]

*                 RWorkspace: need   N [e] + N*N [RU] + 2*N*N [rwork]

*                 RWorkspace: prefer N [e] + N*N [RU] + 2*M*N [rwork] < N + 5*N*N since M < 2*N here

*

                  nrwork = irvt

                  DO 30 i = 1, m, ldwrku

                     chunk = min( m-i+1, ldwrku )

                     CALL clacrm( chunk, n, a( i, 1 ), lda,

     $                            rwork( iru ), n, work( iu ), ldwrku,

     $                            rwork( nrwork ) )

                     CALL clacpy( 'F', chunk, n, work( iu ), ldwrku,

     $                            a( i, 1 ), lda )

   30             CONTINUE

               END IF

*

            ELSE IF( wntqs ) THEN

*

*              Path 6s (M >= N, JOBZ='S')

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT] + BDSPAC

*

               iru = nrwork

               irvt = iru + n*n

               nrwork = irvt + n*n

               CALL sbdsdc( 'U', 'I', n, s, rwork( ie ), rwork( iru ),

     $                      n, rwork( irvt ), n, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Copy real matrix RWORK(IRU) to complex matrix U

*              Overwrite U by left singular vectors of A

*              CWorkspace: need   2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT]

*

               CALL claset( 'F', m, n, czero, czero, u, ldu )

               CALL clacp2( 'F', n, n, rwork( iru ), n, u, ldu )

               CALL cunmbr( 'Q', 'L', 'N', m, n, n, a, lda,

     $                      work( itauq ), u, ldu, work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Copy real matrix RWORK(IRVT) to complex matrix VT

*              Overwrite VT by right singular vectors of A

*              CWorkspace: need   2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT]

*

               CALL clacp2( 'F', n, n, rwork( irvt ), n, vt, ldvt )

               CALL cunmbr( 'P', 'R', 'C', n, n, n, a, lda,

     $                      work( itaup ), vt, ldvt, work( nwork ),

     $                      lwork-nwork+1, ierr )

            ELSE

*

*              Path 6a (M >= N, JOBZ='A')

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT] + BDSPAC

*

               iru = nrwork

               irvt = iru + n*n

               nrwork = irvt + n*n

               CALL sbdsdc( 'U', 'I', n, s, rwork( ie ), rwork( iru ),

     $                      n, rwork( irvt ), n, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Zero U, then set its lower right (M-N)-by-(M-N) corner to the identity matrix

*

               CALL claset( 'F', m, m, czero, czero, u, ldu )

               IF( m.GT.n ) THEN

                  CALL claset( 'F', m-n, m-n, czero, cone,

     $                         u( n+1, n+1 ), ldu )

               END IF

*

*              Copy real matrix RWORK(IRU) to complex matrix U

*              Overwrite U by left singular vectors of A

*              CWorkspace: need   2*N [tauq, taup] + M    [work]

*              CWorkspace: prefer 2*N [tauq, taup] + M*NB [work]

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT]

*

               CALL clacp2( 'F', n, n, rwork( iru ), n, u, ldu )

               CALL cunmbr( 'Q', 'L', 'N', m, m, n, a, lda,

     $                      work( itauq ), u, ldu, work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Copy real matrix RWORK(IRVT) to complex matrix VT

*              Overwrite VT by right singular vectors of A

*              CWorkspace: need   2*N [tauq, taup] + N    [work]

*              CWorkspace: prefer 2*N [tauq, taup] + N*NB [work]

*              RWorkspace: need   N [e] + N*N [RU] + N*N [RVT]

*

               CALL clacp2( 'F', n, n, rwork( irvt ), n, vt, ldvt )

               CALL cunmbr( 'P', 'R', 'C', n, n, n, a, lda,

     $                      work( itaup ), vt, ldvt, work( nwork ),

     $                      lwork-nwork+1, ierr )

            END IF

*

         END IF

*

      ELSE

*

*        A has more columns than rows. If A has sufficiently more

*        columns than rows, first reduce using the LQ decomposition (if

*        sufficient workspace available)

*

         IF( n.GE.mnthr1 ) THEN

*

            IF( wntqn ) THEN

*

*              Path 1t (N >> M, JOBZ='N')

*              No singular vectors to be computed

*

               itau = 1

               nwork = itau + m

*

*              Compute A=L*Q

*              CWorkspace: need   M [tau] + M    [work]

*              CWorkspace: prefer M [tau] + M*NB [work]

*              RWorkspace: need   0

*

               CALL cgelqf( m, n, a, lda, work( itau ), work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Zero out above L

*

               CALL claset( 'U', m-1, m-1, czero, czero, a( 1, 2 ),

     $                      lda )

               ie = 1

               itauq = 1

               itaup = itauq + m

               nwork = itaup + m

*

*              Bidiagonalize L in A

*              CWorkspace: need   2*M [tauq, taup] + M      [work]

*              CWorkspace: prefer 2*M [tauq, taup] + 2*M*NB [work]

*              RWorkspace: need   M [e]

*

               CALL cgebrd( m, m, a, lda, s, rwork( ie ), work( itauq ),

     $                      work( itaup ), work( nwork ), lwork-nwork+1,

     $                      ierr )

               nrwork = ie + m

*

*              Perform bidiagonal SVD, compute singular values only

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + BDSPAC

*

               CALL sbdsdc( 'U', 'N', m, s, rwork( ie ), dum,1,dum,1,

     $                      dum, idum, rwork( nrwork ), iwork, info )

*

            ELSE IF( wntqo ) THEN

*

*              Path 2t (N >> M, JOBZ='O')

*              M right singular vectors to be overwritten on A and

*              M left singular vectors to be computed in U

*

               ivt = 1

               ldwkvt = m

*

*              WORK(IVT) is M by M

*

               il = ivt + ldwkvt*m

               IF( lwork .GE. m*n + m*m + 3*m ) THEN

*

*                 WORK(IL) is M by N

*

                  ldwrkl = m

                  chunk = n

               ELSE

*

*                 WORK(IL) is M by CHUNK

*

                  ldwrkl = m

                  chunk = ( lwork - m*m - 3*m ) / m

               END IF

               itau = il + ldwrkl*chunk

               nwork = itau + m

*

*              Compute A=L*Q

*              CWorkspace: need   M*M [VT] + M*M [L] + M [tau] + M    [work]

*              CWorkspace: prefer M*M [VT] + M*M [L] + M [tau] + M*NB [work]

*              RWorkspace: need   0

*

               CALL cgelqf( m, n, a, lda, work( itau ), work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Copy L to WORK(IL), zeroing out above it

*

               CALL clacpy( 'L', m, m, a, lda, work( il ), ldwrkl )

               CALL claset( 'U', m-1, m-1, czero, czero,

     $                      work( il+ldwrkl ), ldwrkl )

*

*              Generate Q in A

*              CWorkspace: need   M*M [VT] + M*M [L] + M [tau] + M    [work]

*              CWorkspace: prefer M*M [VT] + M*M [L] + M [tau] + M*NB [work]

*              RWorkspace: need   0

*

               CALL cunglq( m, n, m, a, lda, work( itau ),

     $                      work( nwork ), lwork-nwork+1, ierr )

               ie = 1

               itauq = itau

               itaup = itauq + m

               nwork = itaup + m

*

*              Bidiagonalize L in WORK(IL)

*              CWorkspace: need   M*M [VT] + M*M [L] + 2*M [tauq, taup] + M      [work]

*              CWorkspace: prefer M*M [VT] + M*M [L] + 2*M [tauq, taup] + 2*M*NB [work]

*              RWorkspace: need   M [e]

*

               CALL cgebrd( m, m, work( il ), ldwrkl, s, rwork( ie ),

     $                      work( itauq ), work( itaup ), work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + M*M [RU] + M*M [RVT] + BDSPAC

*

               iru = ie + m

               irvt = iru + m*m

               nrwork = irvt + m*m

               CALL sbdsdc( 'U', 'I', m, s, rwork( ie ), rwork( iru ),

     $                      m, rwork( irvt ), m, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Copy real matrix RWORK(IRU) to complex matrix U

*              Overwrite U by the left singular vectors of L

*              CWorkspace: need   M*M [VT] + M*M [L] + 2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer M*M [VT] + M*M [L] + 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   0

*

               CALL clacp2( 'F', m, m, rwork( iru ), m, u, ldu )

               CALL cunmbr( 'Q', 'L', 'N', m, m, m, work( il ), ldwrkl,

     $                      work( itauq ), u, ldu, work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Copy real matrix RWORK(IRVT) to complex matrix WORK(IVT)

*              Overwrite WORK(IVT) by the right singular vectors of L

*              CWorkspace: need   M*M [VT] + M*M [L] + 2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer M*M [VT] + M*M [L] + 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   0

*

               CALL clacp2( 'F', m, m, rwork( irvt ), m, work( ivt ),

     $                      ldwkvt )

               CALL cunmbr( 'P', 'R', 'C', m, m, m, work( il ), ldwrkl,

     $                      work( itaup ), work( ivt ), ldwkvt,

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Multiply right singular vectors of L in WORK(IVT) by Q

*              in A, storing result in WORK(IL) and copying to A

*              CWorkspace: need   M*M [VT] + M*M [L]

*              CWorkspace: prefer M*M [VT] + M*N [L]

*              RWorkspace: need   0

*

               DO 40 i = 1, n, chunk

                  blk = min( n-i+1, chunk )

                  CALL cgemm( 'N', 'N', m, blk, m, cone, work( ivt ), m,

     $                        a( 1, i ), lda, czero, work( il ),

     $                        ldwrkl )

                  CALL clacpy( 'F', m, blk, work( il ), ldwrkl,

     $                         a( 1, i ), lda )

   40          CONTINUE

*

            ELSE IF( wntqs ) THEN

*

*              Path 3t (N >> M, JOBZ='S')

*              M right singular vectors to be computed in VT and

*              M left singular vectors to be computed in U

*

               il = 1

*

*              WORK(IL) is M by M

*

               ldwrkl = m

               itau = il + ldwrkl*m

               nwork = itau + m

*

*              Compute A=L*Q

*              CWorkspace: need   M*M [L] + M [tau] + M    [work]

*              CWorkspace: prefer M*M [L] + M [tau] + M*NB [work]

*              RWorkspace: need   0

*

               CALL cgelqf( m, n, a, lda, work( itau ), work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Copy L to WORK(IL), zeroing out above it

*

               CALL clacpy( 'L', m, m, a, lda, work( il ), ldwrkl )

               CALL claset( 'U', m-1, m-1, czero, czero,

     $                      work( il+ldwrkl ), ldwrkl )

*

*              Generate Q in A

*              CWorkspace: need   M*M [L] + M [tau] + M    [work]

*              CWorkspace: prefer M*M [L] + M [tau] + M*NB [work]

*              RWorkspace: need   0

*

               CALL cunglq( m, n, m, a, lda, work( itau ),

     $                      work( nwork ), lwork-nwork+1, ierr )

               ie = 1

               itauq = itau

               itaup = itauq + m

               nwork = itaup + m

*

*              Bidiagonalize L in WORK(IL)

*              CWorkspace: need   M*M [L] + 2*M [tauq, taup] + M      [work]

*              CWorkspace: prefer M*M [L] + 2*M [tauq, taup] + 2*M*NB [work]

*              RWorkspace: need   M [e]

*

               CALL cgebrd( m, m, work( il ), ldwrkl, s, rwork( ie ),

     $                      work( itauq ), work( itaup ), work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + M*M [RU] + M*M [RVT] + BDSPAC

*

               iru = ie + m

               irvt = iru + m*m

               nrwork = irvt + m*m

               CALL sbdsdc( 'U', 'I', m, s, rwork( ie ), rwork( iru ),

     $                      m, rwork( irvt ), m, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Copy real matrix RWORK(IRU) to complex matrix U

*              Overwrite U by left singular vectors of L

*              CWorkspace: need   M*M [L] + 2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer M*M [L] + 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   0

*

               CALL clacp2( 'F', m, m, rwork( iru ), m, u, ldu )

               CALL cunmbr( 'Q', 'L', 'N', m, m, m, work( il ), ldwrkl,

     $                      work( itauq ), u, ldu, work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Copy real matrix RWORK(IRVT) to complex matrix VT

*              Overwrite VT by right singular vectors of L

*              CWorkspace: need   M*M [L] + 2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer M*M [L] + 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   0

*

               CALL clacp2( 'F', m, m, rwork( irvt ), m, vt, ldvt )

               CALL cunmbr( 'P', 'R', 'C', m, m, m, work( il ), ldwrkl,

     $                      work( itaup ), vt, ldvt, work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Copy VT to WORK(IL), multiply right singular vectors of L

*              in WORK(IL) by Q in A, storing result in VT

*              CWorkspace: need   M*M [L]

*              RWorkspace: need   0

*

               CALL clacpy( 'F', m, m, vt, ldvt, work( il ), ldwrkl )

               CALL cgemm( 'N', 'N', m, n, m, cone, work( il ), ldwrkl,

     $                     a, lda, czero, vt, ldvt )

*

            ELSE IF( wntqa ) THEN

*

*              Path 4t (N >> M, JOBZ='A')

*              N right singular vectors to be computed in VT and

*              M left singular vectors to be computed in U

*

               ivt = 1

*

*              WORK(IVT) is M by M

*

               ldwkvt = m

               itau = ivt + ldwkvt*m

               nwork = itau + m

*

*              Compute A=L*Q, copying result to VT

*              CWorkspace: need   M*M [VT] + M [tau] + M    [work]

*              CWorkspace: prefer M*M [VT] + M [tau] + M*NB [work]

*              RWorkspace: need   0

*

               CALL cgelqf( m, n, a, lda, work( itau ), work( nwork ),

     $                      lwork-nwork+1, ierr )

               CALL clacpy( 'U', m, n, a, lda, vt, ldvt )

*

*              Generate Q in VT

*              CWorkspace: need   M*M [VT] + M [tau] + N    [work]

*              CWorkspace: prefer M*M [VT] + M [tau] + N*NB [work]

*              RWorkspace: need   0

*

               CALL cunglq( n, n, m, vt, ldvt, work( itau ),

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Produce L in A, zeroing out above it

*

               CALL claset( 'U', m-1, m-1, czero, czero, a( 1, 2 ),

     $                      lda )

               ie = 1

               itauq = itau

               itaup = itauq + m

               nwork = itaup + m

*

*              Bidiagonalize L in A

*              CWorkspace: need   M*M [VT] + 2*M [tauq, taup] + M      [work]

*              CWorkspace: prefer M*M [VT] + 2*M [tauq, taup] + 2*M*NB [work]

*              RWorkspace: need   M [e]

*

               CALL cgebrd( m, m, a, lda, s, rwork( ie ), work( itauq ),

     $                      work( itaup ), work( nwork ), lwork-nwork+1,

     $                      ierr )

*

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + M*M [RU] + M*M [RVT] + BDSPAC

*

               iru = ie + m

               irvt = iru + m*m

               nrwork = irvt + m*m

               CALL sbdsdc( 'U', 'I', m, s, rwork( ie ), rwork( iru ),

     $                      m, rwork( irvt ), m, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Copy real matrix RWORK(IRU) to complex matrix U

*              Overwrite U by left singular vectors of L

*              CWorkspace: need   M*M [VT] + 2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer M*M [VT] + 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   0

*

               CALL clacp2( 'F', m, m, rwork( iru ), m, u, ldu )

               CALL cunmbr( 'Q', 'L', 'N', m, m, m, a, lda,

     $                      work( itauq ), u, ldu, work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Copy real matrix RWORK(IRVT) to complex matrix WORK(IVT)

*              Overwrite WORK(IVT) by right singular vectors of L

*              CWorkspace: need   M*M [VT] + 2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer M*M [VT] + 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   0

*

               CALL clacp2( 'F', m, m, rwork( irvt ), m, work( ivt ),

     $                      ldwkvt )

               CALL cunmbr( 'P', 'R', 'C', m, m, m, a, lda,

     $                      work( itaup ), work( ivt ), ldwkvt,

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Multiply right singular vectors of L in WORK(IVT) by

*              Q in VT, storing result in A

*              CWorkspace: need   M*M [VT]

*              RWorkspace: need   0

*

               CALL cgemm( 'N', 'N', m, n, m, cone, work( ivt ), ldwkvt,

     $                     vt, ldvt, czero, a, lda )

*

*              Copy right singular vectors of A from A to VT

*

               CALL clacpy( 'F', m, n, a, lda, vt, ldvt )

*

            END IF

*

         ELSE IF( n.GE.mnthr2 ) THEN

*

*           MNTHR2 <= N < MNTHR1

*

*           Path 5t (N >> M, but not as much as MNTHR1)

*           Reduce to bidiagonal form without LQ decomposition, use

*           CUNGBR and matrix multiplication to compute singular vectors

*

            ie = 1

            nrwork = ie + m

            itauq = 1

            itaup = itauq + m

            nwork = itaup + m

*

*           Bidiagonalize A

*           CWorkspace: need   2*M [tauq, taup] + N        [work]

*           CWorkspace: prefer 2*M [tauq, taup] + (M+N)*NB [work]

*           RWorkspace: need   M [e]

*

            CALL cgebrd( m, n, a, lda, s, rwork( ie ), work( itauq ),

     $                   work( itaup ), work( nwork ), lwork-nwork+1,

     $                   ierr )

*

            IF( wntqn ) THEN

*

*              Path 5tn (N >> M, JOBZ='N')

*              Compute singular values only

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + BDSPAC

*

               CALL sbdsdc( 'L', 'N', m, s, rwork( ie ), dum,1,dum,1,

     $                      dum, idum, rwork( nrwork ), iwork, info )

            ELSE IF( wntqo ) THEN

               irvt = nrwork

               iru = irvt + m*m

               nrwork = iru + m*m

               ivt = nwork

*

*              Path 5to (N >> M, JOBZ='O')

*              Copy A to U, generate Q

*              CWorkspace: need   2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   0

*

               CALL clacpy( 'L', m, m, a, lda, u, ldu )

               CALL cungbr( 'Q', m, m, n, u, ldu, work( itauq ),

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Generate P**H in A

*              CWorkspace: need   2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   0

*

               CALL cungbr( 'P', m, n, m, a, lda, work( itaup ),

     $                      work( nwork ), lwork-nwork+1, ierr )

*

               ldwkvt = m

               IF( lwork .GE. m*n + 3*m ) THEN

*

*                 WORK( IVT ) is M by N

*

                  nwork = ivt + ldwkvt*n

                  chunk = n

               ELSE

*

*                 WORK( IVT ) is M by CHUNK

*

                  chunk = ( lwork - 3*m ) / m

                  nwork = ivt + ldwkvt*chunk

               END IF

*

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + M*M [RVT] + M*M [RU] + BDSPAC

*

               CALL sbdsdc( 'L', 'I', m, s, rwork( ie ), rwork( iru ),

     $                      m, rwork( irvt ), m, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Multiply Q in U by real matrix RWORK(IRU)

*              storing the result in WORK(IVT), copying to U

*              CWorkspace: need   2*M [tauq, taup] + M*M [VT]

*              RWorkspace: need   M [e] + M*M [RVT] + M*M [RU] + 2*M*M [rwork]

*

               CALL clacrm( m, m, u, ldu, rwork( iru ), m, work( ivt ),

     $                      ldwkvt, rwork( nrwork ) )

               CALL clacpy( 'F', m, m, work( ivt ), ldwkvt, u, ldu )

*

*              Multiply RWORK(IRVT) by P**H in A, storing the

*              result in WORK(IVT), copying to A

*              CWorkspace: need   2*M [tauq, taup] + M*M [VT]

*              CWorkspace: prefer 2*M [tauq, taup] + M*N [VT]

*              RWorkspace: need   M [e] + M*M [RVT] + 2*M*M [rwork]

*              RWorkspace: prefer M [e] + M*M [RVT] + 2*M*N [rwork] < M + 5*M*M since N < 2*M here

*

               nrwork = iru

               DO 50 i = 1, n, chunk

                  blk = min( n-i+1, chunk )

                  CALL clarcm( m, blk, rwork( irvt ), m, a( 1, i ), lda,

     $                         work( ivt ), ldwkvt, rwork( nrwork ) )

                  CALL clacpy( 'F', m, blk, work( ivt ), ldwkvt,

     $                         a( 1, i ), lda )

   50          CONTINUE

            ELSE IF( wntqs ) THEN

*

*              Path 5ts (N >> M, JOBZ='S')

*              Copy A to U, generate Q

*              CWorkspace: need   2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   0

*

               CALL clacpy( 'L', m, m, a, lda, u, ldu )

               CALL cungbr( 'Q', m, m, n, u, ldu, work( itauq ),

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Copy A to VT, generate P**H

*              CWorkspace: need   2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   0

*

               CALL clacpy( 'U', m, n, a, lda, vt, ldvt )

               CALL cungbr( 'P', m, n, m, vt, ldvt, work( itaup ),

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + M*M [RVT] + M*M [RU] + BDSPAC

*

               irvt = nrwork

               iru = irvt + m*m

               nrwork = iru + m*m

               CALL sbdsdc( 'L', 'I', m, s, rwork( ie ), rwork( iru ),

     $                      m, rwork( irvt ), m, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Multiply Q in U by real matrix RWORK(IRU), storing the

*              result in A, copying to U

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + M*M [RVT] + M*M [RU] + 2*M*M [rwork]

*

               CALL clacrm( m, m, u, ldu, rwork( iru ), m, a, lda,

     $                      rwork( nrwork ) )

               CALL clacpy( 'F', m, m, a, lda, u, ldu )

*

*              Multiply real matrix RWORK(IRVT) by P**H in VT,

*              storing the result in A, copying to VT

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + M*M [RVT] + 2*M*N [rwork] < M + 5*M*M since N < 2*M here

*

               nrwork = iru

               CALL clarcm( m, n, rwork( irvt ), m, vt, ldvt, a, lda,

     $                      rwork( nrwork ) )

               CALL clacpy( 'F', m, n, a, lda, vt, ldvt )

            ELSE

*

*              Path 5ta (N >> M, JOBZ='A')

*              Copy A to U, generate Q

*              CWorkspace: need   2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   0

*

               CALL clacpy( 'L', m, m, a, lda, u, ldu )

               CALL cungbr( 'Q', m, m, n, u, ldu, work( itauq ),

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Copy A to VT, generate P**H

*              CWorkspace: need   2*M [tauq, taup] + N    [work]

*              CWorkspace: prefer 2*M [tauq, taup] + N*NB [work]

*              RWorkspace: need   0

*

               CALL clacpy( 'U', m, n, a, lda, vt, ldvt )

               CALL cungbr( 'P', n, n, m, vt, ldvt, work( itaup ),

     $                      work( nwork ), lwork-nwork+1, ierr )

*

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + M*M [RVT] + M*M [RU] + BDSPAC

*

               irvt = nrwork

               iru = irvt + m*m

               nrwork = iru + m*m

               CALL sbdsdc( 'L', 'I', m, s, rwork( ie ), rwork( iru ),

     $                      m, rwork( irvt ), m, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Multiply Q in U by real matrix RWORK(IRU), storing the

*              result in A, copying to U

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + M*M [RVT] + M*M [RU] + 2*M*M [rwork]

*

               CALL clacrm( m, m, u, ldu, rwork( iru ), m, a, lda,

     $                      rwork( nrwork ) )

               CALL clacpy( 'F', m, m, a, lda, u, ldu )

*

*              Multiply real matrix RWORK(IRVT) by P**H in VT,

*              storing the result in A, copying to VT

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + M*M [RVT] + 2*M*N [rwork] < M + 5*M*M since N < 2*M here

*

               nrwork = iru

               CALL clarcm( m, n, rwork( irvt ), m, vt, ldvt, a, lda,

     $                      rwork( nrwork ) )

               CALL clacpy( 'f', M, N, A, LDA, VT, LDVT )

            END IF

*

         ELSE

*

*           N .LT. MNTHR2

*

*           Path 6t (N > M, but not much larger)

*           Reduce to bidiagonal form without LQ decomposition

*           Use CUNMBR to compute singular vectors

*

            IE = 1

            NRWORK = IE + M

            ITAUQ = 1

            ITAUP = ITAUQ + M

            NWORK = ITAUP + M

*

*           Bidiagonalize A

*           CWorkspace: need   2*M [tauq, taup] + N        [work]

*           CWorkspace: prefer 2*M [tauq, taup] + (M+N)*NB [work]

*           RWorkspace: need   M [e]

*

            CALL CGEBRD( M, N, A, LDA, S, RWORK( IE ), WORK( ITAUQ ),

     $                   WORK( ITAUP ), WORK( NWORK ), LWORK-NWORK+1,

     $                   IERR )

            IF( WNTQN ) THEN

*

*              Path 6tn (N > M, JOBZ='N')

*              Compute singular values only

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + BDSPAC

*

               CALL SBDSDC( 'l', 'n', M, S, RWORK( IE ), DUM,1,DUM,1,

     $                      DUM, IDUM, RWORK( NRWORK ), IWORK, INFO )

            ELSE IF( WNTQO ) THEN

*              Path 6to (N > M, JOBZ='O')

               LDWKVT = M

               IVT = NWORK

               IF( LWORK .GE. M*N + 3*M ) THEN

*

*                 WORK( IVT ) is M by N

*

                  CALL CLASET( 'f', M, N, CZERO, CZERO, WORK( IVT ),

     $                         LDWKVT )

                  NWORK = IVT + LDWKVT*N

               ELSE

*

*                 WORK( IVT ) is M by CHUNK

*

                  CHUNK = ( LWORK - 3*M ) / M

                  NWORK = IVT + LDWKVT*CHUNK

               END IF

*

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + M*M [RVT] + M*M [RU] + BDSPAC

*

               IRVT = NRWORK

               IRU = IRVT + M*M

               NRWORK = IRU + M*M

               CALL SBDSDC( 'l', 'i', M, S, RWORK( IE ), RWORK( IRU ),

     $                      M, RWORK( IRVT ), M, DUM, IDUM,

     $                      RWORK( NRWORK ), IWORK, INFO )

*

*              Copy real matrix RWORK(IRU) to complex matrix U

*              Overwrite U by left singular vectors of A

*              CWorkspace: need   2*M [tauq, taup] + M*M [VT] + M    [work]

*              CWorkspace: prefer 2*M [tauq, taup] + M*M [VT] + M*NB [work]

*              RWorkspace: need   M [e] + M*M [RVT] + M*M [RU]

*

               CALL CLACP2( 'f', M, M, RWORK( IRU ), M, U, LDU )

               CALL CUNMBR( 'q', 'l', 'n', M, M, N, A, LDA,

     $                      WORK( ITAUQ ), U, LDU, WORK( NWORK ),

     $                      LWORK-NWORK+1, IERR )

*

               IF( LWORK .GE. M*N + 3*M ) THEN

*

*                 Path 6to-fast

*                 Copy real matrix RWORK(IRVT) to complex matrix WORK(IVT)

*                 Overwrite WORK(IVT) by right singular vectors of A,

*                 copying to A

*                 CWorkspace: need   2*M [tauq, taup] + M*N [VT] + M    [work]

*                 CWorkspace: prefer 2*M [tauq, taup] + M*N [VT] + M*NB [work]

*                 RWorkspace: need   M [e] + M*M [RVT]

*

                  CALL CLACP2( 'f', M, M, RWORK( IRVT ), M, WORK( IVT ),

     $                         LDWKVT )

                  CALL CUNMBR( 'p', 'r', 'C', m, n, m, a, lda,

     $                         work( itaup ), work( ivt ), ldwkvt,

     $                         work( nwork ), lwork-nwork+1, ierr )

                  CALL clacpy( 'F', m, n, work( ivt ), ldwkvt, a, lda )

               ELSE

*

*                 Path 6to-slow

*                 Generate P**H in A

*                 CWorkspace: need   2*M [tauq, taup] + M*M [VT] + M    [work]

*                 CWorkspace: prefer 2*M [tauq, taup] + M*M [VT] + M*NB [work]

*                 RWorkspace: need   0

*

                  CALL cungbr( 'P', m, n, m, a, lda, work( itaup ),

     $                         work( nwork ), lwork-nwork+1, ierr )

*

*                 Multiply real matrix RWORK(IRVT) by P**H in A, storing

*                 the result in WORK(IVT), copying to A

*                 CWorkspace: need   2*M [tauq, taup] + M*M [VT]

*                 CWorkspace: prefer 2*M [tauq, taup] + M*N [VT]

*                 RWorkspace: need   M [e] + M*M [RVT] + 2*M*M [rwork]

*                 RWorkspace: prefer M [e] + M*M [RVT] + 2*M*N [rwork] < M + 5*M*M since N < 2*M here

*

                  nrwork = iru

                  DO 60 i = 1, n, chunk

                     blk = min( n-i+1, chunk )

                     CALL clarcm( m, blk, rwork( irvt ), m, a( 1, i ),

     $                            lda, work( ivt ), ldwkvt,

     $                            rwork( nrwork ) )

                     CALL clacpy( 'F', m, blk, work( ivt ), ldwkvt,

     $                            a( 1, i ), lda )

   60             CONTINUE

               END IF

            ELSE IF( wntqs ) THEN

*

*              Path 6ts (N > M, JOBZ='S')

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + M*M [RVT] + M*M [RU] + BDSPAC

*

               irvt = nrwork

               iru = irvt + m*m

               nrwork = iru + m*m

               CALL sbdsdc( 'L', 'I', m, s, rwork( ie ), rwork( iru ),

     $                      m, rwork( irvt ), m, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Copy real matrix RWORK(IRU) to complex matrix U

*              Overwrite U by left singular vectors of A

*              CWorkspace: need   2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   M [e] + M*M [RVT] + M*M [RU]

*

               CALL clacp2( 'F', m, m, rwork( iru ), m, u, ldu )

               CALL cunmbr( 'Q', 'L', 'N', m, m, n, a, lda,

     $                      work( itauq ), u, ldu, work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Copy real matrix RWORK(IRVT) to complex matrix VT

*              Overwrite VT by right singular vectors of A

*              CWorkspace: need   2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   M [e] + M*M [RVT]

*

               CALL claset( 'F', m, n, czero, czero, vt, ldvt )

               CALL clacp2( 'F', m, m, rwork( irvt ), m, vt, ldvt )

               CALL cunmbr( 'P', 'R', 'C', m, n, m, a, lda,

     $                      work( itaup ), vt, ldvt, work( nwork ),

     $                      lwork-nwork+1, ierr )

            ELSE

*

*              Path 6ta (N > M, JOBZ='A')

*              Perform bidiagonal SVD, computing left singular vectors

*              of bidiagonal matrix in RWORK(IRU) and computing right

*              singular vectors of bidiagonal matrix in RWORK(IRVT)

*              CWorkspace: need   0

*              RWorkspace: need   M [e] + M*M [RVT] + M*M [RU] + BDSPAC

*

               irvt = nrwork

               iru = irvt + m*m

               nrwork = iru + m*m

*

               CALL sbdsdc( 'L', 'I', m, s, rwork( ie ), rwork( iru ),

     $                      m, rwork( irvt ), m, dum, idum,

     $                      rwork( nrwork ), iwork, info )

*

*              Copy real matrix RWORK(IRU) to complex matrix U

*              Overwrite U by left singular vectors of A

*              CWorkspace: need   2*M [tauq, taup] + M    [work]

*              CWorkspace: prefer 2*M [tauq, taup] + M*NB [work]

*              RWorkspace: need   M [e] + M*M [RVT] + M*M [RU]

*

               CALL clacp2( 'F', m, m, rwork( iru ), m, u, ldu )

               CALL cunmbr( 'Q', 'L', 'N', m, m, n, a, lda,

     $                      work( itauq ), u, ldu, work( nwork ),

     $                      lwork-nwork+1, ierr )

*

*              Set all of VT to identity matrix

*

               CALL claset( 'F', n, n, czero, cone, vt, ldvt )

*

*              Copy real matrix RWORK(IRVT) to complex matrix VT

*              Overwrite VT by right singular vectors of A

*              CWorkspace: need   2*M [tauq, taup] + N    [work]

*              CWorkspace: prefer 2*M [tauq, taup] + N*NB [work]

*              RWorkspace: need   M [e] + M*M [RVT]

*

               CALL clacp2( 'F', m, m, rwork( irvt ), m, vt, ldvt )

               CALL cunmbr( 'P', 'R', 'C', n, n, m, a, lda,

     $                      work( itaup ), vt, ldvt, work( nwork ),

     $                      lwork-nwork+1, ierr )

            END IF

*

         END IF

*

      END IF

*

*     Undo scaling if necessary

*

      IF( iscl.EQ.1 ) THEN

         IF( anrm.GT.bignum )

     $      CALL slascl( 'G', 0, 0, bignum, anrm, minmn, 1, s, minmn,

     $                   ierr )

         IF( info.NE.0 .AND. anrm.GT.bignum )

     $      CALL slascl( 'G', 0, 0, bignum, anrm, minmn-1, 1,

     $                   rwork( ie ), minmn, ierr )

         IF( anrm.LT.smlnum )

     $      CALL slascl( 'G', 0, 0, smlnum, anrm, minmn, 1, s, minmn,

     $                   ierr )

         IF( info.NE.0 .AND. anrm.LT.smlnum )

     $      CALL slascl( 'G', 0, 0, smlnum, anrm, minmn-1, 1,

     $                   rwork( ie ), minmn, ierr )

      END IF

*

*     Return optimal workspace in WORK(1)

*

      work( 1 ) = sroundup_lwork( maxwrk )

*

      RETURN

*

*     End of CGESDD

*


      END

slascl
subroutine slascl(type, kl, ku, cfrom, cto, m, n, a, lda, info)
SLASCL multiplies a general rectangular matrix by a real scalar defined as cto/cfrom.
Definition slascl.f:143

sbdsdc
subroutine sbdsdc(uplo, compq, n, d, e, u, ldu, vt, ldvt, q, iq, work, iwork, info)
SBDSDC
Definition sbdsdc.f:205

xerbla
subroutine xerbla(srname, info)
XERBLA
Definition xerbla.f:60

cungbr
subroutine cungbr(vect, m, n, k, a, lda, tau, work, lwork, info)
CUNGBR
Definition cungbr.f:157

cgeqrf
subroutine cgeqrf(m, n, a, lda, tau, work, lwork, info)
CGEQRF
Definition cgeqrf.f:146

cgebrd
subroutine cgebrd(m, n, a, lda, d, e, tauq, taup, work, lwork, info)
CGEBRD
Definition cgebrd.f:206

cgelqf
subroutine cgelqf(m, n, a, lda, tau, work, lwork, info)
CGELQF
Definition cgelqf.f:143

cgesdd
subroutine cgesdd(jobz, m, n, a, lda, s, u, ldu, vt, ldvt, work, lwork, rwork, iwork, info)
CGESDD
Definition cgesdd.f:227

clascl
subroutine clascl(type, kl, ku, cfrom, cto, m, n, a, lda, info)
CLASCL multiplies a general rectangular matrix by a real scalar defined as cto/cfrom.
Definition clascl.f:143

clacrm
subroutine clacrm(m, n, a, lda, b, ldb, c, ldc, rwork)
CLACRM multiplies a complex matrix by a square real matrix.
Definition clacrm.f:114

clacp2
subroutine clacp2(uplo, m, n, a, lda, b, ldb)
CLACP2 copies all or part of a real two-dimensional array to a complex array.
Definition clacp2.f:104

clacpy
subroutine clacpy(uplo, m, n, a, lda, b, ldb)
CLACPY copies all or part of one two-dimensional array to another.
Definition clacpy.f:103

claset
subroutine claset(uplo, m, n, alpha, beta, a, lda)
CLASET initializes the off-diagonal elements and the diagonal elements of a matrix to given values.
Definition claset.f:106

clarcm
subroutine clarcm(m, n, a, lda, b, ldb, c, ldc, rwork)
CLARCM multiplies a square real matrix by a complex matrix.
Definition clarcm.f:114

cunglq
subroutine cunglq(m, n, k, a, lda, tau, work, lwork, info)
CUNGLQ
Definition cunglq.f:127

cungqr
subroutine cungqr(m, n, k, a, lda, tau, work, lwork, info)
CUNGQR
Definition cungqr.f:128

cunmbr
subroutine cunmbr(vect, side, trans, m, n, k, a, lda, tau, c, ldc, work, lwork, info)
CUNMBR
Definition cunmbr.f:197

cgemm
subroutine cgemm(transa, transb, m, n, k, alpha, a, lda, b, ldb, beta, c, ldc)
CGEMM
Definition cgemm.f:187

min
#define min(a, b)
Definition macros.h:20

max
#define max(a, b)
Definition macros.h:21