Functions
program	__secondtst_f__
	SECONDTST
program	__slamchtst_f__
	SLAMCHTST
character *1 function	chla_transtype (trans)
	CHLA_TRANSTYPE
subroutine	dbdsdc (uplo, compq, n, d, e, u, ldu, vt, ldvt, q, iq, work, iwork, info)
	DBDSDC
subroutine	dbdsqr (uplo, n, ncvt, nru, ncc, d, e, vt, ldvt, u, ldu, c, ldc, work, info)
	DBDSQR
subroutine	ddisna (job, m, n, d, sep, info)
	DDISNA
subroutine	dlaed0 (icompq, qsiz, n, d, e, q, ldq, qstore, ldqs, work, iwork, info)
	DLAED0 used by DSTEDC. Computes all eigenvalues and corresponding eigenvectors of an unreduced symmetric tridiagonal matrix using the divide and conquer method.
subroutine	dlaed1 (n, d, q, ldq, indxq, rho, cutpnt, work, iwork, info)
	DLAED1 used by DSTEDC. Computes the updated eigensystem of a diagonal matrix after modification by a rank-one symmetric matrix. Used when the original matrix is tridiagonal.
subroutine	dlaed2 (k, n, n1, d, q, ldq, indxq, rho, z, dlamda, w, q2, indx, indxc, indxp, coltyp, info)
	DLAED2 used by DSTEDC. Merges eigenvalues and deflates secular equation. Used when the original matrix is tridiagonal.
subroutine	dlaed3 (k, n, n1, d, q, ldq, rho, dlamda, q2, indx, ctot, w, s, info)
	DLAED3 used by DSTEDC. Finds the roots of the secular equation and updates the eigenvectors. Used when the original matrix is tridiagonal.
subroutine	dlaed4 (n, i, d, z, delta, rho, dlam, info)
	DLAED4 used by DSTEDC. Finds a single root of the secular equation.
subroutine	dlaed5 (i, d, z, delta, rho, dlam)
	DLAED5 used by DSTEDC. Solves the 2-by-2 secular equation.
subroutine	dlaed6 (kniter, orgati, rho, d, z, finit, tau, info)
	DLAED6 used by DSTEDC. Computes one Newton step in solution of the secular equation.
subroutine	dlaed7 (icompq, n, qsiz, tlvls, curlvl, curpbm, d, q, ldq, indxq, rho, cutpnt, qstore, qptr, prmptr, perm, givptr, givcol, givnum, work, iwork, info)
	DLAED7 used by DSTEDC. Computes the updated eigensystem of a diagonal matrix after modification by a rank-one symmetric matrix. Used when the original matrix is dense.
subroutine	dlaed8 (icompq, k, n, qsiz, d, q, ldq, indxq, rho, cutpnt, z, dlamda, q2, ldq2, w, perm, givptr, givcol, givnum, indxp, indx, info)
	DLAED8 used by DSTEDC. Merges eigenvalues and deflates secular equation. Used when the original matrix is dense.
subroutine	dlaed9 (k, kstart, kstop, n, d, q, ldq, rho, dlamda, w, s, lds, info)
	DLAED9 used by DSTEDC. Finds the roots of the secular equation and updates the eigenvectors. Used when the original matrix is dense.
subroutine	dlaeda (n, tlvls, curlvl, curpbm, prmptr, perm, givptr, givcol, givnum, q, qptr, z, ztemp, info)
	DLAEDA used by DSTEDC. Computes the Z vector determining the rank-one modification of the diagonal matrix. Used when the original matrix is dense.
subroutine	dlagtf (n, a, lambda, b, c, tol, d, in, info)
	DLAGTF computes an LU factorization of a matrix T-λI, where T is a general tridiagonal matrix, and λ a scalar, using partial pivoting with row interchanges.
subroutine	dlamrg (n1, n2, a, dtrd1, dtrd2, index)
	DLAMRG creates a permutation list to merge the entries of two independently sorted sets into a single set sorted in ascending order.
subroutine	dlartgs (x, y, sigma, cs, sn)
	DLARTGS generates a plane rotation designed to introduce a bulge in implicit QR iteration for the bidiagonal SVD problem.
subroutine	dlasq1 (n, d, e, work, info)
	DLASQ1 computes the singular values of a real square bidiagonal matrix. Used by dbdsqr.
subroutine	dlasq2 (n, z, info)
	DLASQ2 computes all the eigenvalues of the symmetric positive definite tridiagonal matrix associated with the qd Array Z to high relative accuracy. Used by dbdsqr and dstegr.
subroutine	dlasq3 (i0, n0, z, pp, dmin, sigma, desig, qmax, nfail, iter, ndiv, ieee, ttype, dmin1, dmin2, dn, dn1, dn2, g, tau)
	DLASQ3 checks for deflation, computes a shift and calls dqds. Used by dbdsqr.
subroutine	dlasq4 (i0, n0, z, pp, n0in, dmin, dmin1, dmin2, dn, dn1, dn2, tau, ttype, g)
	DLASQ4 computes an approximation to the smallest eigenvalue using values of d from the previous transform. Used by dbdsqr.
subroutine	dlasq5 (i0, n0, z, pp, tau, sigma, dmin, dmin1, dmin2, dn, dnm1, dnm2, ieee, eps)
	DLASQ5 computes one dqds transform in ping-pong form. Used by dbdsqr and dstegr.
subroutine	dlasq6 (i0, n0, z, pp, dmin, dmin1, dmin2, dn, dnm1, dnm2)
	DLASQ6 computes one dqd transform in ping-pong form. Used by dbdsqr and dstegr.
subroutine	dlasrt (id, n, d, info)
	DLASRT sorts numbers in increasing or decreasing order.
subroutine	dstebz (range, order, n, vl, vu, il, iu, abstol, d, e, m, nsplit, w, iblock, isplit, work, iwork, info)
	DSTEBZ
subroutine	dstedc (compz, n, d, e, z, ldz, work, lwork, iwork, liwork, info)
	DSTEDC
subroutine	dsteqr (compz, n, d, e, z, ldz, work, info)
	DSTEQR
subroutine	dsterf (n, d, e, info)
	DSTERF
integer function	iladiag (diag)
	ILADIAG
integer function	ilaprec (prec)
	ILAPREC
integer function	ilatrans (trans)
	ILATRANS
integer function	ilauplo (uplo)
	ILAUPLO
subroutine	sbdsdc (uplo, compq, n, d, e, u, ldu, vt, ldvt, q, iq, work, iwork, info)
	SBDSDC
subroutine	sbdsqr (uplo, n, ncvt, nru, ncc, d, e, vt, ldvt, u, ldu, c, ldc, work, info)
	SBDSQR
subroutine	sdisna (job, m, n, d, sep, info)
	SDISNA
subroutine	slaed0 (icompq, qsiz, n, d, e, q, ldq, qstore, ldqs, work, iwork, info)
	SLAED0 used by SSTEDC. Computes all eigenvalues and corresponding eigenvectors of an unreduced symmetric tridiagonal matrix using the divide and conquer method.
subroutine	slaed1 (n, d, q, ldq, indxq, rho, cutpnt, work, iwork, info)
	SLAED1 used by SSTEDC. Computes the updated eigensystem of a diagonal matrix after modification by a rank-one symmetric matrix. Used when the original matrix is tridiagonal.
subroutine	slaed2 (k, n, n1, d, q, ldq, indxq, rho, z, dlamda, w, q2, indx, indxc, indxp, coltyp, info)
	SLAED2 used by SSTEDC. Merges eigenvalues and deflates secular equation. Used when the original matrix is tridiagonal.
subroutine	slaed3 (k, n, n1, d, q, ldq, rho, dlamda, q2, indx, ctot, w, s, info)
	SLAED3 used by SSTEDC. Finds the roots of the secular equation and updates the eigenvectors. Used when the original matrix is tridiagonal.
subroutine	slaed4 (n, i, d, z, delta, rho, dlam, info)
	SLAED4 used by SSTEDC. Finds a single root of the secular equation.
subroutine	slaed5 (i, d, z, delta, rho, dlam)
	SLAED5 used by SSTEDC. Solves the 2-by-2 secular equation.
subroutine	slaed6 (kniter, orgati, rho, d, z, finit, tau, info)
	SLAED6 used by SSTEDC. Computes one Newton step in solution of the secular equation.
subroutine	slaed7 (icompq, n, qsiz, tlvls, curlvl, curpbm, d, q, ldq, indxq, rho, cutpnt, qstore, qptr, prmptr, perm, givptr, givcol, givnum, work, iwork, info)
	SLAED7 used by SSTEDC. Computes the updated eigensystem of a diagonal matrix after modification by a rank-one symmetric matrix. Used when the original matrix is dense.
subroutine	slaed8 (icompq, k, n, qsiz, d, q, ldq, indxq, rho, cutpnt, z, dlamda, q2, ldq2, w, perm, givptr, givcol, givnum, indxp, indx, info)
	SLAED8 used by SSTEDC. Merges eigenvalues and deflates secular equation. Used when the original matrix is dense.
subroutine	slaed9 (k, kstart, kstop, n, d, q, ldq, rho, dlamda, w, s, lds, info)
	SLAED9 used by SSTEDC. Finds the roots of the secular equation and updates the eigenvectors. Used when the original matrix is dense.
subroutine	slaeda (n, tlvls, curlvl, curpbm, prmptr, perm, givptr, givcol, givnum, q, qptr, z, ztemp, info)
	SLAEDA used by SSTEDC. Computes the Z vector determining the rank-one modification of the diagonal matrix. Used when the original matrix is dense.
subroutine	slagtf (n, a, lambda, b, c, tol, d, in, info)
	SLAGTF computes an LU factorization of a matrix T-λI, where T is a general tridiagonal matrix, and λ a scalar, using partial pivoting with row interchanges.
subroutine	slamrg (n1, n2, a, strd1, strd2, index)
	SLAMRG creates a permutation list to merge the entries of two independently sorted sets into a single set sorted in ascending order.
subroutine	slartgs (x, y, sigma, cs, sn)
	SLARTGS generates a plane rotation designed to introduce a bulge in implicit QR iteration for the bidiagonal SVD problem.
subroutine	slasq1 (n, d, e, work, info)
	SLASQ1 computes the singular values of a real square bidiagonal matrix. Used by sbdsqr.
subroutine	slasq2 (n, z, info)
	SLASQ2 computes all the eigenvalues of the symmetric positive definite tridiagonal matrix associated with the qd Array Z to high relative accuracy. Used by sbdsqr and sstegr.
subroutine	slasq3 (i0, n0, z, pp, dmin, sigma, desig, qmax, nfail, iter, ndiv, ieee, ttype, dmin1, dmin2, dn, dn1, dn2, g, tau)
	SLASQ3 checks for deflation, computes a shift and calls dqds. Used by sbdsqr.
subroutine	slasq4 (i0, n0, z, pp, n0in, dmin, dmin1, dmin2, dn, dn1, dn2, tau, ttype, g)
	SLASQ4 computes an approximation to the smallest eigenvalue using values of d from the previous transform. Used by sbdsqr.
subroutine	slasq5 (i0, n0, z, pp, tau, sigma, dmin, dmin1, dmin2, dn, dnm1, dnm2, ieee, eps)
	SLASQ5 computes one dqds transform in ping-pong form. Used by sbdsqr and sstegr.
subroutine	slasq6 (i0, n0, z, pp, dmin, dmin1, dmin2, dn, dnm1, dnm2)
	SLASQ6 computes one dqd transform in ping-pong form. Used by sbdsqr and sstegr.
subroutine	slasrt (id, n, d, info)
	SLASRT sorts numbers in increasing or decreasing order.
subroutine	spttrf (n, d, e, info)
	SPTTRF
subroutine	sstebz (range, order, n, vl, vu, il, iu, abstol, d, e, m, nsplit, w, iblock, isplit, work, iwork, info)
	SSTEBZ
subroutine	sstedc (compz, n, d, e, z, ldz, work, lwork, iwork, liwork, info)
	SSTEDC
subroutine	ssteqr (compz, n, d, e, z, ldz, work, info)
	SSTEQR
subroutine	ssterf (n, d, e, info)
	SSTERF

Detailed Description

This is the group of auxiliary Computational routines

Function Documentation

◆ __secondtst_f__()

program __secondtst_f__

SECONDTST

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 30 of file secondtst.f.

30 INTEGER NMAX, ITS

◆ __slamchtst_f__()

program __slamchtst_f__

SLAMCHTST

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 28 of file slamchtst.f.

28 REAL BASE, EMAX, EMIN, EPS, RMAX, RMIN, RND, SFMIN,

29 $ T, PREC

◆ chla_transtype()

character*1 function chla_transtype ( integer trans )

CHLA_TRANSTYPE

Download CHLA_TRANSTYPE + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> This function translates from a BLAST-specified integer constant to
!> the character string specifying a transposition operation.
!>
!> CHLA_TRANSTYPE returns a CHARACTER*1.  If CHLA_TRANSTYPE is 'X',
!> then input is not an integer indicating a transposition operator.
!> Otherwise CHLA_TRANSTYPE returns the constant value corresponding to
!> TRANS.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 57 of file chla_transtype.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Maps the integer transposition code TRANS onto a one-letter
*     name: 111 gives 'N', 112 gives 'T', 113 gives 'C', and any
*     other value gives the sentinel 'X'.
*
*     .. Scalar Arguments ..
      INTEGER            TRANS
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     Integer codes recognised for the three transposition modes.
      INTEGER            BLAS_NO_TRANS
      PARAMETER          ( BLAS_NO_TRANS = 111 )
      INTEGER            BLAS_TRANS
      PARAMETER          ( BLAS_TRANS = 112 )
      INTEGER            BLAS_CONJ_TRANS
      PARAMETER          ( BLAS_CONJ_TRANS = 113 )
*     ..
*     .. Executable Statements ..
*
*     Dispatch on the code; unrecognised codes take the default arm.
*
      SELECT CASE( TRANS )
      CASE( BLAS_NO_TRANS )
         CHLA_TRANSTYPE = 'N'
      CASE( BLAS_TRANS )
         CHLA_TRANSTYPE = 'T'
      CASE( BLAS_CONJ_TRANS )
         CHLA_TRANSTYPE = 'C'
      CASE DEFAULT
         CHLA_TRANSTYPE = 'X'
      END SELECT
      RETURN
*
*     End of CHLA_TRANSTYPE
*

◆ dbdsdc()

subroutine dbdsdc	(	character	uplo,
		character	compq,
		integer	n,
		double precision, dimension( * )	d,
		double precision, dimension( * )	e,
		double precision, dimension( ldu, * )	u,
		integer	ldu,
		double precision, dimension( ldvt, * )	vt,
		integer	ldvt,
		double precision, dimension( * )	q,
		integer, dimension( * )	iq,
		double precision, dimension( * )	work,
		integer, dimension( * )	iwork,
		integer	info )

DBDSDC

Download DBDSDC + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DBDSDC computes the singular value decomposition (SVD) of a real
!> N-by-N (upper or lower) bidiagonal matrix B:  B = U * S * VT,
!> using a divide and conquer method, where S is a diagonal matrix
!> with non-negative diagonal elements (the singular values of B), and
!> U and VT are orthogonal matrices of left and right singular vectors,
!> respectively. DBDSDC can be used to compute all singular values,
!> and optionally, singular vectors or singular vectors in compact form.
!>
!> This code makes very mild assumptions about floating point
!> arithmetic. It will work on machines with a guard digit in
!> add/subtract, or on those binary machines without guard digits
!> which subtract like the Cray X-MP, Cray Y-MP, Cray C-90, or Cray-2.
!> It could conceivably fail on hexadecimal or decimal machines
!> without guard digits, but we know of none.  See DLASD3 for details.
!>
!> The code currently calls DLASDQ if singular values only are desired.
!> However, it can be slightly modified to compute singular values
!> using the divide and conquer method.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': B is upper bidiagonal. !> = 'L': B is lower bidiagonal. !>
[in]	COMPQ	!> COMPQ is CHARACTER*1 !> Specifies whether singular vectors are to be computed !> as follows: !> = 'N': Compute singular values only; !> = 'P': Compute singular values and compute singular !> vectors in compact form; !> = 'I': Compute singular values and singular vectors. !>
[in]	N	!> N is INTEGER !> The order of the matrix B. N >= 0. !>
[in,out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> On entry, the n diagonal elements of the bidiagonal matrix B. !> On exit, if INFO=0, the singular values of B. !>
[in,out]	E	!> E is DOUBLE PRECISION array, dimension (N-1) !> On entry, the elements of E contain the offdiagonal !> elements of the bidiagonal matrix whose SVD is desired. !> On exit, E has been destroyed. !>
[out]	U	!> U is DOUBLE PRECISION array, dimension (LDU,N) !> If COMPQ = 'I', then: !> On exit, if INFO = 0, U contains the left singular vectors !> of the bidiagonal matrix. !> For other values of COMPQ, U is not referenced. !>
[in]	LDU	!> LDU is INTEGER !> The leading dimension of the array U. LDU >= 1. !> If singular vectors are desired, then LDU >= max( 1, N ). !>
[out]	VT	!> VT is DOUBLE PRECISION array, dimension (LDVT,N) !> If COMPQ = 'I', then: !> On exit, if INFO = 0, VT**T contains the right singular !> vectors of the bidiagonal matrix. !> For other values of COMPQ, VT is not referenced. !>
[in]	LDVT	!> LDVT is INTEGER !> The leading dimension of the array VT. LDVT >= 1. !> If singular vectors are desired, then LDVT >= max( 1, N ). !>
[out]	Q	!> Q is DOUBLE PRECISION array, dimension (LDQ) !> If COMPQ = 'P', then: !> On exit, if INFO = 0, Q and IQ contain the left !> and right singular vectors in a compact form, !> requiring O(N log N) space instead of 2*N**2. !> In particular, Q contains all the DOUBLE PRECISION data in !> LDQ >= N*(11 + 2*SMLSIZ + 8*INT(LOG_2(N/(SMLSIZ+1)))) !> words of memory, where SMLSIZ is returned by ILAENV and !> is equal to the maximum size of the subproblems at the !> bottom of the computation tree (usually about 25). !> For other values of COMPQ, Q is not referenced. !>
[out]	IQ	!> IQ is INTEGER array, dimension (LDIQ) !> If COMPQ = 'P', then: !> On exit, if INFO = 0, Q and IQ contain the left !> and right singular vectors in a compact form, !> requiring O(N log N) space instead of 2*N**2. !> In particular, IQ contains all INTEGER data in !> LDIQ >= N*(3 + 3*INT(LOG_2(N/(SMLSIZ+1)))) !> words of memory, where SMLSIZ is returned by ILAENV and !> is equal to the maximum size of the subproblems at the !> bottom of the computation tree (usually about 25). !> For other values of COMPQ, IQ is not referenced. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (MAX(1,LWORK)) !> If COMPQ = 'N' then LWORK >= (4 * N). !> If COMPQ = 'P' then LWORK >= (6 * N). !> If COMPQ = 'I' then LWORK >= (3 * N**2 + 4 * N). !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (8*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: The algorithm failed to compute a singular value. !> The update process of divide and conquer failed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Ming Gu and Huan Ren, Computer Science Division, University of California at Berkeley, USA

Definition at line 203 of file dbdsdc.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DBDSDC.  Outline of what follows:
*       1. decode and validate UPLO, COMPQ, N, LDU, LDVT;
*       2. quick returns for N = 0 and N = 1;
*       3. if B is lower bidiagonal, rotate it to upper bidiagonal and
*          remember the rotations;
*       4. COMPQ = 'N' or N <= SMLSIZ: hand the problem to DLASDQ;
*       5. otherwise scale, split at negligible E(I) and call DLASD0
*          (COMPQ = 'I') or DLASDA (COMPQ = 'P') on every piece;
*       6. sort the values in D into decreasing order and finish the
*          bookkeeping for the requested vector format.
*
*     .. Scalar Arguments ..
      CHARACTER          COMPQ, UPLO
      INTEGER            INFO, LDU, LDVT, N
*     ..
*     .. Array Arguments ..
      INTEGER            IQ( * ), IWORK( * )
      DOUBLE PRECISION   D( * ), E( * ), Q( * ), U( LDU, * ),
     $                   VT( LDVT, * ), WORK( * )
*     ..
*
*  =====================================================================
*  Changed dimension statement in comment describing E from (N) to
*  (N-1).  Sven, 17 Feb 05.
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE, TWO
      parameter( zero = 0.0d+0, one = 1.0d+0, two = 2.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            DIFL, DIFR, GIVCOL, GIVNUM, GIVPTR, I, IC,
     $                   ICOMPQ, IERR, II, IS, IU, IUPLO, IVT, J, K, KK,
     $                   MLVL, NM1, NSIZE, PERM, POLES, QSTART, SMLSIZ,
     $                   SMLSZP, SQRE, START, WSTART, Z
      DOUBLE PRECISION   CS, EPS, ORGNRM, P, R, SN
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      DOUBLE PRECISION   DLAMCH, DLANST
      EXTERNAL           lsame, ilaenv, dlamch, dlanst
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dlartg, dlascl, dlasd0, dlasda, dlasdq,
     $                   dlaset, dlasr, dswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, dble, int, log, sign
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
*     Encode UPLO as IUPLO: 1 = 'U', 2 = 'L', 0 = not recognised.
*
      iuplo = 0
      IF( lsame( uplo, 'U' ) )
     $   iuplo = 1
      IF( lsame( uplo, 'L' ) )
     $   iuplo = 2
*
*     Encode COMPQ as ICOMPQ: 0 = 'N', 1 = 'P', 2 = 'I',
*     -1 = not recognised.
*
      IF( lsame( compq, 'N' ) ) THEN
         icompq = 0
      ELSE IF( lsame( compq, 'P' ) ) THEN
         icompq = 1
      ELSE IF( lsame( compq, 'I' ) ) THEN
         icompq = 2
      ELSE
         icompq = -1
      END IF
*
*     INFO = -k reports the position k of the first bad argument in
*     the argument list (UPLO = 1, COMPQ = 2, N = 3, LDU = 7,
*     LDVT = 9).  LDU and LDVT must reach N only when ICOMPQ = 2.
*
      IF( iuplo.EQ.0 ) THEN
         info = -1
      ELSE IF( icompq.LT.0 ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( ( ldu.LT.1 ) .OR. ( ( icompq.EQ.2 ) .AND. ( ldu.LT.
     $         n ) ) ) THEN
         info = -7
      ELSE IF( ( ldvt.LT.1 ) .OR. ( ( icompq.EQ.2 ) .AND. ( ldvt.LT.
     $         n ) ) ) THEN
         info = -9
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DBDSDC', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
      smlsiz = ilaenv( 9, 'DBDSDC', ' ', 0, 0, 0, 0 )
*
*     1-by-1 case: the singular value is abs( D(1) ); the sign of D(1)
*     is stored as the left vector entry and ONE as the right one.
*
      IF( n.EQ.1 ) THEN
         IF( icompq.EQ.1 ) THEN
            q( 1 ) = sign( one, d( 1 ) )
            q( 1+smlsiz*n ) = one
         ELSE IF( icompq.EQ.2 ) THEN
            u( 1, 1 ) = sign( one, d( 1 ) )
            vt( 1, 1 ) = one
         END IF
         d( 1 ) = abs( d( 1 ) )
         RETURN
      END IF
      nm1 = n - 1
*
*     If matrix lower bidiagonal, rotate to be upper bidiagonal
*     by applying Givens rotations on the left
*
*     WSTART is the first entry of WORK passed on as scratch space.
*     Q is addressed below in consecutive slices of length N; QSTART
*     is the first slice used for the compact vector data.  For
*     ICOMPQ = 1 slices 1 and 2 receive copies of D and E, and when B
*     is lower bidiagonal slices 3 and 4 receive CS and SN, which is
*     why QSTART moves from 3 to 5 in that case.
*
      wstart = 1
      qstart = 3
      IF( icompq.EQ.1 ) THEN
         CALL dcopy( n, d, 1, q( 1 ), 1 )
         CALL dcopy( n-1, e, 1, q( n+1 ), 1 )
      END IF
      IF( iuplo.EQ.2 ) THEN
         qstart = 5
*        For ICOMPQ = 2 the loop below fills WORK( 1:N-1 ) with CS and
*        WORK( N:2*N-2 ) with -SN, so scratch space starts at 2*N-1.
         IF( icompq .EQ. 2 ) wstart = 2*n - 1
         DO 10 i = 1, n - 1
            CALL dlartg( d( i ), e( i ), cs, sn, r )
            d( i ) = r
            e( i ) = sn*d( i+1 )
            d( i+1 ) = cs*d( i+1 )
            IF( icompq.EQ.1 ) THEN
               q( i+2*n ) = cs
               q( i+3*n ) = sn
            ELSE IF( icompq.EQ.2 ) THEN
               work( i ) = cs
               work( nm1+i ) = -sn
            END IF
   10    CONTINUE
      END IF
*
*     If ICOMPQ = 0, use DLASDQ to compute the singular values.
*
      IF( icompq.EQ.0 ) THEN
*        Ignore WSTART, instead using WORK( 1 ), since the two vectors
*        for CS and -SN above are added only if ICOMPQ == 2,
*        and adding them exceeds documented WORK size of 4*n.
         CALL dlasdq( 'U', 0, n, 0, 0, 0, d, e, vt, ldvt, u, ldu, u,
     $                ldu, work( 1 ), info )
         GO TO 40
      END IF
*
*     If N is smaller than the minimum divide size SMLSIZ, then solve
*     the problem with another solver.
*
*     The vector targets (U and VT, or the matching slices of Q) are
*     set to the identity before DLASDQ is called on them.
*
      IF( n.LE.smlsiz ) THEN
         IF( icompq.EQ.2 ) THEN
            CALL dlaset( 'A', n, n, zero, one, u, ldu )
            CALL dlaset( 'A', n, n, zero, one, vt, ldvt )
            CALL dlasdq( 'U', 0, n, n, n, 0, d, e, vt, ldvt, u, ldu, u,
     $                   ldu, work( wstart ), info )
         ELSE IF( icompq.EQ.1 ) THEN
            iu = 1
            ivt = iu + n
            CALL dlaset( 'A', n, n, zero, one, q( iu+( qstart-1 )*n ),
     $                   n )
            CALL dlaset( 'A', n, n, zero, one, q( ivt+( qstart-1 )*n ),
     $                   n )
            CALL dlasdq( 'U', 0, n, n, n, 0, d, e,
     $                   q( ivt+( qstart-1 )*n ), n,
     $                   q( iu+( qstart-1 )*n ), n,
     $                   q( iu+( qstart-1 )*n ), n, work( wstart ),
     $                   info )
         END IF
         GO TO 40
      END IF
*
      IF( icompq.EQ.2 ) THEN
         CALL dlaset( 'A', n, n, zero, one, u, ldu )
         CALL dlaset( 'A', n, n, zero, one, vt, ldvt )
      END IF
*
*     Scale.
*
*     ORGNRM is the 'M' norm of the bidiagonal reported by DLANST;
*     an exactly zero norm returns immediately.  D and E are divided
*     by ORGNRM here and D is multiplied back just before label 40.
*
      orgnrm = dlanst( 'M', n, d, e )
      IF( orgnrm.EQ.zero )
     $   RETURN
      CALL dlascl( 'G', 0, 0, orgnrm, one, n, 1, d, n, ierr )
      CALL dlascl( 'G', 0, 0, orgnrm, one, nm1, 1, e, nm1, ierr )
*
*     Threshold used below to decide that an entry is negligible.
*
      eps = (0.9d+0)*dlamch( 'Epsilon' )
*
*     MLVL = INT( LOG2( N / ( SMLSIZ+1 ) ) ) + 1.
*
      mlvl = int( log( dble( n ) / dble( smlsiz+1 ) ) / log( two ) ) + 1
      smlszp = smlsiz + 1
*
*     For ICOMPQ = 1, lay out slice offsets into Q (IU ... GIVNUM,
*     used together with QSTART) and into IQ (K, GIVPTR, PERM, GIVCOL)
*     for the arrays handed to DLASDA below.
*
      IF( icompq.EQ.1 ) THEN
         iu = 1
         ivt = 1 + smlsiz
         difl = ivt + smlszp
         difr = difl + mlvl
         z = difr + mlvl*2
         ic = z + mlvl
         is = ic + 1
         poles = is + 1
         givnum = poles + 2*mlvl
*
         k = 1
         givptr = 2
         perm = 3
         givcol = perm + mlvl
      END IF
*
*     Replace any diagonal entry smaller than EPS in magnitude by EPS
*     carrying the same sign.
*
      DO 20 i = 1, n
         IF( abs( d( i ) ).LT.eps ) THEN
            d( i ) = sign( eps, d( i ) )
         END IF
   20 CONTINUE
*
*     START is the first row of the current subproblem; SQRE = 0 is
*     passed unchanged to DLASD0 / DLASDA.
*
      start = 1
      sqre = 0
*
      DO 30 i = 1, nm1
         IF( ( abs( e( i ) ).LT.eps ) .OR. ( i.EQ.nm1 ) ) THEN
*
*           Subproblem found. First determine its size and then
*           apply divide and conquer on it.
*
            IF( i.LT.nm1 ) THEN
*
*              A subproblem with E(I) small for I < NM1.
*
               nsize = i - start + 1
            ELSE IF( abs( e( i ) ).GE.eps ) THEN
*
*              A subproblem with E(NM1) not too small but I = NM1.
*
               nsize = n - start + 1
            ELSE
*
*              A subproblem with E(NM1) small. This implies an
*              1-by-1 subproblem at D(N). Solve this 1-by-1 problem
*              first.
*
               nsize = i - start + 1
               IF( icompq.EQ.2 ) THEN
                  u( n, n ) = sign( one, d( n ) )
                  vt( n, n ) = one
               ELSE IF( icompq.EQ.1 ) THEN
                  q( n+( qstart-1 )*n ) = sign( one, d( n ) )
                  q( n+( smlsiz+qstart-1 )*n ) = one
               END IF
               d( n ) = abs( d( n ) )
            END IF
*
*           Solve the NSIZE-by-NSIZE piece that begins at row START:
*           DLASD0 writes into U and VT (ICOMPQ = 2), DLASDA writes
*           into the Q / IQ slices laid out above (ICOMPQ = 1).
*
            IF( icompq.EQ.2 ) THEN
               CALL dlasd0( nsize, sqre, d( start ), e( start ),
     $                      u( start, start ), ldu, vt( start, start ),
     $                      ldvt, smlsiz, iwork, work( wstart ), info )
            ELSE
               CALL dlasda( icompq, smlsiz, nsize, sqre, d( start ),
     $                      e( start ), q( start+( iu+qstart-2 )*n ), n,
     $                      q( start+( ivt+qstart-2 )*n ),
     $                      iq( start+k*n ), q( start+( difl+qstart-2 )*
     $                      n ), q( start+( difr+qstart-2 )*n ),
     $                      q( start+( z+qstart-2 )*n ),
     $                      q( start+( poles+qstart-2 )*n ),
     $                      iq( start+givptr*n ), iq( start+givcol*n ),
     $                      n, iq( start+perm*n ),
     $                      q( start+( givnum+qstart-2 )*n ),
     $                      q( start+( ic+qstart-2 )*n ),
     $                      q( start+( is+qstart-2 )*n ),
     $                      work( wstart ), iwork, info )
            END IF
*           A nonzero INFO from the solver is returned to the caller
*           as is; note that D is still scaled on this path.
            IF( info.NE.0 ) THEN
               RETURN
            END IF
            start = i + 1
         END IF
   30 CONTINUE
*
*     Unscale
*
      CALL dlascl( 'G', 0, 0, one, orgnrm, n, 1, d, n, ierr )
*
*     Label 40 is also the target of the two DLASDQ branches above,
*     which skip the scaling and therefore the unscaling.
*
   40 CONTINUE
*
*     Use Selection Sort to minimize swaps of singular vectors
*
*     For each position I = II-1 the largest value among D( I:N ) is
*     moved into D( I ), which leaves D in decreasing order.  For
*     ICOMPQ = 2 the matching column of U and row of VT are swapped;
*     for ICOMPQ = 1 the index chosen for position I is recorded in
*     IQ( I ) instead (IQ( I ) = I when no swap was needed).
*
      DO 60 ii = 2, n
         i = ii - 1
         kk = i
         p = d( i )
         DO 50 j = ii, n
            IF( d( j ).GT.p ) THEN
               kk = j
               p = d( j )
            END IF
   50    CONTINUE
         IF( kk.NE.i ) THEN
            d( kk ) = d( i )
            d( i ) = p
            IF( icompq.EQ.1 ) THEN
               iq( i ) = kk
            ELSE IF( icompq.EQ.2 ) THEN
               CALL dswap( n, u( 1, i ), 1, u( 1, kk ), 1 )
               CALL dswap( n, vt( i, 1 ), ldvt, vt( kk, 1 ), ldvt )
            END IF
         ELSE IF( icompq.EQ.1 ) THEN
            iq( i ) = i
         END IF
   60 CONTINUE
*
*     If ICOMPQ = 1, use IQ(N,1) as the indicator for UPLO
*
*     IQ( N ) = 1 marks an upper bidiagonal input, 0 a lower one.
*
      IF( icompq.EQ.1 ) THEN
         IF( iuplo.EQ.1 ) THEN
            iq( n ) = 1
         ELSE
            iq( n ) = 0
         END IF
      END IF
*
*     If B is lower bidiagonal, update U by those Givens rotations
*     which rotated B to be upper bidiagonal
*
*     WORK( 1 ) and WORK( N ) are the CS and -SN sequences stored by
*     loop 10.
*
      IF( ( iuplo.EQ.2 ) .AND. ( icompq.EQ.2 ) )
     $   CALL dlasr( 'L', 'V', 'B', n, n, work( 1 ), work( n ), u, ldu )
*
      RETURN
*
*     End of DBDSDC
*

◆ dbdsqr()

subroutine dbdsqr	(	character	uplo,
		integer	n,
		integer	ncvt,
		integer	nru,
		integer	ncc,
		double precision, dimension( * )	d,
		double precision, dimension( * )	e,
		double precision, dimension( ldvt, * )	vt,
		integer	ldvt,
		double precision, dimension( ldu, * )	u,
		integer	ldu,
		double precision, dimension( ldc, * )	c,
		integer	ldc,
		double precision, dimension( * )	work,
		integer	info )

DBDSQR

Download DBDSQR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DBDSQR computes the singular values and, optionally, the right and/or
!> left singular vectors from the singular value decomposition (SVD) of
!> a real N-by-N (upper or lower) bidiagonal matrix B using the implicit
!> zero-shift QR algorithm.  The SVD of B has the form
!>
!>    B = Q * S * P**T
!>
!> where S is the diagonal matrix of singular values, Q is an orthogonal
!> matrix of left singular vectors, and P is an orthogonal matrix of
!> right singular vectors.  If left singular vectors are requested, this
!> subroutine actually returns U*Q instead of Q, and, if right singular
!> vectors are requested, this subroutine returns P**T*VT instead of
!> P**T, for given real input matrices U and VT.  When U and VT are the
!> orthogonal matrices that reduce a general matrix A to bidiagonal
!> form:  A = U*B*VT, as computed by DGEBRD, then
!>
!>    A = (U*Q) * S * (P**T*VT)
!>
!> is the SVD of A.  Optionally, the subroutine may also compute Q**T*C
!> for a given real input matrix C.
!>
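!> See "Computing Small Singular Values of Bidiagonal Matrices With
!> Guaranteed High Relative Accuracy," by J. Demmel and W. Kahan,
!> LAPACK Working Note #3 (or SIAM J. Sci. Statist. Comput. vol. 11,
!> no. 5, pp. 873-912, Sept 1990) and
!> "Accurate singular values and differential qd algorithms," by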
!> B. Parlett and V. Fernando, Technical Report CPAM-554, Mathematics
!> Department, University of California at Berkeley, July 1992
!> for a detailed description of the algorithm.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': B is upper bidiagonal; !> = 'L': B is lower bidiagonal. !>
[in]	N	!> N is INTEGER !> The order of the matrix B. N >= 0. !>
[in]	NCVT	!> NCVT is INTEGER !> The number of columns of the matrix VT. NCVT >= 0. !>
[in]	NRU	!> NRU is INTEGER !> The number of rows of the matrix U. NRU >= 0. !>
[in]	NCC	!> NCC is INTEGER !> The number of columns of the matrix C. NCC >= 0. !>
[in,out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> On entry, the n diagonal elements of the bidiagonal matrix B. !> On exit, if INFO=0, the singular values of B in decreasing !> order. !>
[in,out]	E	!> E is DOUBLE PRECISION array, dimension (N-1) !> On entry, the N-1 offdiagonal elements of the bidiagonal !> matrix B. !> On exit, if INFO = 0, E is destroyed; if INFO > 0, D and E !> will contain the diagonal and superdiagonal elements of a !> bidiagonal matrix orthogonally equivalent to the one given !> as input. !>
[in,out]	VT	!> VT is DOUBLE PRECISION array, dimension (LDVT, NCVT) !> On entry, an N-by-NCVT matrix VT. !> On exit, VT is overwritten by P**T * VT. !> Not referenced if NCVT = 0. !>
[in]	LDVT	!> LDVT is INTEGER !> The leading dimension of the array VT. !> LDVT >= max(1,N) if NCVT > 0; LDVT >= 1 if NCVT = 0. !>
[in,out]	U	!> U is DOUBLE PRECISION array, dimension (LDU, N) !> On entry, an NRU-by-N matrix U. !> On exit, U is overwritten by U * Q. !> Not referenced if NRU = 0. !>
[in]	LDU	!> LDU is INTEGER !> The leading dimension of the array U. LDU >= max(1,NRU). !>
[in,out]	C	!> C is DOUBLE PRECISION array, dimension (LDC, NCC) !> On entry, an N-by-NCC matrix C. !> On exit, C is overwritten by Q**T * C. !> Not referenced if NCC = 0. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. !> LDC >= max(1,N) if NCC > 0; LDC >=1 if NCC = 0. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (4*(N-1)) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: If INFO = -i, the i-th argument had an illegal value !> > 0: !> if NCVT = NRU = NCC = 0, !> = 1, a split was marked by a positive value in E !> = 2, current block of Z not diagonalized after 30*N !> iterations (in inner while loop) !> = 3, termination criterion of outer while loop not met !> (program created more than N unreduced blocks) !> else (NCVT, NRU and NCC are not all zero), !> the algorithm did not converge; D and E contain the !> elements of a bidiagonal matrix which is orthogonally !> similar to the input matrix B; if INFO = i, i !> elements of E have not converged to zero. !>

Internal Parameters:

!>  TOLMUL  DOUBLE PRECISION, default = max(10,min(100,EPS**(-1/8)))
!>          TOLMUL controls the convergence criterion of the QR loop.
!>          If it is positive, TOLMUL*EPS is the desired relative
!>             precision in the computed singular values.
!>          If it is negative, abs(TOLMUL*EPS*sigma_max) is the
!>             desired absolute accuracy in the computed singular
!>             values (corresponds to relative accuracy
!>             abs(TOLMUL*EPS) in the largest singular value).
!>          abs(TOLMUL) should be between 1 and 1/EPS, and preferably
!>             between 10 (for fast convergence) and .1/EPS
!>             (for there to be some accuracy in the results).
!>          Default is to lose at either one eighth or 2 of the
!>             available decimal digits in each computed singular value
!>             (whichever is smaller).
!>
!>  MAXITR  INTEGER, default = 6
!>          MAXITR controls the maximum number of passes of the
!>          algorithm through its inner loop. The algorithm stops
!>          (and so fails to converge) if the number of passes
!>          through the inner loop exceeds MAXITR*N**2.
!>
!>

Note:

!>  Bug report from Cezary Dendek.
!>  On March 23rd 2017, the INTEGER variable MAXIT = MAXITR*N**2 was
!>  removed since it can overflow pretty easily (for N greater than or
!>  equal to 18,919). We instead use MAXITDIVN = MAXITR*N.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 239 of file dbdsqr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DBDSQR.  The listing validates its arguments, hands the
*     "no singular vectors" case to DLASQ1, and otherwise runs QR
*     iteration sweeps on the bidiagonal matrix held in D (diagonal)
*     and E (off-diagonal).  The plane rotations produced by each
*     sweep are saved in WORK and then applied to VT, U and C.  On
*     convergence the entries of D are made non-negative and sorted
*     into decreasing order.
*
*     INFO on return from this listing:
*        = 0    normal completion
*        < 0    argument check failed: -1 UPLO, -2 N, -3 NCVT,
*               -4 NRU, -5 NCC, -9 LDVT, -11 LDU, -13 LDC
*        > 0    either the value returned by DLASQ1 (values-only
*               path), or the number of nonzero entries left in E
*               when the iteration limit was reached (label 200)
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDC, LDU, LDVT, N, NCC, NCVT, NRU
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   C( LDC, * ), D( * ), E( * ), U( LDU, * ),
     $                   VT( LDVT, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     TEN, HNDRD and MEIGTH define TOLMUL = max(TEN,min(HNDRD,
*     EPS**MEIGTH)); HNDRTH is used in the zero-shift test; MAXITR
*     scales the iteration limit MAXITDIVN = MAXITR*N.
      DOUBLE PRECISION   ZERO
      parameter( zero = 0.0d0 )
      DOUBLE PRECISION   ONE
      parameter( one = 1.0d0 )
      DOUBLE PRECISION   NEGONE
      parameter( negone = -1.0d0 )
      DOUBLE PRECISION   HNDRTH
      parameter( hndrth = 0.01d0 )
      DOUBLE PRECISION   TEN
      parameter( ten = 10.0d0 )
      DOUBLE PRECISION   HNDRD
      parameter( hndrd = 100.0d0 )
      DOUBLE PRECISION   MEIGTH
      parameter( meigth = -0.125d0 )
      INTEGER            MAXITR
      parameter( maxitr = 6 )
*     ..
*     .. Local Scalars ..
*     LL, M     first and last index of the diagonal block currently
*               being worked on
*     OLDLL,    block limits of the previous sweep, used to detect
*     OLDM      that a new block has been entered
*     IDIR      chase direction: 1 = top to bottom, 2 = bottom to top
*     ITER,     iteration bookkeeping: ITER accumulates M-LL per
*     ITERDIVN  sweep and ITERDIVN counts how many times it reached N
*     NM1,      N-1, 2*(N-1) and 3*(N-1): offsets of the four
*     NM12,     rotation segments inside WORK
*     NM13
      LOGICAL            LOWER, ROTATE
      INTEGER            I, IDIR, ISUB, ITER, ITERDIVN, J, LL, LLL, M,
     $                   MAXITDIVN, NM1, NM12, NM13, OLDLL, OLDM
      DOUBLE PRECISION   ABSE, ABSS, COSL, COSR, CS, EPS, F, G, H, MU,
     $                   OLDCS, OLDSN, R, SHIFT, SIGMN, SIGMX, SINL,
     $                   SINR, SLL, SMAX, SMIN, SMINL, SMINOA,
     $                   SN, THRESH, TOL, TOLMUL, UNFL
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           lsame, dlamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlartg, dlas2, dlasq1, dlasr, dlasv2, drot,
     $                   dscal, dswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, dble, max, min, sign, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*     The first failing test decides INFO; the negative value is the
*     position of the offending argument in the argument list.
*
      info = 0
      lower = lsame( uplo, 'L' )
      IF( .NOT.lsame( uplo, 'U' ) .AND. .NOT.lower ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ncvt.LT.0 ) THEN
         info = -3
      ELSE IF( nru.LT.0 ) THEN
         info = -4
      ELSE IF( ncc.LT.0 ) THEN
         info = -5
      ELSE IF( ( ncvt.EQ.0 .AND. ldvt.LT.1 ) .OR.
     $         ( ncvt.GT.0 .AND. ldvt.LT.max( 1, n ) ) ) THEN
         info = -9
      ELSE IF( ldu.LT.max( 1, nru ) ) THEN
         info = -11
      ELSE IF( ( ncc.EQ.0 .AND. ldc.LT.1 ) .OR.
     $         ( ncc.GT.0 .AND. ldc.LT.max( 1, n ) ) ) THEN
         info = -13
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DBDSQR', -info )
         RETURN
      END IF
*
*     Quick returns: nothing to do for N = 0; for N = 1 skip the
*     iteration and go straight to the sign fix-up at label 160.
*
      IF( n.EQ.0 )
     $   RETURN
      IF( n.EQ.1 )
     $   GO TO 160
*
*     ROTATE is true if any singular vectors desired, false otherwise
*
      rotate = ( ncvt.GT.0 ) .OR. ( nru.GT.0 ) .OR. ( ncc.GT.0 )
*
*     If no singular vectors desired, use qd algorithm
*
      IF( .NOT.rotate ) THEN
*
*        NOTE(review): WORK is passed unchanged to DLASQ1, whose
*        workspace requirement is not visible in this listing;
*        confirm it against the WORK size documented for DBDSQR.
*
         CALL dlasq1( n, d, e, work, info )
*
*     If INFO equals 2, dqds didn't finish, try to finish
*     Any other DLASQ1 result, success included, is returned as is.
*     For INFO = 2 the code resets INFO and falls through to the QR
*     iteration below.
*
         IF( info .NE. 2 ) RETURN
         info = 0
      END IF
*
*     Offsets of the rotation segments in WORK (each NM1 long).
*
      nm1 = n - 1
      nm12 = nm1 + nm1
      nm13 = nm12 + nm1
      idir = 0
*
*     Get machine constants
*
      eps = dlamch( 'Epsilon' )
      unfl = dlamch( 'Safe minimum' )
*
*     If matrix lower bidiagonal, rotate to be upper bidiagonal
*     by applying Givens rotations on the left
*     CS is saved in WORK(1:N-1) and SN in WORK(NM1+1:2*NM1).
*
      IF( lower ) THEN
         DO 10 i = 1, n - 1
            CALL dlartg( d( i ), e( i ), cs, sn, r )
            d( i ) = r
            e( i ) = sn*d( i+1 )
            d( i+1 ) = cs*d( i+1 )
            work( i ) = cs
            work( nm1+i ) = sn
   10    CONTINUE
*
*        Update singular vectors if desired
*        WORK( N ) is WORK( NM1+1 ), the start of the SN segment.
*
         IF( nru.GT.0 )
     $      CALL dlasr( 'R', 'V', 'F', nru, n, work( 1 ), work( n ), u,
     $                  ldu )
         IF( ncc.GT.0 )
     $      CALL dlasr( 'L', 'V', 'F', n, ncc, work( 1 ), work( n ), c,
     $                  ldc )
      END IF
*
*     Compute singular values to relative accuracy TOL
*     (By setting TOL to be negative, algorithm will compute
*     singular values to absolute accuracy ABS(TOL)*norm(input matrix))
*     As written, TOLMUL is at least TEN, so TOL is positive here
*     and the TOL.LT.ZERO branches below are not taken.
*
      tolmul = max( ten, min( hndrd, eps**meigth ) )
      tol = tolmul*eps
*
*     Compute approximate maximum, minimum singular values
*
      smax = zero
      DO 20 i = 1, n
         smax = max( smax, abs( d( i ) ) )
   20 CONTINUE
      DO 30 i = 1, n - 1
         smax = max( smax, abs( e( i ) ) )
   30 CONTINUE
      sminl = zero
      IF( tol.GE.zero ) THEN
*
*        Relative accuracy desired
*        SMINOA is the running minimum of the MU recurrence; the
*        loop is left early as soon as it reaches zero.
*
         sminoa = abs( d( 1 ) )
         IF( sminoa.EQ.zero )
     $      GO TO 50
         mu = sminoa
         DO 40 i = 2, n
            mu = abs( d( i ) )*( mu / ( mu+abs( e( i-1 ) ) ) )
            sminoa = min( sminoa, mu )
            IF( sminoa.EQ.zero )
     $         GO TO 50
   40    CONTINUE
   50    CONTINUE
         sminoa = sminoa / sqrt( dble( n ) )
*
*        N*(N*UNFL) is evaluated in floating point because UNFL is
*        DOUBLE PRECISION, so no integer product N*N is formed.
*
         thresh = max( tol*sminoa, maxitr*(n*(n*unfl)) )
      ELSE
*
*        Absolute accuracy desired
*
         thresh = max( abs( tol )*smax, maxitr*(n*(n*unfl)) )
      END IF
*
*     Prepare for main iteration loop for the singular values
*     (MAXITDIVN = MAXITR*N bounds ITERDIVN.  ITERDIVN is advanced
*     once for every N units accumulated in ITER, so the limit
*     corresponds to about MAXITR*N**2 inner-loop passes without
*     forming that product in INTEGER arithmetic.)
*
      maxitdivn = maxitr*n
      iterdivn = 0
      iter = -1
      oldll = -1
      oldm = -1
*
*     M points to last element of unconverged part of matrix
*
      m = n
*
*     Begin main iteration loop
*
   60 CONTINUE
*
*     Check for convergence or exceeding iteration count
*
      IF( m.LE.1 )
     $   GO TO 160
*
*     Fold ITER back into [0,N) and count the overflow in ITERDIVN;
*     reaching MAXITDIVN means failure to converge (label 200).
*
      IF( iter.GE.n ) THEN
         iter = iter - n
         iterdivn = iterdivn + 1
         IF( iterdivn.GE.maxitdivn )
     $      GO TO 200
      END IF
*
*     Find diagonal block of matrix to work on
*     Scan upward from M for the first E(LL) that is at most
*     THRESH; SMAX and SMIN are recomputed over the scanned part.
*
      IF( tol.LT.zero .AND. abs( d( m ) ).LE.thresh )
     $   d( m ) = zero
      smax = abs( d( m ) )
      smin = smax
      DO 70 lll = 1, m - 1
         ll = m - lll
         abss = abs( d( ll ) )
         abse = abs( e( ll ) )
         IF( tol.LT.zero .AND. abss.LE.thresh )
     $      d( ll ) = zero
         IF( abse.LE.thresh )
     $      GO TO 80
         smin = min( smin, abss )
         smax = max( smax, abss, abse )
   70 CONTINUE
*
*     No negligible E found: the block starts at row 1 (LL is set
*     to 0 here and incremented at label 90).
*
      ll = 0
      GO TO 90
   80 CONTINUE
      e( ll ) = zero
*
*     Matrix splits since E(LL) = 0
*
      IF( ll.EQ.m-1 ) THEN
*
*        Convergence of bottom singular value, return to top of loop
*
         m = m - 1
         GO TO 60
      END IF
   90 CONTINUE
      ll = ll + 1
*
*     E(LL) through E(M-1) are nonzero, E(LL-1) is zero
*
      IF( ll.EQ.m-1 ) THEN
*
*        2 by 2 block, handle separately
*        DLASV2 returns SIGMX and SIGMN, stored in D(M-1) and D(M),
*        plus the rotation pairs (COSR,SINR) and (COSL,SINL).
*
         CALL dlasv2( d( m-1 ), e( m-1 ), d( m ), sigmn, sigmx, sinr,
     $                cosr, sinl, cosl )
         d( m-1 ) = sigmx
         e( m-1 ) = zero
         d( m ) = sigmn
*
*        Compute singular vectors, if desired
*        (COSR,SINR) act on rows of VT; (COSL,SINL) act on columns
*        of U and rows of C.
*
         IF( ncvt.GT.0 )
     $      CALL drot( ncvt, vt( m-1, 1 ), ldvt, vt( m, 1 ), ldvt, cosr,
     $                 sinr )
         IF( nru.GT.0 )
     $      CALL drot( nru, u( 1, m-1 ), 1, u( 1, m ), 1, cosl, sinl )
         IF( ncc.GT.0 )
     $      CALL drot( ncc, c( m-1, 1 ), ldc, c( m, 1 ), ldc, cosl,
     $                 sinl )
         m = m - 2
         GO TO 60
      END IF
*
*     If working on new submatrix, choose shift direction
*     (from larger end diagonal element towards smaller)
*     The block is "new" when it does not overlap [OLDLL,OLDM].
*
      IF( ll.GT.oldm .OR. m.LT.oldll ) THEN
         IF( abs( d( ll ) ).GE.abs( d( m ) ) ) THEN
*
*           Chase bulge from top (big end) to bottom (small end)
*
            idir = 1
         ELSE
*
*           Chase bulge from bottom (big end) to top (small end)
*
            idir = 2
         END IF
      END IF
*
*     Apply convergence tests
*     Each successful test zeroes one E entry and restarts at
*     label 60 so the block limits are recomputed.
*
      IF( idir.EQ.1 ) THEN
*
*        Run convergence test in forward direction
*        First apply standard test to bottom of matrix
*
         IF( abs( e( m-1 ) ).LE.abs( tol )*abs( d( m ) ) .OR.
     $       ( tol.LT.zero .AND. abs( e( m-1 ) ).LE.thresh ) ) THEN
            e( m-1 ) = zero
            GO TO 60
         END IF
*
         IF( tol.GE.zero ) THEN
*
*           If relative accuracy desired,
*           apply convergence criterion forward
*           SMINL keeps the minimum of MU for the shift test below.
*
            mu = abs( d( ll ) )
            sminl = mu
            DO 100 lll = ll, m - 1
               IF( abs( e( lll ) ).LE.tol*mu ) THEN
                  e( lll ) = zero
                  GO TO 60
               END IF
               mu = abs( d( lll+1 ) )*( mu / ( mu+abs( e( lll ) ) ) )
               sminl = min( sminl, mu )
  100       CONTINUE
         END IF
*
      ELSE
*
*        Run convergence test in backward direction
*        First apply standard test to top of matrix
*
         IF( abs( e( ll ) ).LE.abs( tol )*abs( d( ll ) ) .OR.
     $       ( tol.LT.zero .AND. abs( e( ll ) ).LE.thresh ) ) THEN
            e( ll ) = zero
            GO TO 60
         END IF
*
         IF( tol.GE.zero ) THEN
*
*           If relative accuracy desired,
*           apply convergence criterion backward
*
            mu = abs( d( m ) )
            sminl = mu
            DO 110 lll = m - 1, ll, -1
               IF( abs( e( lll ) ).LE.tol*mu ) THEN
                  e( lll ) = zero
                  GO TO 60
               END IF
               mu = abs( d( lll ) )*( mu / ( mu+abs( e( lll ) ) ) )
               sminl = min( sminl, mu )
  110       CONTINUE
         END IF
      END IF
*
*     Remember the block just tested for the "new submatrix" check.
*
      oldll = ll
      oldm = m
*
*     Compute shift.  First, test if shifting would ruin relative
*     accuracy, and if so set the shift to zero.
*
      IF( tol.GE.zero .AND. n*tol*( sminl / smax ).LE.
     $    max( eps, hndrth*tol ) ) THEN
*
*        Use a zero shift to avoid loss of relative accuracy
*
         shift = zero
      ELSE
*
*        Compute the shift from 2-by-2 block at end of matrix
*        The 2-by-2 block is taken from the end the chase moves
*        towards; SLL is the diagonal entry at the starting end.
*
         IF( idir.EQ.1 ) THEN
            sll = abs( d( ll ) )
            CALL dlas2( d( m-1 ), e( m-1 ), d( m ), shift, r )
         ELSE
            sll = abs( d( m ) )
            CALL dlas2( d( ll ), e( ll ), d( ll+1 ), shift, r )
         END IF
*
*        Test if shift negligible, and if so set to zero
*
         IF( sll.GT.zero ) THEN
            IF( ( shift / sll )**2.LT.eps )
     $         shift = zero
         END IF
      END IF
*
*     Increment iteration count
*     (by M-LL, the number of rotation steps in this sweep)
*
      iter = iter + m - ll
*
*     If SHIFT = 0, do simplified QR iteration
*
      IF( shift.EQ.zero ) THEN
         IF( idir.EQ.1 ) THEN
*
*           Chase bulge from top to bottom
*           Save cosines and sines for later singular vector updates
*           WORK segments, indexed by I-LL+1:
*              1: CS   2: SN   3: OLDCS   4: OLDSN
*
            cs = one
            oldcs = one
            DO 120 i = ll, m - 1
               CALL dlartg( d( i )*cs, e( i ), cs, sn, r )
               IF( i.GT.ll )
     $            e( i-1 ) = oldsn*r
               CALL dlartg( oldcs*r, d( i+1 )*sn, oldcs, oldsn, d( i ) )
               work( i-ll+1 ) = cs
               work( i-ll+1+nm1 ) = sn
               work( i-ll+1+nm12 ) = oldcs
               work( i-ll+1+nm13 ) = oldsn
  120       CONTINUE
            h = d( m )*cs
            d( m ) = h*oldcs
            e( m-1 ) = h*oldsn
*
*           Update singular vectors
*           Segments 1/2 go to VT; segments 3/4 go to U and C.
*           WORK( N ) is WORK( NM1+1 ), the start of segment 2.
*
            IF( ncvt.GT.0 )
     $         CALL dlasr( 'L', 'V', 'F', m-ll+1, ncvt, work( 1 ),
     $                     work( n ), vt( ll, 1 ), ldvt )
            IF( nru.GT.0 )
     $         CALL dlasr( 'R', 'V', 'F', nru, m-ll+1, work( nm12+1 ),
     $                     work( nm13+1 ), u( 1, ll ), ldu )
            IF( ncc.GT.0 )
     $         CALL dlasr( 'L', 'V', 'F', m-ll+1, ncc, work( nm12+1 ),
     $                     work( nm13+1 ), c( ll, 1 ), ldc )
*
*           Test convergence
*
            IF( abs( e( m-1 ) ).LE.thresh )
     $         e( m-1 ) = zero
*
         ELSE
*
*           Chase bulge from bottom to top
*           Save cosines and sines for later singular vector updates
*           Same four segments, indexed by I-LL, with the sines
*           stored negated.
*
            cs = one
            oldcs = one
            DO 130 i = m, ll + 1, -1
               CALL dlartg( d( i )*cs, e( i-1 ), cs, sn, r )
               IF( i.LT.m )
     $            e( i ) = oldsn*r
               CALL dlartg( oldcs*r, d( i-1 )*sn, oldcs, oldsn, d( i ) )
               work( i-ll ) = cs
               work( i-ll+nm1 ) = -sn
               work( i-ll+nm12 ) = oldcs
               work( i-ll+nm13 ) = -oldsn
  130       CONTINUE
            h = d( ll )*cs
            d( ll ) = h*oldcs
            e( ll ) = h*oldsn
*
*           Update singular vectors
*           In this direction segments 3/4 go to VT and segments
*           1/2 go to U and C.
*
            IF( ncvt.GT.0 )
     $         CALL dlasr( 'L', 'V', 'B', m-ll+1, ncvt, work( nm12+1 ),
     $                     work( nm13+1 ), vt( ll, 1 ), ldvt )
            IF( nru.GT.0 )
     $         CALL dlasr( 'R', 'V', 'B', nru, m-ll+1, work( 1 ),
     $                     work( n ), u( 1, ll ), ldu )
            IF( ncc.GT.0 )
     $         CALL dlasr( 'L', 'V', 'B', m-ll+1, ncc, work( 1 ),
     $                     work( n ), c( ll, 1 ), ldc )
*
*           Test convergence
*
            IF( abs( e( ll ) ).LE.thresh )
     $         e( ll ) = zero
         END IF
      ELSE
*
*        Use nonzero shift
*
         IF( idir.EQ.1 ) THEN
*
*           Chase bulge from top to bottom
*           Save cosines and sines for later singular vector updates
*           WORK segments, indexed by I-LL+1:
*              1: COSR   2: SINR   3: COSL   4: SINL
*
            f = ( abs( d( ll ) )-shift )*
     $          ( sign( one, d( ll ) )+shift / d( ll ) )
            g = e( ll )
            DO 140 i = ll, m - 1
               CALL dlartg( f, g, cosr, sinr, r )
               IF( i.GT.ll )
     $            e( i-1 ) = r
               f = cosr*d( i ) + sinr*e( i )
               e( i ) = cosr*e( i ) - sinr*d( i )
               g = sinr*d( i+1 )
               d( i+1 ) = cosr*d( i+1 )
               CALL dlartg( f, g, cosl, sinl, r )
               d( i ) = r
               f = cosl*e( i ) + sinl*d( i+1 )
               d( i+1 ) = cosl*d( i+1 ) - sinl*e( i )
               IF( i.LT.m-1 ) THEN
                  g = sinl*e( i+1 )
                  e( i+1 ) = cosl*e( i+1 )
               END IF
               work( i-ll+1 ) = cosr
               work( i-ll+1+nm1 ) = sinr
               work( i-ll+1+nm12 ) = cosl
               work( i-ll+1+nm13 ) = sinl
  140       CONTINUE
            e( m-1 ) = f
*
*           Update singular vectors
*           Segments 1/2 go to VT; segments 3/4 go to U and C.
*
            IF( ncvt.GT.0 )
     $         CALL dlasr( 'L', 'V', 'F', m-ll+1, ncvt, work( 1 ),
     $                     work( n ), vt( ll, 1 ), ldvt )
            IF( nru.GT.0 )
     $         CALL dlasr( 'R', 'V', 'F', nru, m-ll+1, work( nm12+1 ),
     $                     work( nm13+1 ), u( 1, ll ), ldu )
            IF( ncc.GT.0 )
     $         CALL dlasr( 'L', 'V', 'F', m-ll+1, ncc, work( nm12+1 ),
     $                     work( nm13+1 ), c( ll, 1 ), ldc )
*
*           Test convergence
*
            IF( abs( e( m-1 ) ).LE.thresh )
     $         e( m-1 ) = zero
*
         ELSE
*
*           Chase bulge from bottom to top
*           Save cosines and sines for later singular vector updates
*           Same four segments, indexed by I-LL, with the sines
*           stored negated.
*
            f = ( abs( d( m ) )-shift )*( sign( one, d( m ) )+shift /
     $          d( m ) )
            g = e( m-1 )
            DO 150 i = m, ll + 1, -1
               CALL dlartg( f, g, cosr, sinr, r )
               IF( i.LT.m )
     $            e( i ) = r
               f = cosr*d( i ) + sinr*e( i-1 )
               e( i-1 ) = cosr*e( i-1 ) - sinr*d( i )
               g = sinr*d( i-1 )
               d( i-1 ) = cosr*d( i-1 )
               CALL dlartg( f, g, cosl, sinl, r )
               d( i ) = r
               f = cosl*e( i-1 ) + sinl*d( i-1 )
               d( i-1 ) = cosl*d( i-1 ) - sinl*e( i-1 )
               IF( i.GT.ll+1 ) THEN
                  g = sinl*e( i-2 )
                  e( i-2 ) = cosl*e( i-2 )
               END IF
               work( i-ll ) = cosr
               work( i-ll+nm1 ) = -sinr
               work( i-ll+nm12 ) = cosl
               work( i-ll+nm13 ) = -sinl
  150       CONTINUE
            e( ll ) = f
*
*           Test convergence
*
            IF( abs( e( ll ) ).LE.thresh )
     $         e( ll ) = zero
*
*           Update singular vectors if desired
*           In this direction segments 3/4 go to VT and segments
*           1/2 go to U and C.
*
            IF( ncvt.GT.0 )
     $         CALL dlasr( 'L', 'V', 'B', m-ll+1, ncvt, work( nm12+1 ),
     $                     work( nm13+1 ), vt( ll, 1 ), ldvt )
            IF( nru.GT.0 )
     $         CALL dlasr( 'R', 'V', 'B', nru, m-ll+1, work( 1 ),
     $                     work( n ), u( 1, ll ), ldu )
            IF( ncc.GT.0 )
     $         CALL dlasr( 'L', 'V', 'B', m-ll+1, ncc, work( 1 ),
     $                     work( n ), c( ll, 1 ), ldc )
         END IF
      END IF
*
*     QR iteration finished, go back and check convergence
*
      GO TO 60
*
*     All singular values converged, so make them positive
*     Only VT is rescaled when an entry of D changes sign.
*
  160 CONTINUE
      DO 170 i = 1, n
         IF( d( i ).LT.zero ) THEN
            d( i ) = -d( i )
*
*           Change sign of singular vectors, if desired
*
            IF( ncvt.GT.0 )
     $         CALL dscal( ncvt, negone, vt( i, 1 ), ldvt )
         END IF
  170 CONTINUE
*
*     Sort the singular values into decreasing order (insertion sort on
*     singular values, but only one transposition per singular vector)
*     As coded, pass I selects the smallest of D(1:N+1-I) and swaps
*     it into position N+1-I; on ties the .LE. test keeps the last
*     occurrence.
*
      DO 190 i = 1, n - 1
*
*        Scan for smallest D(I)
*
         isub = 1
         smin = d( 1 )
         DO 180 j = 2, n + 1 - i
            IF( d( j ).LE.smin ) THEN
               isub = j
               smin = d( j )
            END IF
  180    CONTINUE
         IF( isub.NE.n+1-i ) THEN
*
*           Swap singular values and vectors
*           (rows of VT and C, columns of U)
*
            d( isub ) = d( n+1-i )
            d( n+1-i ) = smin
            IF( ncvt.GT.0 )
     $         CALL dswap( ncvt, vt( isub, 1 ), ldvt, vt( n+1-i, 1 ),
     $                     ldvt )
            IF( nru.GT.0 )
     $         CALL dswap( nru, u( 1, isub ), 1, u( 1, n+1-i ), 1 )
            IF( ncc.GT.0 )
     $         CALL dswap( ncc, c( isub, 1 ), ldc, c( n+1-i, 1 ), ldc )
         END IF
  190 CONTINUE
      GO TO 220
*
*     Maximum number of iterations exceeded, failure to converge
*     INFO is set to the number of entries of E that are still
*     nonzero; D is neither sign-corrected nor sorted on this path.
*
  200 CONTINUE
      info = 0
      DO 210 i = 1, n - 1
         IF( e( i ).NE.zero )
     $      info = info + 1
  210 CONTINUE
  220 CONTINUE
      RETURN
*
*     End of DBDSQR
*

◆ ddisna()

subroutine ddisna	(	character	job,
		integer	m,
		integer	n,
		double precision, dimension( * )	d,
		double precision, dimension( * )	sep,
		integer	info )

DDISNA

Download DDISNA + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DDISNA computes the reciprocal condition numbers for the eigenvectors
!> of a real symmetric or complex Hermitian matrix or for the left or
!> right singular vectors of a general m-by-n matrix. The reciprocal
!> condition number is the 'gap' between the corresponding eigenvalue or
!> singular value and the nearest other one.
!>
!> The bound on the error, measured by angle in radians, in the I-th
!> computed vector is given by
!>
!>        DLAMCH( 'E' ) * ( ANORM / SEP( I ) )
!>
!> where ANORM = 2-norm(A) = max( abs( D(j) ) ).  SEP(I) is not allowed
!> to be smaller than DLAMCH( 'E' )*ANORM in order to limit the size of
!> the error bound.
!>
!> DDISNA may also be used to compute error bounds for eigenvectors of
!> the generalized symmetric definite eigenproblem.
!>

Parameters

[in]	JOB	!> JOB is CHARACTER*1 !> Specifies for which problem the reciprocal condition numbers !> should be computed: !> = 'E': the eigenvectors of a symmetric/Hermitian matrix; !> = 'L': the left singular vectors of a general matrix; !> = 'R': the right singular vectors of a general matrix. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix. M >= 0. !>
[in]	N	!> N is INTEGER !> If JOB = 'L' or 'R', the number of columns of the matrix, !> in which case N >= 0. Ignored if JOB = 'E'. !>
[in]	D	!> D is DOUBLE PRECISION array, dimension (M) if JOB = 'E' !> dimension (min(M,N)) if JOB = 'L' or 'R' !> The eigenvalues (if JOB = 'E') or singular values (if JOB = !> 'L' or 'R') of the matrix, in either increasing or decreasing !> order. If singular values, they must be non-negative. !>
[out]	SEP	!> SEP is DOUBLE PRECISION array, dimension (M) if JOB = 'E' !> dimension (min(M,N)) if JOB = 'L' or 'R' !> The reciprocal condition numbers of the vectors. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 116 of file ddisna.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DDISNA.  For every value in D the gap to its nearest
*     neighbour is written to SEP, after which each gap is bounded
*     below by a threshold derived from the machine precision.
*
*     .. Scalar Arguments ..
      CHARACTER          JOB
      INTEGER            INFO, M, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   D( * ), SEP( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO
      parameter( zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
*     WANTE/WANTL/WANTR  decoded JOB ('E', 'L', 'R')
*     WANTSV             JOB asks for singular vectors ('L' or 'R')
*     ASCEND/DESCND      D is in non-decreasing / non-increasing order
*     NVAL               number of values held in D
      LOGICAL            ASCEND, DESCND, WANTE, WANTL, WANTR, WANTSV
      INTEGER            IDX, NVAL
      DOUBLE PRECISION   DNORM, GAPNXT, GAPPRV, SEPMIN, SFMIN, ULP
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           lsame, dlamch
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Executable Statements ..
*
*     Decode JOB and derive the number of values in D
*
      info = 0
      wante = lsame( job, 'E' )
      wantl = lsame( job, 'L' )
      wantr = lsame( job, 'R' )
      wantsv = wantl .OR. wantr
      IF( wante ) THEN
         nval = m
      ELSE IF( wantsv ) THEN
         nval = min( m, n )
      END IF
*
*     Validate the arguments.  The ordering of D is only examined
*     once JOB, M and the derived length have been accepted.
*
      IF( .NOT.( wante .OR. wantsv ) ) THEN
         info = -1
      ELSE IF( m.LT.0 ) THEN
         info = -2
      ELSE IF( nval.LT.0 ) THEN
         info = -3
      ELSE
         ascend = .true.
         descnd = .true.
         DO idx = 1, nval - 1
            ascend = ascend .AND. d( idx ).LE.d( idx+1 )
            descnd = descnd .AND. d( idx ).GE.d( idx+1 )
         END DO
*
*        Singular values must additionally be non-negative: test
*        the smallest entry for the ordering being checked.
*
         IF( wantsv .AND. nval.GT.0 ) THEN
            ascend = ascend .AND. zero.LE.d( 1 )
            descnd = descnd .AND. d( nval ).GE.zero
         END IF
         IF( .NOT.ascend .AND. .NOT.descnd ) info = -4
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DDISNA', -info )
         RETURN
      END IF
*
*     Nothing to compute for an empty spectrum
*
      IF( nval.EQ.0 ) RETURN
*
*     Gap between each value and its nearest neighbour
*
      IF( nval.EQ.1 ) THEN
         sep( 1 ) = dlamch( 'O' )
      ELSE
         gapprv = abs( d( 2 )-d( 1 ) )
         sep( 1 ) = gapprv
         DO idx = 2, nval - 1
            gapnxt = abs( d( idx+1 )-d( idx ) )
            sep( idx ) = min( gapprv, gapnxt )
            gapprv = gapnxt
         END DO
         sep( nval ) = gapprv
      END IF
*
*     Left vectors with M > N, or right vectors with M < N: the
*     smallest value itself also limits its own gap.
*
      IF( ( wantl .AND. m.GT.n ) .OR. ( wantr .AND. m.LT.n ) ) THEN
         IF( ascend ) sep( 1 ) = min( sep( 1 ), d( 1 ) )
         IF( descnd ) sep( nval ) = min( sep( nval ), d( nval ) )
      END IF
*
*     Bound every gap below by a threshold so that the resulting
*     error bound stays limited in size
*
      ulp = dlamch( 'E' )
      sfmin = dlamch( 'S' )
      dnorm = max( abs( d( 1 ) ), abs( d( nval ) ) )
      IF( dnorm.NE.zero ) THEN
         sepmin = max( ulp*dnorm, sfmin )
      ELSE
         sepmin = ulp
      END IF
      DO idx = 1, nval
         sep( idx ) = max( sep( idx ), sepmin )
      END DO
*
      RETURN
*
*     End of DDISNA
*

◆ dlaed0()

subroutine dlaed0	(	integer	icompq,
		integer	qsiz,
		integer	n,
		double precision, dimension( * )	d,
		double precision, dimension( * )	e,
		double precision, dimension( ldq, * )	q,
		integer	ldq,
		double precision, dimension( ldqs, * )	qstore,
		integer	ldqs,
		double precision, dimension( * )	work,
		integer, dimension( * )	iwork,
		integer	info )

DLAED0 used by DSTEDC. Computes all eigenvalues and corresponding eigenvectors of an unreduced symmetric tridiagonal matrix using the divide and conquer method.

Download DLAED0 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAED0 computes all eigenvalues and corresponding eigenvectors of a
!> symmetric tridiagonal matrix using the divide and conquer method.
!>

Parameters

[in]	ICOMPQ	!> ICOMPQ is INTEGER !> = 0: Compute eigenvalues only. !> = 1: Compute eigenvectors of original dense symmetric matrix !> also. On entry, Q contains the orthogonal matrix used !> to reduce the original matrix to tridiagonal form. !> = 2: Compute eigenvalues and eigenvectors of tridiagonal !> matrix. !>
[in]	QSIZ	!> QSIZ is INTEGER !> The dimension of the orthogonal matrix used to reduce !> the full matrix to tridiagonal form. QSIZ >= N if ICOMPQ = 1. !>
[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in,out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> On entry, the main diagonal of the tridiagonal matrix. !> On exit, its eigenvalues. !>
[in]	E	!> E is DOUBLE PRECISION array, dimension (N-1) !> The off-diagonal elements of the tridiagonal matrix. !> On exit, E has been destroyed. !>
[in,out]	Q	!> Q is DOUBLE PRECISION array, dimension (LDQ, N) !> On entry, Q must contain an N-by-N orthogonal matrix. !> If ICOMPQ = 0 Q is not referenced. !> If ICOMPQ = 1 On entry, Q is a subset of the columns of the !> orthogonal matrix used to reduce the full !> matrix to tridiagonal form corresponding to !> the subset of the full matrix which is being !> decomposed at this time. !> If ICOMPQ = 2 On entry, Q will be the identity matrix. !> On exit, Q contains the eigenvectors of the !> tridiagonal matrix. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. If eigenvectors are !> desired, then LDQ >= max(1,N). In any case, LDQ >= 1. !>
[out]	QSTORE	!> QSTORE is DOUBLE PRECISION array, dimension (LDQS, N) !> Referenced only when ICOMPQ = 1. Used to store parts of !> the eigenvector matrix when the updating matrix multiplies !> take place. !>
[in]	LDQS	!> LDQS is INTEGER !> The leading dimension of the array QSTORE. If ICOMPQ = 1, !> then LDQS >= max(1,N). In any case, LDQS >= 1. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, !> If ICOMPQ = 0 or 1, the dimension of WORK must be at least !> 1 + 3*N + 2*N*lg N + 3*N**2 !> ( lg( N ) = smallest integer k !> such that 2^k >= N ) !> If ICOMPQ = 2, the dimension of WORK must be at least !> 4*N + N**2. !>
[out]	IWORK	!> IWORK is INTEGER array, !> If ICOMPQ = 0 or 1, the dimension of IWORK must be at least !> 6 + 6*N + 5*N*lg N. !> ( lg( N ) = smallest integer k !> such that 2^k >= N ) !> If ICOMPQ = 2, the dimension of IWORK must be at least !> 3 + 5*N. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: The algorithm failed to compute an eigenvalue while !> working on the submatrix lying in rows and columns !> INFO/(N+1) through mod(INFO,N+1). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA

Definition at line 170 of file dlaed0.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            ICOMPQ, INFO, LDQ, LDQS, N, QSIZ
*     ..
*     .. Array Arguments ..
      INTEGER            IWORK( * )
      DOUBLE PRECISION   D( * ), E( * ), Q( LDQ, * ), QSTORE( LDQS, * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE, TWO
      parameter( zero = 0.d0, one = 1.d0, two = 2.d0 )
*     ..
*     .. Local Scalars ..
      INTEGER            CURLVL, CURPRB, CURR, I, IGIVCL, IGIVNM,
     $                   IGIVPT, INDXQ, IPERM, IPRMPT, IQ, IQPTR, IWREM,
     $                   J, K, LGN, MATSIZ, MSD2, SMLSIZ, SMM1, SPM1,
     $                   SPM2, SUBMAT, SUBPBS, TLVLS
      DOUBLE PRECISION   TEMP
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dgemm, dlacpy, dlaed1, dlaed7, dsteqr,
     $                   xerbla
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, dble, int, log, max
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
      IF( icompq.LT.0 .OR. icompq.GT.2 ) THEN
         info = -1
      ELSE IF( ( icompq.EQ.1 ) .AND. ( qsiz.LT.max( 0, n ) ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -7
      ELSE IF( ldqs.LT.max( 1, n ) ) THEN
         info = -9
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DLAED0', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
      smlsiz = ilaenv( 9, 'DLAED0', ' ', 0, 0, 0, 0 )
*
*     Determine the size and placement of the submatrices, and save in
*     the leading elements of IWORK.
*
      iwork( 1 ) = n
      subpbs = 1
      tlvls = 0
   10 CONTINUE
      IF( iwork( subpbs ).GT.smlsiz ) THEN
         DO 20 j = subpbs, 1, -1
            iwork( 2*j ) = ( iwork( j )+1 ) / 2
            iwork( 2*j-1 ) = iwork( j ) / 2
   20    CONTINUE
         tlvls = tlvls + 1
         subpbs = 2*subpbs
         GO TO 10
      END IF
      DO 30 j = 2, subpbs
         iwork( j ) = iwork( j ) + iwork( j-1 )
   30 CONTINUE
*
*     Divide the matrix into SUBPBS submatrices of size at most SMLSIZ+1
*     using rank-1 modifications (cuts).
*
      spm1 = subpbs - 1
      DO 40 i = 1, spm1
         submat = iwork( i ) + 1
         smm1 = submat - 1
         d( smm1 ) = d( smm1 ) - abs( e( smm1 ) )
         d( submat ) = d( submat ) - abs( e( smm1 ) )
   40 CONTINUE
*
      indxq = 4*n + 3
      IF( icompq.NE.2 ) THEN
*
*        Set up workspaces for eigenvalues only/accumulate new vectors
*        routine
*
         temp = log( dble( n ) ) / log( two )
         lgn = int( temp )
         IF( 2**lgn.LT.n )
     $      lgn = lgn + 1
         IF( 2**lgn.LT.n )
     $      lgn = lgn + 1
         iprmpt = indxq + n + 1
         iperm = iprmpt + n*lgn
         iqptr = iperm + n*lgn
         igivpt = iqptr + n + 2
         igivcl = igivpt + n*lgn
*
         igivnm = 1
         iq = igivnm + 2*n*lgn
         iwrem = iq + n**2 + 1
*
*        Initialize pointers
*
         DO 50 i = 0, subpbs
            iwork( iprmpt+i ) = 1
            iwork( igivpt+i ) = 1
   50    CONTINUE
         iwork( iqptr ) = 1
      END IF
*
*     Solve each submatrix eigenproblem at the bottom of the divide and
*     conquer tree.
*
      curr = 0
      DO 70 i = 0, spm1
         IF( i.EQ.0 ) THEN
            submat = 1
            matsiz = iwork( 1 )
         ELSE
            submat = iwork( i ) + 1
            matsiz = iwork( i+1 ) - iwork( i )
         END IF
         IF( icompq.EQ.2 ) THEN
            CALL dsteqr( 'I', matsiz, d( submat ), e( submat ),
     $                   q( submat, submat ), ldq, work, info )
            IF( info.NE.0 )
     $         GO TO 130
         ELSE
            CALL dsteqr( 'I', matsiz, d( submat ), e( submat ),
     $                   work( iq-1+iwork( iqptr+curr ) ), matsiz, work,
     $                   info )
            IF( info.NE.0 )
     $         GO TO 130
            IF( icompq.EQ.1 ) THEN
               CALL dgemm( 'N', 'N', qsiz, matsiz, matsiz, one,
     $                     q( 1, submat ), ldq, work( iq-1+iwork( iqptr+
     $                     curr ) ), matsiz, zero, qstore( 1, submat ),
     $                     ldqs )
            END IF
            iwork( iqptr+curr+1 ) = iwork( iqptr+curr ) + matsiz**2
            curr = curr + 1
         END IF
         k = 1
         DO 60 j = submat, iwork( i+1 )
            iwork( indxq+j ) = k
            k = k + 1
   60    CONTINUE
   70 CONTINUE
*
*     Successively merge eigensystems of adjacent submatrices
*     into eigensystem for the corresponding larger matrix.
*
*     while ( SUBPBS > 1 )
*
      curlvl = 1
   80 CONTINUE
      IF( subpbs.GT.1 ) THEN
         spm2 = subpbs - 2
         DO 90 i = 0, spm2, 2
            IF( i.EQ.0 ) THEN
               submat = 1
               matsiz = iwork( 2 )
               msd2 = iwork( 1 )
               curprb = 0
            ELSE
               submat = iwork( i ) + 1
               matsiz = iwork( i+2 ) - iwork( i )
               msd2 = matsiz / 2
               curprb = curprb + 1
            END IF
*
*     Merge lower order eigensystems (of size MSD2 and MATSIZ - MSD2)
*     into an eigensystem of size MATSIZ.
*     DLAED1 is used only for the full eigensystem of a tridiagonal
*     matrix.
*     DLAED7 handles the cases in which eigenvalues only or eigenvalues
*     and eigenvectors of a full symmetric matrix (which was reduced to
*     tridiagonal form) are desired.
*
            IF( icompq.EQ.2 ) THEN
               CALL dlaed1( matsiz, d( submat ), q( submat, submat ),
     $                      ldq, iwork( indxq+submat ),
     $                      e( submat+msd2-1 ), msd2, work,
     $                      iwork( subpbs+1 ), info )
            ELSE
               CALL dlaed7( icompq, matsiz, qsiz, tlvls, curlvl, curprb,
     $                      d( submat ), qstore( 1, submat ), ldqs,
     $                      iwork( indxq+submat ), e( submat+msd2-1 ),
     $                      msd2, work( iq ), iwork( iqptr ),
     $                      iwork( iprmpt ), iwork( iperm ),
     $                      iwork( igivpt ), iwork( igivcl ),
     $                      work( igivnm ), work( iwrem ),
     $                      iwork( subpbs+1 ), info )
            END IF
            IF( info.NE.0 )
     $         GO TO 130
            iwork( i / 2+1 ) = iwork( i+2 )
   90    CONTINUE
         subpbs = subpbs / 2
         curlvl = curlvl + 1
         GO TO 80
      END IF
*
*     end while
*
*     Re-merge the eigenvalues/vectors which were deflated at the final
*     merge step.
*
      IF( icompq.EQ.1 ) THEN
         DO 100 i = 1, n
            j = iwork( indxq+i )
            work( i ) = d( j )
            CALL dcopy( qsiz, qstore( 1, j ), 1, q( 1, i ), 1 )
  100    CONTINUE
         CALL dcopy( n, work, 1, d, 1 )
      ELSE IF( icompq.EQ.2 ) THEN
         DO 110 i = 1, n
            j = iwork( indxq+i )
            work( i ) = d( j )
            CALL dcopy( n, q( 1, j ), 1, work( n*i+1 ), 1 )
  110    CONTINUE
         CALL dcopy( n, work, 1, d, 1 )
         CALL dlacpy( 'A', n, n, work( n+1 ), n, q, ldq )
      ELSE
         DO 120 i = 1, n
            j = iwork( indxq+i )
            work( i ) = d( j )
  120    CONTINUE
         CALL dcopy( n, work, 1, d, 1 )
      END IF
      GO TO 140
*
  130 CONTINUE
      info = submat*( n+1 ) + submat + matsiz - 1
*
  140 CONTINUE
      RETURN
*
*     End of DLAED0
*

◆ dlaed1()

subroutine dlaed1	(	integer	n,
		double precision, dimension( * )	d,
		double precision, dimension( ldq, * )	q,
		integer	ldq,
		integer, dimension( * )	indxq,
		double precision	rho,
		integer	cutpnt,
		double precision, dimension( * )	work,
		integer, dimension( * )	iwork,
		integer	info )

DLAED1 used by DSTEDC. Computes the updated eigensystem of a diagonal matrix after modification by a rank-one symmetric matrix. Used when the original matrix is tridiagonal.

Download DLAED1 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAED1 computes the updated eigensystem of a diagonal
!> matrix after modification by a rank-one symmetric matrix.  This
!> routine is used only for the eigenproblem which requires all
!> eigenvalues and eigenvectors of a tridiagonal matrix.  DLAED7 handles
!> the case in which eigenvalues only or eigenvalues and eigenvectors
!> of a full symmetric matrix (which was reduced to tridiagonal form)
!> are desired.
!>
!>   T = Q(in) ( D(in) + RHO * Z*Z**T ) Q**T(in) = Q(out) * D(out) * Q**T(out)
!>
!>    where Z = Q**T*u, u is a vector of length N with ones in the
!>    CUTPNT and CUTPNT + 1 th elements and zeros elsewhere.
!>
!>    The eigenvectors of the original matrix are stored in Q, and the
!>    eigenvalues are in D.  The algorithm consists of three stages:
!>
!>       The first stage consists of deflating the size of the problem
!>       when there are multiple eigenvalues or if there is a zero in
!>       the Z vector.  For each such occurrence the dimension of the
!>       secular equation problem is reduced by one.  This stage is
!>       performed by the routine DLAED2.
!>
!>       The second stage consists of calculating the updated
!>       eigenvalues. This is done by finding the roots of the secular
!>       equation via the routine DLAED4 (as called by DLAED3).
!>       This routine also calculates the eigenvectors of the current
!>       problem.
!>
!>       The final stage consists of computing the updated eigenvectors
!>       directly using the updated eigenvalues.  The eigenvectors for
!>       the current problem are multiplied with the eigenvectors from
!>       the overall problem.
!>

Parameters

[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in,out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> On entry, the eigenvalues of the rank-1-perturbed matrix. !> On exit, the eigenvalues of the repaired matrix. !>
[in,out]	Q	!> Q is DOUBLE PRECISION array, dimension (LDQ,N) !> On entry, the eigenvectors of the rank-1-perturbed matrix. !> On exit, the eigenvectors of the repaired tridiagonal matrix. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N). !>
[in,out]	INDXQ	!> INDXQ is INTEGER array, dimension (N) !> On entry, the permutation which separately sorts the two !> subproblems in D into ascending order. !> On exit, the permutation which will reintegrate the !> subproblems back into sorted order, !> i.e. D( INDXQ( I = 1, N ) ) will be in ascending order. !>
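[in,out]	RHO	!> RHO is DOUBLE PRECISION !> On entry, the subdiagonal entry used to create the rank-1 modification. !> RHO is passed on to DLAED2, which overwrites it with ABS( 2*RHO ), so the caller's value is modified on a normal exit. !>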
[in]	CUTPNT	!> CUTPNT is INTEGER !> The location of the last eigenvalue in the leading sub-matrix. !> min(1,N/2) <= CUTPNT <= N/2. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (4*N + N**2) !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (4*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: if INFO = 1, an eigenvalue did not converge !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA
Modified by Francoise Tisseur, University of Tennessee

Definition at line 161 of file dlaed1.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     DLAED1 merges two adjacent eigensystems of a tridiagonal matrix:
*     it builds the z-vector from Q, lets DLAED2 deflate the problem,
*     lets DLAED3 solve the remaining secular equation, and finally
*     produces in INDXQ the permutation returned by DLAMRG.
*
*     .. Scalar Arguments ..
      INTEGER            CUTPNT, INFO, LDQ, N
      DOUBLE PRECISION   RHO
*     ..
*     .. Array Arguments ..
      INTEGER            INDXQ( * ), IWORK( * )
      DOUBLE PRECISION   D( * ), Q( LDQ, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            HALF, JCOL, JDEFL, JPERM, JSORT, JTYPE,
     $                   KDLAM, KQ2, KS, KW, KZ, NLEAD, NREST, NSEC,
     $                   NTAIL
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dlaed2, dlaed3, dlamrg, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; the first offending one is reported.
*
      info = 0
      half = n / 2
*
      IF( n.LT.0 ) THEN
         info = -1
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -4
      ELSE IF( cutpnt.LT.min( 1, half ) .OR. cutpnt.GT.half ) THEN
         info = -7
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DLAED1', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty problem.
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Offsets into WORK of the arrays handed to DLAED2 and DLAED3:
*     z-vector, DLAMDA, W and Q2, each of the first three N long.
*
      kz = 1
      kdlam = n + 1
      kw = 2*n + 1
      kq2 = 3*n + 1
*
*     Offsets into IWORK of the four integer arrays (each N long)
*     that DLAED2 receives as INDX, INDXC, COLTYP and INDXP.
*
      jsort = 1
      jperm = n + 1
      jtype = 2*n + 1
      jdefl = 3*n + 1
*
*     Assemble the z-vector: row CUTPNT of the leading block of Q
*     followed by the first row of the trailing block.
*
      nrest = n - cutpnt
      CALL dcopy( cutpnt, q( cutpnt, 1 ), ldq, work( kz ), 1 )
      CALL dcopy( nrest, q( cutpnt+1, cutpnt+1 ), ldq,
     $            work( kz+cutpnt ), 1 )
*
*     Deflation step; NSEC receives the order of the secular equation.
*
      CALL dlaed2( nsec, n, cutpnt, d, q, ldq, indxq, rho,
     $             work( kz ), work( kdlam ), work( kw ),
     $             work( kq2 ), iwork( jsort ), iwork( jperm ),
     $             iwork( jdefl ), iwork( jtype ), info )
*
      IF( info.EQ.0 ) THEN
         IF( nsec.NE.0 ) THEN
*
*           The S workspace of DLAED3 starts right after the part of
*           Q2 whose length follows from the column-type counts that
*           DLAED2 left in IWORK( JTYPE ), IWORK( JTYPE+1 ) and
*           IWORK( JTYPE+2 ).
*
            ks = kq2 + cutpnt*( iwork( jtype )+iwork( jtype+1 ) ) +
     $           nrest*( iwork( jtype+1 )+iwork( jtype+2 ) )
*
*           Solve the secular equation and update the eigenvectors.
*
            CALL dlaed3( nsec, n, cutpnt, d, q, ldq, rho,
     $                   work( kdlam ), work( kq2 ), iwork( jperm ),
     $                   iwork( jtype ), work( kw ), work( ks ),
     $                   info )
*
*           Build the INDXQ sorting permutation from the NSEC leading
*           and the N-NSEC trailing entries of D.
*
            IF( info.EQ.0 ) THEN
               nlead = nsec
               ntail = n - nsec
               CALL dlamrg( nlead, ntail, d, 1, -1, indxq )
            END IF
         ELSE
*
*           No secular equation is left: INDXQ is the identity.
*
            DO 30 jcol = 1, n
               indxq( jcol ) = jcol
   30       CONTINUE
         END IF
      END IF
*
      RETURN
*
*     End of DLAED1
*

◆ dlaed2()

subroutine dlaed2	(	integer	k,
		integer	n,
		integer	n1,
		double precision, dimension( * )	d,
		double precision, dimension( ldq, * )	q,
		integer	ldq,
		integer, dimension( * )	indxq,
		double precision	rho,
		double precision, dimension( * )	z,
		double precision, dimension( * )	dlamda,
		double precision, dimension( * )	w,
		double precision, dimension( * )	q2,
		integer, dimension( * )	indx,
		integer, dimension( * )	indxc,
		integer, dimension( * )	indxp,
		integer, dimension( * )	coltyp,
		integer	info )

DLAED2 used by DSTEDC. Merges eigenvalues and deflates secular equation. Used when the original matrix is tridiagonal.

Download DLAED2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAED2 merges the two sets of eigenvalues together into a single
!> sorted set.  Then it tries to deflate the size of the problem.
!> There are two ways in which deflation can occur:  when two or more
!> eigenvalues are close together or if there is a tiny entry in the
!> Z vector.  For each such occurrence the order of the related secular
!> equation problem is reduced by one.
!>

Parameters

[out]	K	!> K is INTEGER !> The number of non-deflated eigenvalues, and the order of the !> related secular equation. 0 <= K <=N. !>
[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in]	N1	!> N1 is INTEGER !> The location of the last eigenvalue in the leading sub-matrix. !> min(1,N/2) <= N1 <= N/2. !>
[in,out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> On entry, D contains the eigenvalues of the two submatrices to !> be combined. !> On exit, D contains the trailing (N-K) updated eigenvalues !> (those which were deflated) sorted into increasing order. !>
[in,out]	Q	!> Q is DOUBLE PRECISION array, dimension (LDQ, N) !> On entry, Q contains the eigenvectors of two submatrices in !> the two square blocks with corners at (1,1), (N1,N1) !> and (N1+1, N1+1), (N,N). !> On exit, Q contains the trailing (N-K) updated eigenvectors !> (those which were deflated) in its last N-K columns. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N). !>
[in,out]	INDXQ	!> INDXQ is INTEGER array, dimension (N) !> The permutation which separately sorts the two sub-problems !> in D into ascending order. Note that elements in the second !> half of this permutation must first have N1 added to their !> values. Destroyed on exit. !>
[in,out]	RHO	!> RHO is DOUBLE PRECISION !> On entry, the off-diagonal element associated with the rank-1 !> cut which originally split the two submatrices which are now !> being recombined. !> On exit, RHO has been modified to the value required by !> DLAED3. !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, dimension (N) !> On entry, Z contains the updating vector (the last !> row of the first sub-eigenvector matrix and the first row of !> the second sub-eigenvector matrix). !> On exit, the contents of Z have been destroyed by the updating !> process. !>
[out]	DLAMDA	!> DLAMDA is DOUBLE PRECISION array, dimension (N) !> A copy of the first K eigenvalues which will be used by !> DLAED3 to form the secular equation. !>
[out]	W	!> W is DOUBLE PRECISION array, dimension (N) !> The first k values of the final deflation-altered z-vector !> which will be passed to DLAED3. !>
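[out]	Q2	!> Q2 is DOUBLE PRECISION array, dimension (N1**2+(N-N1)**2) !> A copy of the first K eigenvectors which will be used by !> DLAED3 in a matrix multiply (DGEMM) to solve for the new !> eigenvectors. !> Note: the routine also stages full-length (N) copies of deflated !> columns in Q2, and N*N entries when the whole update is negligible, !> so the caller should supply N**2 entries (as DLAED1 does). !>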
[out]	INDX	!> INDX is INTEGER array, dimension (N) !> The permutation used to sort the contents of DLAMDA into !> ascending order. !>
[out]	INDXC	!> INDXC is INTEGER array, dimension (N) !> The permutation used to arrange the columns of the deflated !> Q matrix into three groups: the first group contains non-zero !> elements only at and above N1, the second contains !> non-zero elements only below N1, and the third is dense. !>
[out]	INDXP	!> INDXP is INTEGER array, dimension (N) !> The permutation used to place deflated values of D at the end !> of the array. INDXP(1:K) points to the nondeflated D-values !> and INDXP(K+1:N) points to the deflated eigenvalues. !>
[out]	COLTYP	!> COLTYP is INTEGER array, dimension (N) !> During execution, a label which will indicate which of the !> following types a column in the Q2 matrix is: !> 1 : non-zero in the upper half only; !> 2 : dense; !> 3 : non-zero in the lower half only; !> 4 : deflated. !> On exit, COLTYP(i) is the number of columns of type i, !> for i=1 to 4 only. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA
Modified by Francoise Tisseur, University of Tennessee

Definition at line 210 of file dlaed2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     DLAED2 merges the two eigenvalue sets held in D into one sorted
*     set and deflates the secular equation.  An eigenvalue is
*     deflated when RHO*|z-component| <= TOL, or when a plane rotation
*     between two neighbouring (sorted) eigenvalues can zero one of
*     the two z-components within TOL.
*
*     Effects visible to the caller:
*       K       order of the remaining secular equation
*               ( N minus the number of deflated columns ).
*       RHO     overwritten with ABS( 2*RHO ).
*       INDXQ   entries N1+1..N are shifted by N1.
*       Z       rescaled, then reused as scratch for eigenvalues.
*       DLAMDA, W  poles and z-components of the kept eigenvalues.
*       Q2      eigenvector columns regrouped by column type.
*       D, Q    deflated eigenpairs are copied back into the last
*               N-K entries / columns.
*       COLTYP  on exit COLTYP( 1:4 ) holds the column-type counts.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, LDQ, N, N1
      DOUBLE PRECISION   RHO
*     ..
*     .. Array Arguments ..
      INTEGER            COLTYP( * ), INDX( * ), INDXC( * ), INDXP( * ),
     $                   INDXQ( * )
      DOUBLE PRECISION   D( * ), DLAMDA( * ), Q( LDQ, * ), Q2( * ),
     $                   W( * ), Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   MONE, ZERO, ONE, TWO, EIGHT
      parameter( mone = -1.0d0, zero = 0.0d0, one = 1.0d0,
     $                   two = 2.0d0, eight = 8.0d0 )
*     ..
*     .. Local Arrays ..
      INTEGER            CTOT( 4 ), PSM( 4 )
*     ..
*     .. Local Scalars ..
      INTEGER            CT, I, IMAX, IQ1, IQ2, J, JMAX, JS, K2, N1P1,
     $                   N2, NJ, PJ
      DOUBLE PRECISION   C, EPS, S, T, TAU, TOL
*     ..
*     .. External Functions ..
      INTEGER            IDAMAX
      DOUBLE PRECISION   DLAMCH, DLAPY2
      EXTERNAL           idamax, dlamch, dlapy2
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dlacpy, dlamrg, drot, dscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
      IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -6
      ELSE IF( min( 1, ( n / 2 ) ).GT.n1 .OR. ( n / 2 ).LT.n1 ) THEN
         info = -3
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DLAED2', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
      n2 = n - n1
      n1p1 = n1 + 1
*
*     For a negative RHO the sign is moved into the second part of z,
*     so that the absolute value of RHO can be used below.
*
      IF( rho.LT.zero ) THEN
         CALL dscal( n2, mone, z( n1p1 ), 1 )
      END IF
*
*     Normalize z so that norm(z) = 1.  Since z is the concatenation of
*     two normalized vectors, norm2(z) = sqrt(2).
*
      t = one / sqrt( two )
      CALL dscal( n, t, z, 1 )
*
*     RHO = ABS( norm(z)**2 * RHO )
*
      rho = abs( two*rho )
*
*     Sort the eigenvalues into increasing order.  The second half of
*     INDXQ is relative to the second submatrix, so shift it by N1.
*
      DO 10 i = n1p1, n
         indxq( i ) = indxq( i ) + n1
   10 CONTINUE
*
*     re-integrate the deflated parts from the last pass: DLAMDA holds
*     the two sorted runs, DLAMRG merges them, and INDX becomes the
*     permutation that sorts all of D.
*
      DO 20 i = 1, n
         dlamda( i ) = d( indxq( i ) )
   20 CONTINUE
      CALL dlamrg( n1, n2, dlamda, 1, 1, indxc )
      DO 30 i = 1, n
         indx( i ) = indxq( indxc( i ) )
   30 CONTINUE
*
*     Calculate the allowable deflation tolerance
*
      imax = idamax( n, z, 1 )
      jmax = idamax( n, d, 1 )
      eps = dlamch( 'Epsilon' )
      tol = eight*eps*max( abs( d( jmax ) ), abs( z( imax ) ) )
*
*     If the rank-1 modifier is small enough, no more needs to be done
*     except to reorganize Q so that its columns correspond with the
*     elements in D.  Q2 is used to stage all N columns (N*N entries).
*
      IF( rho*abs( z( imax ) ).LE.tol ) THEN
         k = 0
         iq2 = 1
         DO 40 j = 1, n
            i = indx( j )
            CALL dcopy( n, q( 1, i ), 1, q2( iq2 ), 1 )
            dlamda( j ) = d( i )
            iq2 = iq2 + n
   40    CONTINUE
         CALL dlacpy( 'A', n, n, q2, n, q, ldq )
         CALL dcopy( n, dlamda, 1, d, 1 )
         GO TO 190
      END IF
*
*     If there are multiple eigenvalues then the problem deflates.  Here
*     the number of equal eigenvalues are found.  As each equal
*     eigenvalue is found, a plane rotation is computed (and applied
*     with DROT) to rotate the corresponding eigensubspace so that the
*     corresponding components of Z are zero in this new basis.
*
*     Initial column types: 1 for the first N1 columns, 3 for the rest.
*
      DO 50 i = 1, n1
         coltyp( i ) = 1
   50 CONTINUE
      DO 60 i = n1p1, n
         coltyp( i ) = 3
   60 CONTINUE
*
*     K counts kept eigenvalues from the front of INDXP, K2 marks the
*     start of the deflated ones stored from the back of INDXP.
*
      k = 0
      k2 = n + 1
*
*     Skip leading eigenvalues that deflate because of a small z
*     component; PJ becomes the first candidate that does not.
*     NOTE(review): the J.EQ.N exit looks unreachable here, because
*     the test against Z( IMAX ) above already failed -- confirm.
*
      DO 70 j = 1, n
         nj = indx( j )
         IF( rho*abs( z( nj ) ).LE.tol ) THEN
*
*           Deflate due to small z component.
*
            k2 = k2 - 1
            coltyp( nj ) = 4
            indxp( k2 ) = nj
            IF( j.EQ.n )
     $         GO TO 100
         ELSE
            pj = nj
            GO TO 80
         END IF
   70 CONTINUE
   80 CONTINUE
      j = j + 1
*
*     Test the bound before indexing: INDX has only N entries, so
*     INDX( N+1 ) must not be read on the final pass.
*
      IF( j.GT.n )
     $   GO TO 100
      nj = indx( j )
      IF( rho*abs( z( nj ) ).LE.tol ) THEN
*
*        Deflate due to small z component.
*
         k2 = k2 - 1
         coltyp( nj ) = 4
         indxp( k2 ) = nj
      ELSE
*
*        Check if eigenvalues are close enough to allow deflation.
*
         s = z( pj )
         c = z( nj )
*
*        Find sqrt(a**2+b**2) without overflow or
*        destructive underflow.
*
         tau = dlapy2( c, s )
         t = d( nj ) - d( pj )
         c = c / tau
         s = -s / tau
         IF( abs( t*c*s ).LE.tol ) THEN
*
*           Deflation is possible.  The rotation moves the whole
*           z-weight to NJ; PJ is deflated (type 4) and NJ becomes
*           dense (type 2) when the two columns had different types.
*
            z( nj ) = tau
            z( pj ) = zero
            IF( coltyp( nj ).NE.coltyp( pj ) )
     $         coltyp( nj ) = 2
            coltyp( pj ) = 4
            CALL drot( n, q( 1, pj ), 1, q( 1, nj ), 1, c, s )
            t = d( pj )*c**2 + d( nj )*s**2
            d( nj ) = d( pj )*s**2 + d( nj )*c**2
            d( pj ) = t
*
*           Insert PJ into the deflated tail INDXP( K2:N ) by shifting
*           entries down while D( PJ ) is smaller than their D-value.
*
            k2 = k2 - 1
            i = 1
   90       CONTINUE
            IF( k2+i.LE.n ) THEN
               IF( d( pj ).LT.d( indxp( k2+i ) ) ) THEN
                  indxp( k2+i-1 ) = indxp( k2+i )
                  indxp( k2+i ) = pj
                  i = i + 1
                  GO TO 90
               ELSE
                  indxp( k2+i-1 ) = pj
               END IF
            ELSE
               indxp( k2+i-1 ) = pj
            END IF
            pj = nj
         ELSE
*
*           No deflation: record PJ as a kept eigenvalue.
*
            k = k + 1
            dlamda( k ) = d( pj )
            w( k ) = z( pj )
            indxp( k ) = pj
            pj = nj
         END IF
      END IF
      GO TO 80
  100 CONTINUE
*
*     Record the last eigenvalue.
*
      k = k + 1
      dlamda( k ) = d( pj )
      w( k ) = z( pj )
      indxp( k ) = pj
*
*     Count up the total number of the various types of columns, then
*     form a permutation which positions the four column types into
*     four uniform groups (although one or more of these groups may be
*     empty).
*
      DO 110 j = 1, 4
         ctot( j ) = 0
  110 CONTINUE
      DO 120 j = 1, n
         ct = coltyp( j )
         ctot( ct ) = ctot( ct ) + 1
  120 CONTINUE
*
*     PSM(*) = Position in SubMatrix (of types 1 through 4)
*
      psm( 1 ) = 1
      psm( 2 ) = 1 + ctot( 1 )
      psm( 3 ) = psm( 2 ) + ctot( 2 )
      psm( 4 ) = psm( 3 ) + ctot( 3 )
      k = n - ctot( 4 )
*
*     Fill out the INDXC array so that the permutation which it induces
*     will place all type-1 columns first, all type-2 columns next,
*     then all type-3's, and finally all type-4's.
*
      DO 130 j = 1, n
         js = indxp( j )
         ct = coltyp( js )
         indx( psm( ct ) ) = js
         indxc( psm( ct ) ) = j
         psm( ct ) = psm( ct ) + 1
  130 CONTINUE
*
*     Sort the eigenvalues and corresponding eigenvectors into DLAMDA
*     and Q2 respectively.  The eigenvalues/vectors which were not
*     deflated go into the first K slots of DLAMDA and Q2 respectively,
*     while those which were deflated go into the last N - K slots.
*
*     Q2 layout: the N1-row parts of the type-1 and type-2 columns
*     start at IQ1 = 1; the N2-row parts of the type-2 and type-3
*     columns start at IQ2.  Z is reused to collect the eigenvalues in
*     the same order.
*
      i = 1
      iq1 = 1
      iq2 = 1 + ( ctot( 1 )+ctot( 2 ) )*n1
      DO 140 j = 1, ctot( 1 )
         js = indx( i )
         CALL dcopy( n1, q( 1, js ), 1, q2( iq1 ), 1 )
         z( i ) = d( js )
         i = i + 1
         iq1 = iq1 + n1
  140 CONTINUE
*
      DO 150 j = 1, ctot( 2 )
         js = indx( i )
         CALL dcopy( n1, q( 1, js ), 1, q2( iq1 ), 1 )
         CALL dcopy( n2, q( n1+1, js ), 1, q2( iq2 ), 1 )
         z( i ) = d( js )
         i = i + 1
         iq1 = iq1 + n1
         iq2 = iq2 + n2
  150 CONTINUE
*
      DO 160 j = 1, ctot( 3 )
         js = indx( i )
         CALL dcopy( n2, q( n1+1, js ), 1, q2( iq2 ), 1 )
         z( i ) = d( js )
         i = i + 1
         iq2 = iq2 + n2
  160 CONTINUE
*
*     Deflated (type-4) columns are stored full length after the
*     blocks above; IQ1 remembers where they start.
*
      iq1 = iq2
      DO 170 j = 1, ctot( 4 )
         js = indx( i )
         CALL dcopy( n, q( 1, js ), 1, q2( iq2 ), 1 )
         iq2 = iq2 + n
         z( i ) = d( js )
         i = i + 1
  170 CONTINUE
*
*     The deflated eigenvalues and their corresponding vectors go back
*     into the last N - K slots of D and Q respectively.
*
      IF( k.LT.n ) THEN
         CALL dlacpy( 'A', n, ctot( 4 ), q2( iq1 ), n,
     $                q( 1, k+1 ), ldq )
         CALL dcopy( n-k, z( k+1 ), 1, d( k+1 ), 1 )
      END IF
*
*     Copy CTOT into COLTYP for referencing in DLAED3.
*
      DO 180 j = 1, 4
         coltyp( j ) = ctot( j )
  180 CONTINUE
*
  190 CONTINUE
      RETURN
*
*     End of DLAED2
*

◆ dlaed3()

subroutine dlaed3	(	integer	k,
		integer	n,
		integer	n1,
		double precision, dimension( * )	d,
		double precision, dimension( ldq, * )	q,
		integer	ldq,
		double precision	rho,
		double precision, dimension( * )	dlamda,
		double precision, dimension( * )	q2,
		integer, dimension( * )	indx,
		integer, dimension( * )	ctot,
		double precision, dimension( * )	w,
		double precision, dimension( * )	s,
		integer	info )

DLAED3 used by DSTEDC. Finds the roots of the secular equation and updates the eigenvectors. Used when the original matrix is tridiagonal.

Download DLAED3 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAED3 finds the roots of the secular equation, as defined by the
!> values in D, W, and RHO, between 1 and K.  It makes the
!> appropriate calls to DLAED4 and then updates the eigenvectors by
!> multiplying the matrix of eigenvectors of the pair of eigensystems
!> being combined by the matrix of eigenvectors of the K-by-K system
!> which is solved here.
!>
!> This code makes very mild assumptions about floating point
!> arithmetic. It will work on machines with a guard digit in
!> add/subtract, or on those binary machines without guard digits
!> which subtract like the Cray X-MP, Cray Y-MP, Cray C-90, or Cray-2.
!> It could conceivably fail on hexadecimal or decimal machines
!> without guard digits, but we know of none.
!>

Parameters

[in]	K	!> K is INTEGER !> The number of terms in the rational function to be solved by !> DLAED4. K >= 0. !>
[in]	N	!> N is INTEGER !> The number of rows and columns in the Q matrix. !> N >= K (deflation may result in N>K). !>
[in]	N1	!> N1 is INTEGER !> The location of the last eigenvalue in the leading submatrix. !> min(1,N) <= N1 <= N/2. !>
[out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> D(I) contains the updated eigenvalues for !> 1 <= I <= K. !>
[out]	Q	!> Q is DOUBLE PRECISION array, dimension (LDQ,N) !> Initially the first K columns are used as workspace. !> On output the columns 1 to K contain !> the updated eigenvectors. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N). !>
[in]	RHO	!> RHO is DOUBLE PRECISION !> The value of the parameter in the rank one update equation. !> RHO >= 0 required. !>
[in,out]	DLAMDA	!> DLAMDA is DOUBLE PRECISION array, dimension (K) !> The first K elements of this array contain the old roots !> of the deflated updating problem. These are the poles !> of the secular equation. May be changed on output by !> having lowest order bit set to zero on Cray X-MP, Cray Y-MP, !> Cray-2, or Cray C-90, as described above. !>
[in]	Q2	!> Q2 is DOUBLE PRECISION array, dimension (LDQ2*N) !> The first K columns of this matrix contain the non-deflated !> eigenvectors for the split problem. !>
[in]	INDX	!> INDX is INTEGER array, dimension (N) !> The permutation used to arrange the columns of the deflated !> Q matrix into three groups (see DLAED2). !> The rows of the eigenvectors found by DLAED4 must be likewise !> permuted before the matrix multiply can take place. !>
[in]	CTOT	!> CTOT is INTEGER array, dimension (4) !> A count of the total number of the various types of columns !> in Q, as described in INDX. The fourth column type is any !> column which has been deflated. !>
[in,out]	W	!> W is DOUBLE PRECISION array, dimension (K) !> The first K elements of this array contain the components !> of the deflation-adjusted updating vector. Destroyed on !> output. !>
[out]	S	!> S is DOUBLE PRECISION array, dimension (N1 + 1)*K !> Will contain the eigenvectors of the repaired matrix which !> will be multiplied by the previously accumulated eigenvectors !> to update the system. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: if INFO = 1, an eigenvalue did not converge !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA
Modified by Francoise Tisseur, University of Tennessee

Definition at line 183 of file dlaed3.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     DLAED3 calls DLAED4 once per root J = 1..K of the secular
*     equation (root returned in D( J ), vector output in column J of
*     Q), rebuilds the z-vector W from those outputs, forms the K
*     normalized eigenvectors of the rank-one problem in Q, and then
*     multiplies the two blocks stored in Q2 by them with DGEMM to
*     obtain the updated eigenvectors in the first K columns of Q.
*     INFO is set to -1, -2 or -6 for an illegal K, N or LDQ, and to
*     the nonzero value returned by DLAED4 if a root finder call fails.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, LDQ, N, N1
      DOUBLE PRECISION   RHO
*     ..
*     .. Array Arguments ..
      INTEGER            CTOT( * ), INDX( * )
      DOUBLE PRECISION   D( * ), DLAMDA( * ), Q( LDQ, * ), Q2( * ),
     $                   S( * ), W( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, ZERO
      parameter( one = 1.0d0, zero = 0.0d0 )
*     ..
*     .. Local Scalars ..
      INTEGER            I, II, IQ2, J, N12, N2, N23
      DOUBLE PRECISION   TEMP
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMC3, DNRM2
      EXTERNAL           dlamc3, dnrm2
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dgemm, dlacpy, dlaed4, dlaset, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, sign, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
      IF( k.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.k ) THEN
         info = -2
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -6
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DLAED3', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( k.EQ.0 )
     $   RETURN
*
*     Modify values DLAMDA(i) to make sure all DLAMDA(i)-DLAMDA(j) can
*     be computed with high relative accuracy (barring over/underflow).
*     This is a problem on machines without a guard digit in
*     add/subtract (Cray XMP, Cray YMP, Cray C 90 and Cray 2).
*     The following code replaces DLAMDA(I) by 2*DLAMDA(I)-DLAMDA(I),
*     which on any of these machines zeros out the bottommost
*     bit of DLAMDA(I) if it is 1; this makes the subsequent
*     subtractions DLAMDA(I)-DLAMDA(J) unproblematic when cancellation
*     occurs. On binary machines with a guard digit (almost all
*     machines) it does not change DLAMDA(I) at all. On hexadecimal
*     and decimal machines with a guard digit, it slightly
*     changes the bottommost bits of DLAMDA(I). It does not account
*     for hexadecimal or decimal machines without guard digits
*     (we know of none). We use a subroutine call to compute
*     2*DLAMDA(I) to prevent optimizing compilers from eliminating
*     this code.
*
      DO 10 i = 1, k
         dlamda( i ) = dlamc3( dlamda( i ), dlamda( i ) ) - dlamda( i )
   10 CONTINUE
*
*     Find the K roots.  Column J of Q receives the DELTA output of
*     DLAED4 for root J (presumably the differences between the poles
*     DLAMDA( i ) and the root -- confirm against DLAED4), and D( J )
*     receives the root itself.
*
      DO 20 j = 1, k
         CALL dlaed4( k, j, dlamda, w, q( 1, j ), rho, d( j ), info )
*
*        If the zero finder fails, the computation is terminated.
*
         IF( info.NE.0 )
     $      GO TO 120
   20 CONTINUE
*
*     K = 1: column 1 of Q is used as returned by DLAED4.
*     K = 2: only the two rows of each column are permuted by INDX,
*     with W( 1:2 ) serving as scratch.
*
      IF( k.EQ.1 )
     $   GO TO 110
      IF( k.EQ.2 ) THEN
         DO 30 j = 1, k
            w( 1 ) = q( 1, j )
            w( 2 ) = q( 2, j )
            ii = indx( 1 )
            q( 1, j ) = w( ii )
            ii = indx( 2 )
            q( 2, j ) = w( ii )
   30    CONTINUE
         GO TO 110
      END IF
*
*     Compute updated W.
*
*     The incoming W is saved in S; only its signs are used below.
*
      CALL dcopy( k, w, 1, s, 1 )
*
*     Initialize W(I) = Q(I,I)
*
*     (a stride of LDQ+1 walks down the diagonal of Q)
*
      CALL dcopy( k, q, ldq+1, w, 1 )
*
*     Multiply W( I ) by Q( I, J ) / ( DLAMDA( I )-DLAMDA( J ) ) for
*     every J different from I; the two inner loops skip I = J.
*
      DO 60 j = 1, k
         DO 40 i = 1, j - 1
            w( i ) = w( i )*( q( i, j ) / ( dlamda( i )-dlamda( j ) ) )
   40    CONTINUE
         DO 50 i = j + 1, k
            w( i ) = w( i )*( q( i, j ) / ( dlamda( i )-dlamda( j ) ) )
   50    CONTINUE
   60 CONTINUE
*
*     W( I ) becomes SQRT( -W( I ) ) carrying the sign of the saved
*     input value S( I ).
*
      DO 70 i = 1, k
         w( i ) = sign( sqrt( -w( i ) ), s( i ) )
   70 CONTINUE
*
*     Compute eigenvectors of the modified rank-1 modification.
*
*     Column J: S( I ) = W( I ) / Q( I, J ), scaled to unit 2-norm and
*     written back to Q with its rows permuted by INDX.
*
      DO 100 j = 1, k
         DO 80 i = 1, k
            s( i ) = w( i ) / q( i, j )
   80    CONTINUE
         temp = dnrm2( k, s, 1 )
         DO 90 i = 1, k
            ii = indx( i )
            q( i, j ) = s( ii ) / temp
   90    CONTINUE
  100 CONTINUE
*
*     Compute the updated eigenvectors.
*
  110 CONTINUE
*
*     N12 and N23 are the column counts of types 1+2 and 2+3 taken
*     from CTOT.
*
      n2 = n - n1
      n12 = ctot( 1 ) + ctot( 2 )
      n23 = ctot( 2 ) + ctot( 3 )
*
*     Lower part: rows CTOT( 1 )+1 .. CTOT( 1 )+N23 of Q are copied to
*     S and multiplied by the N2-by-N23 block of Q2 that starts at
*     IQ2 = N1*N12 + 1, giving rows N1+1 .. N of Q.  With N23 = 0 those
*     rows are set to zero instead.
*
      CALL dlacpy( 'A', n23, k, q( ctot( 1 )+1, 1 ), ldq, s, n23 )
      iq2 = n1*n12 + 1
      IF( n23.NE.0 ) THEN
         CALL dgemm( 'N', 'N', n2, k, n23, one, q2( iq2 ), n2, s, n23,
     $               zero, q( n1+1, 1 ), ldq )
      ELSE
         CALL dlaset( 'A', n2, k, zero, zero, q( n1+1, 1 ), ldq )
      END IF
*
*     Upper part: the first N12 rows of Q are copied to S and
*     multiplied by the leading N1-by-N12 block of Q2, giving rows
*     1 .. N1 of Q.  With N12 = 0 those rows are set to zero instead.
*
      CALL dlacpy( 'A', n12, k, q, ldq, s, n12 )
      IF( n12.NE.0 ) THEN
         CALL dgemm( 'N', 'N', n1, k, n12, one, q2, n1, s, n12, zero, q,
     $               ldq )
      ELSE
         CALL dlaset( 'A', n1, k, zero, zero, q( 1, 1 ), ldq )
      END IF
*
*
  120 CONTINUE
      RETURN
*
*     End of DLAED3
*

◆ dlaed4()

subroutine dlaed4	(	integer	n,
		integer	i,
		double precision, dimension( * )	d,
		double precision, dimension( * )	z,
		double precision, dimension( * )	delta,
		double precision	rho,
		double precision	dlam,
		integer	info )

DLAED4 used by DSTEDC. Finds a single root of the secular equation.

Download DLAED4 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> This subroutine computes the I-th updated eigenvalue of a symmetric
!> rank-one modification to a diagonal matrix whose elements are
!> given in the array D.  It is assumed that
!>
!>            D(i) < D(j)  for  i < j
!>
!> and that RHO > 0.  This is arranged by the calling routine, and is
!> no loss in generality.  The rank-one modified system is thus
!>
!>            diag( D )  +  RHO * Z * Z_transpose.
!>
!> where we assume the Euclidean norm of Z is 1.
!>
!> The method consists of approximating the rational functions in the
!> secular equation by simpler interpolating rational functions.
!>

Parameters

[in]	N	!> N is INTEGER !> The length of all arrays. !>
[in]	I	!> I is INTEGER !> The index of the eigenvalue to be computed. 1 <= I <= N. !>
[in]	D	!> D is DOUBLE PRECISION array, dimension (N) !> The original eigenvalues. It is assumed that they are in !> order, D(I) < D(J) for I < J. !>
[in]	Z	!> Z is DOUBLE PRECISION array, dimension (N) !> The components of the updating vector. !>
[out]	DELTA	!> DELTA is DOUBLE PRECISION array, dimension (N) !> If N > 2, DELTA contains (D(j) - lambda_I) in its j-th !> component. If N = 1, then DELTA(1) = 1. If N = 2, see DLAED5 !> for detail. The vector DELTA contains the information necessary !> to construct the eigenvectors by DLAED3 and DLAED9. !>
[in]	RHO	!> RHO is DOUBLE PRECISION !> The scalar in the symmetric updating formula. !>
[out]	DLAM	!> DLAM is DOUBLE PRECISION !> The computed lambda_I, the I-th updated eigenvalue. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> > 0: if INFO = 1, the updating process failed. !>

Internal Parameters:

!>  Logical variable ORGATI (origin-at-i?) is used for distinguishing
!>  whether D(i) or D(i+1) is treated as the origin.
!>
!>            ORGATI = .true.    origin at i
!>            ORGATI = .false.   origin at i+1
!>
!>   Logical variable SWTCH3 (switch-for-3-poles?) is for noting
!>   if we are working with THREE poles!
!>
!>   MAXIT is the maximum number of iterations allowed for each
!>   eigenvalue.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Ren-Cang Li, Computer Science Division, University of California at Berkeley, USA

Definition at line 144 of file dlaed4.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Reader's overview of this body
*     ------------------------------
*     Computes DLAM, the I-th updated eigenvalue of
*     diag( D ) + RHO * Z * Z**T, as  D(origin) + TAU  where TAU is
*     refined iteratively.  For N > 2, DELTA(j) is kept equal to
*     ( D(j) - D(origin) ) - TAU throughout, i.e. D(j) minus the
*     current eigenvalue estimate.
*
*     Structure:
*       N = 1        closed form, DELTA(1) = 1.
*       N = 2        delegated to DLAED5.
*       I = N        origin is D(N); two-pole steps on poles N-1, N.
*       I < N        origin is D(I) or D(I+1) (see ORGATI); steps use
*                    two poles, or three poles through DLAED6.
*
*     INFO on exit:
*       0   set on entry and left unchanged on convergence.
*       1   set after the iteration count reaches MAXIT.
*       A nonzero INFO returned by DLAED6 causes an immediate jump to
*       the exit label; DLAM is not assigned by this routine on that
*       path.
*
*     .. Scalar Arguments ..
      INTEGER            I, INFO, N
      DOUBLE PRECISION   DLAM, RHO
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   D( * ), DELTA( * ), Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     MAXIT caps the loop counter NITER of the two main loops below.
      INTEGER            MAXIT
      parameter( maxit = 30 )
      DOUBLE PRECISION   ZERO, ONE, TWO, THREE, FOUR, EIGHT, TEN
      parameter( zero = 0.0d0, one = 1.0d0, two = 2.0d0,
     $                   three = 3.0d0, four = 4.0d0, eight = 8.0d0,
     $                   ten = 10.0d0 )
*     ..
*     .. Local Scalars ..
*     ORGATI  .TRUE. when D(I) is the origin, .FALSE. for D(I+1).
*     SWTCH3  .TRUE. when the step is computed by DLAED6 (three poles).
*     SWTCH   toggles the alternative formula for C (and ZZ) in the
*             I < N main loop.
*     II      index of the origin pole (N-1 is used in the I = N case
*             as the upper limit of the PSI sums).
*     TAU     current offset of the eigenvalue estimate from the origin.
*     ETA     correction added to TAU in each step.
*     DLTLB, DLTUB  lower / upper bounds maintained on TAU.
*     PSI, DPSI     sums of Z(j)**2/DELTA(j) and (Z(j)/DELTA(j))**2
*                   over the poles below the origin term.
*     PHI, DPHI     the same sums over the poles above it.
*     W       value of the secular function at the current TAU.
*     DW      DPSI + DPHI plus the II-th squared term.
*     ERRETM  scale used in the stopping test ABS(W) <= EPS*ERRETM.
*     PREW    value of W from the previous step.
      LOGICAL            ORGATI, SWTCH, SWTCH3
      INTEGER            II, IIM1, IIP1, IP1, ITER, J, NITER
      DOUBLE PRECISION   A, B, C, DEL, DLTLB, DLTUB, DPHI, DPSI, DW,
     $                   EPS, ERRETM, ETA, MIDPT, PHI, PREW, PSI,
     $                   RHOINV, TAU, TEMP, TEMP1, W
*     ..
*     .. Local Arrays ..
*     ZZ holds the three numerators passed to DLAED6.
      DOUBLE PRECISION   ZZ( 3 )
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           dlamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlaed5, dlaed6
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     Since this routine is called in an inner loop, we do no argument
*     checking.
*
*     Quick return for N=1 and 2.
*
      info = 0
      IF( n.EQ.1 ) THEN
*
*         Presumably, I=1 upon entry
*
         dlam = d( 1 ) + rho*z( 1 )*z( 1 )
         delta( 1 ) = one
         RETURN
      END IF
      IF( n.EQ.2 ) THEN
*
*        DLAED5 sets both DLAM and DELTA; INFO stays 0.
*
         CALL dlaed5( i, d, z, delta, rho, dlam )
         RETURN
      END IF
*
*     Compute machine epsilon
*
      eps = dlamch( 'Epsilon' )
      rhoinv = one / rho
*
*     The case I = N
*
      IF( i.EQ.n ) THEN
*
*        Initialize some basic variables
*
*        II = N-1 is the last pole included in the PSI sums; the
*        N-th pole is handled separately as PHI.
*
         ii = n - 1
         niter = 1
*
*        Calculate initial guess
*
         midpt = rho / two
*
*        If ||Z||_2 is not one, then MIDPT should be set to
*        RHO * ||Z||_2^2 / TWO
*
*        DELTA is first set up for the trial offset TAU = MIDPT.
*
         DO 10 j = 1, n
            delta( j ) = ( d( j )-d( i ) ) - midpt
   10    CONTINUE
*
         psi = zero
         DO 20 j = 1, n - 2
            psi = psi + z( j )*z( j ) / delta( j )
   20    CONTINUE
*
*        C collects RHOINV and the terms of poles 1..N-2; W adds the
*        terms of poles N-1 and N, giving the secular function at
*        TAU = MIDPT.
*
         c = rhoinv + psi
         w = c + z( ii )*z( ii ) / delta( ii ) +
     $       z( n )*z( n ) / delta( n )
*
         IF( w.LE.zero ) THEN
*
*           TEMP is minus the sum of the (N-1)-th and N-th terms
*           evaluated at TAU = RHO (where D(N)-D(N)-TAU = -RHO).
*
            temp = z( n-1 )*z( n-1 ) / ( d( n )-d( n-1 )+rho ) +
     $             z( n )*z( n ) / rho
            IF( c.LE.temp ) THEN
               tau = rho
            ELSE
*
*              Starting TAU from C and poles N-1, N only.  The branch
*              on the sign of A picks the form in which the two
*              quantities being combined have the same sign.
*
               del = d( n ) - d( n-1 )
               a = -c*del + z( n-1 )*z( n-1 ) + z( n )*z( n )
               b = z( n )*z( n )*del
               IF( a.LT.zero ) THEN
                  tau = two*b / ( sqrt( a*a+four*b*c )-a )
               ELSE
                  tau = ( a+sqrt( a*a+four*b*c ) ) / ( two*c )
               END IF
            END IF
*
*           It can be proved that
*               D(N)+RHO/2 <= LAMBDA(N) < D(N)+TAU <= D(N)+RHO
*
            dltlb = midpt
            dltub = rho
         ELSE
*
*           Same starting formula as in the W <= 0 branch above; only
*           the bounds on TAU differ.
*
            del = d( n ) - d( n-1 )
            a = -c*del + z( n-1 )*z( n-1 ) + z( n )*z( n )
            b = z( n )*z( n )*del
            IF( a.LT.zero ) THEN
               tau = two*b / ( sqrt( a*a+four*b*c )-a )
            ELSE
               tau = ( a+sqrt( a*a+four*b*c ) ) / ( two*c )
            END IF
*
*           It can be proved that
*               D(N) < D(N)+TAU < LAMBDA(N) < D(N)+RHO/2
*
            dltlb = zero
            dltub = midpt
         END IF
*
*        Re-base DELTA on the starting TAU just chosen.
*
         DO 30 j = 1, n
            delta( j ) = ( d( j )-d( i ) ) - tau
   30    CONTINUE
*
*        Evaluate PSI and the derivative DPSI
*
*        ERRETM accumulates the running partial sums of PSI.
*
         dpsi = zero
         psi = zero
         erretm = zero
         DO 40 j = 1, ii
            temp = z( j ) / delta( j )
            psi = psi + z( j )*temp
            dpsi = dpsi + temp*temp
            erretm = erretm + psi
   40    CONTINUE
         erretm = abs( erretm )
*
*        Evaluate PHI and the derivative DPHI
*
         temp = z( n ) / delta( n )
         phi = z( n )*temp
         dphi = temp*temp
         erretm = eight*( -phi-psi ) + erretm - phi + rhoinv +
     $            abs( tau )*( dpsi+dphi )
*
         w = rhoinv + phi + psi
*
*        Test for convergence
*
         IF( abs( w ).LE.eps*erretm ) THEN
            dlam = d( i ) + tau
            GO TO 250
         END IF
*
*        Tighten the bounds on TAU: the current TAU becomes the new
*        lower bound when W <= 0 and the new upper bound otherwise.
*
         IF( w.LE.zero ) THEN
            dltlb = max( dltlb, tau )
         ELSE
            dltub = min( dltub, tau )
         END IF
*
*        Calculate the new step
*
*        A, B, C are built from W, DPSI, DPHI and the last two
*        DELTA entries.  C is forced non-negative, and C = 0 is
*        handled by stepping straight to the upper bound.
*
         niter = niter + 1
         c = w - delta( n-1 )*dpsi - delta( n )*dphi
         a = ( delta( n-1 )+delta( n ) )*w -
     $       delta( n-1 )*delta( n )*( dpsi+dphi )
         b = delta( n-1 )*delta( n )*w
         IF( c.LT.zero )
     $      c = abs( c )
         IF( c.EQ.zero ) THEN
*          ETA = B/A
*           ETA = RHO - TAU
            eta = dltub - tau
         ELSE IF( a.GE.zero ) THEN
            eta = ( a+sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
         ELSE
            eta = two*b / ( a-sqrt( abs( a*a-four*b*c ) ) )
         END IF
*
*        Note, eta should be positive if w is negative, and
*        eta should be negative otherwise. However,
*        if for some reason caused by roundoff, eta*w > 0,
*        we simply use one Newton step instead. This way
*        will guarantee eta*w < 0.
*
         IF( w*eta.GT.zero )
     $      eta = -w / ( dpsi+dphi )
*
*        If the step would leave [DLTLB, DLTUB], replace it by half
*        the distance to the bound on the side indicated by the sign
*        of W.
*
         temp = tau + eta
         IF( temp.GT.dltub .OR. temp.LT.dltlb ) THEN
            IF( w.LT.zero ) THEN
               eta = ( dltub-tau ) / two
            ELSE
               eta = ( dltlb-tau ) / two
            END IF
         END IF
         DO 50 j = 1, n
            delta( j ) = delta( j ) - eta
   50    CONTINUE
*
         tau = tau + eta
*
*        Evaluate PSI and the derivative DPSI
*
         dpsi = zero
         psi = zero
         erretm = zero
         DO 60 j = 1, ii
            temp = z( j ) / delta( j )
            psi = psi + z( j )*temp
            dpsi = dpsi + temp*temp
            erretm = erretm + psi
   60    CONTINUE
         erretm = abs( erretm )
*
*        Evaluate PHI and the derivative DPHI
*
         temp = z( n ) / delta( n )
         phi = z( n )*temp
         dphi = temp*temp
         erretm = eight*( -phi-psi ) + erretm - phi + rhoinv +
     $            abs( tau )*( dpsi+dphi )
*
         w = rhoinv + phi + psi
*
*        Main loop to update the values of the array   DELTA
*
         iter = niter + 1
*
         DO 90 niter = iter, maxit
*
*           Test for convergence
*
            IF( abs( w ).LE.eps*erretm ) THEN
               dlam = d( i ) + tau
               GO TO 250
            END IF
*
            IF( w.LE.zero ) THEN
               dltlb = max( dltlb, tau )
            ELSE
               dltub = min( dltub, tau )
            END IF
*
*           Calculate the new step
*
*           NOTE(review): unlike the first step above, C is used here
*           as computed, with no ABS and no C = 0 branch before the
*           division by TWO*C.
*
            c = w - delta( n-1 )*dpsi - delta( n )*dphi
            a = ( delta( n-1 )+delta( n ) )*w -
     $          delta( n-1 )*delta( n )*( dpsi+dphi )
            b = delta( n-1 )*delta( n )*w
            IF( a.GE.zero ) THEN
               eta = ( a+sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
            ELSE
               eta = two*b / ( a-sqrt( abs( a*a-four*b*c ) ) )
            END IF
*
*           Note, eta should be positive if w is negative, and
*           eta should be negative otherwise. However,
*           if for some reason caused by roundoff, eta*w > 0,
*           we simply use one Newton step instead. This way
*           will guarantee eta*w < 0.
*
            IF( w*eta.GT.zero )
     $         eta = -w / ( dpsi+dphi )
            temp = tau + eta
            IF( temp.GT.dltub .OR. temp.LT.dltlb ) THEN
               IF( w.LT.zero ) THEN
                  eta = ( dltub-tau ) / two
               ELSE
                  eta = ( dltlb-tau ) / two
               END IF
            END IF
            DO 70 j = 1, n
               delta( j ) = delta( j ) - eta
   70       CONTINUE
*
            tau = tau + eta
*
*           Evaluate PSI and the derivative DPSI
*
            dpsi = zero
            psi = zero
            erretm = zero
            DO 80 j = 1, ii
               temp = z( j ) / delta( j )
               psi = psi + z( j )*temp
               dpsi = dpsi + temp*temp
               erretm = erretm + psi
   80       CONTINUE
            erretm = abs( erretm )
*
*           Evaluate PHI and the derivative DPHI
*
            temp = z( n ) / delta( n )
            phi = z( n )*temp
            dphi = temp*temp
            erretm = eight*( -phi-psi ) + erretm - phi + rhoinv +
     $               abs( tau )*( dpsi+dphi )
*
            w = rhoinv + phi + psi
   90    CONTINUE
*
*        Return with INFO = 1, NITER = MAXIT and not converged
*
*        DLAM is still set from the last TAU.
*
         info = 1
         dlam = d( i ) + tau
         GO TO 250
*
*        End for the case I = N
*
      ELSE
*
*        The case for I < N
*
         niter = 1
         ip1 = i + 1
*
*        Calculate initial guess
*
*        DEL is the gap D(I+1)-D(I); DELTA is first set up for the
*        midpoint of that gap, measured from D(I).
*
         del = d( ip1 ) - d( i )
         midpt = del / two
         DO 100 j = 1, n
            delta( j ) = ( d( j )-d( i ) ) - midpt
  100    CONTINUE
*
*        PSI sums the poles below I, PHI the poles above I+1 (summed
*        from N downwards); poles I and I+1 are added separately in W.
*
         psi = zero
         DO 110 j = 1, i - 1
            psi = psi + z( j )*z( j ) / delta( j )
  110    CONTINUE
*
         phi = zero
         DO 120 j = n, i + 2, -1
            phi = phi + z( j )*z( j ) / delta( j )
  120    CONTINUE
         c = rhoinv + psi + phi
         w = c + z( i )*z( i ) / delta( i ) +
     $       z( ip1 )*z( ip1 ) / delta( ip1 )
*
         IF( w.GT.zero ) THEN
*
*           d(i)< the ith eigenvalue < (d(i)+d(i+1))/2
*
*           We choose d(i) as origin.
*
            orgati = .true.
            a = c*del + z( i )*z( i ) + z( ip1 )*z( ip1 )
            b = z( i )*z( i )*del
            IF( a.GT.zero ) THEN
               tau = two*b / ( a+sqrt( abs( a*a-four*b*c ) ) )
            ELSE
               tau = ( a-sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
            END IF
            dltlb = zero
            dltub = midpt
         ELSE
*
*           (d(i)+d(i+1))/2 <= the ith eigenvalue < d(i+1)
*
*           We choose d(i+1) as origin.
*
*           TAU is measured from D(I+1) here, so its bounds are
*           [-MIDPT, 0].
*
            orgati = .false.
            a = c*del - z( i )*z( i ) - z( ip1 )*z( ip1 )
            b = z( ip1 )*z( ip1 )*del
            IF( a.LT.zero ) THEN
               tau = two*b / ( a-sqrt( abs( a*a+four*b*c ) ) )
            ELSE
               tau = -( a+sqrt( abs( a*a+four*b*c ) ) ) / ( two*c )
            END IF
            dltlb = -midpt
            dltub = zero
         END IF
*
*        Re-base DELTA on the chosen origin and starting TAU, and
*        record the origin index II with its neighbours IIM1, IIP1.
*
         IF( orgati ) THEN
            DO 130 j = 1, n
               delta( j ) = ( d( j )-d( i ) ) - tau
  130       CONTINUE
         ELSE
            DO 140 j = 1, n
               delta( j ) = ( d( j )-d( ip1 ) ) - tau
  140       CONTINUE
         END IF
         IF( orgati ) THEN
            ii = i
         ELSE
            ii = i + 1
         END IF
         iim1 = ii - 1
         iip1 = ii + 1
*
*        Evaluate PSI and the derivative DPSI
*
         dpsi = zero
         psi = zero
         erretm = zero
         DO 150 j = 1, iim1
            temp = z( j ) / delta( j )
            psi = psi + z( j )*temp
            dpsi = dpsi + temp*temp
            erretm = erretm + psi
  150    CONTINUE
         erretm = abs( erretm )
*
*        Evaluate PHI and the derivative DPHI
*
         dphi = zero
         phi = zero
         DO 160 j = n, iip1, -1
            temp = z( j ) / delta( j )
            phi = phi + z( j )*temp
            dphi = dphi + temp*temp
            erretm = erretm + phi
  160    CONTINUE
*
         w = rhoinv + phi + psi
*
*        W is the value of the secular function with
*        its ii-th element removed.
*
*        SWTCH3 is decided from the sign of that reduced W, and is
*        forced off when II is 1 or N (IIM1 or IIP1 would then fall
*        outside 1..N).
*
         swtch3 = .false.
         IF( orgati ) THEN
            IF( w.LT.zero )
     $         swtch3 = .true.
         ELSE
            IF( w.GT.zero )
     $         swtch3 = .true.
         END IF
         IF( ii.EQ.1 .OR. ii.EQ.n )
     $      swtch3 = .false.
*
*        Now add the II-th term so that W is the full secular
*        function and DW the full sum of squared terms.
*
         temp = z( ii ) / delta( ii )
         dw = dpsi + dphi + temp*temp
         temp = z( ii )*temp
         w = w + temp
         erretm = eight*( phi-psi ) + erretm + two*rhoinv +
     $            three*abs( temp ) + abs( tau )*dw
*
*        Test for convergence
*
         IF( abs( w ).LE.eps*erretm ) THEN
            IF( orgati ) THEN
               dlam = d( i ) + tau
            ELSE
               dlam = d( ip1 ) + tau
            END IF
            GO TO 250
         END IF
*
         IF( w.LE.zero ) THEN
            dltlb = max( dltlb, tau )
         ELSE
            dltub = min( dltub, tau )
         END IF
*
*        Calculate the new step
*
         niter = niter + 1
         IF( .NOT.swtch3 ) THEN
*
*           Step from poles I and I+1 only.
*
            IF( orgati ) THEN
               c = w - delta( ip1 )*dw - ( d( i )-d( ip1 ) )*
     $             ( z( i ) / delta( i ) )**2
            ELSE
               c = w - delta( i )*dw - ( d( ip1 )-d( i ) )*
     $             ( z( ip1 ) / delta( ip1 ) )**2
            END IF
            a = ( delta( i )+delta( ip1 ) )*w -
     $          delta( i )*delta( ip1 )*dw
            b = delta( i )*delta( ip1 )*w
            IF( c.EQ.zero ) THEN
*
*              With C = 0 the step is B/A; if A is also zero it is
*              replaced by the expression below before dividing.
*
               IF( a.EQ.zero ) THEN
                  IF( orgati ) THEN
                     a = z( i )*z( i ) + delta( ip1 )*delta( ip1 )*
     $                   ( dpsi+dphi )
                  ELSE
                     a = z( ip1 )*z( ip1 ) + delta( i )*delta( i )*
     $                   ( dpsi+dphi )
                  END IF
               END IF
               eta = b / a
            ELSE IF( a.LE.zero ) THEN
               eta = ( a-sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
            ELSE
               eta = two*b / ( a+sqrt( abs( a*a-four*b*c ) ) )
            END IF
         ELSE
*
*           Interpolation using THREE most relevant poles
*
*           DLAED6 receives C as its RHO, DELTA(IIM1:IIP1) as its
*           3-element D, ZZ as its Z and the current W as FINIT; it
*           returns the step in ETA.
*
            temp = rhoinv + psi + phi
            IF( orgati ) THEN
               temp1 = z( iim1 ) / delta( iim1 )
               temp1 = temp1*temp1
               c = temp - delta( iip1 )*( dpsi+dphi ) -
     $             ( d( iim1 )-d( iip1 ) )*temp1
               zz( 1 ) = z( iim1 )*z( iim1 )
               zz( 3 ) = delta( iip1 )*delta( iip1 )*
     $                   ( ( dpsi-temp1 )+dphi )
            ELSE
               temp1 = z( iip1 ) / delta( iip1 )
               temp1 = temp1*temp1
               c = temp - delta( iim1 )*( dpsi+dphi ) -
     $             ( d( iip1 )-d( iim1 ) )*temp1
               zz( 1 ) = delta( iim1 )*delta( iim1 )*
     $                   ( dpsi+( dphi-temp1 ) )
               zz( 3 ) = z( iip1 )*z( iip1 )
            END IF
            zz( 2 ) = z( ii )*z( ii )
            CALL dlaed6( niter, orgati, c, delta( iim1 ), zz, w, eta,
     $                   info )
            IF( info.NE.0 )
     $         GO TO 250
         END IF
*
*        Note, eta should be positive if w is negative, and
*        eta should be negative otherwise. However,
*        if for some reason caused by roundoff, eta*w > 0,
*        we simply use one Newton step instead. This way
*        will guarantee eta*w < 0.
*
*        The test below is .GE., so ETA = 0 also triggers the
*        Newton step (the I = N case above tests .GT.).
*
         IF( w*eta.GE.zero )
     $      eta = -w / dw
         temp = tau + eta
         IF( temp.GT.dltub .OR. temp.LT.dltlb ) THEN
            IF( w.LT.zero ) THEN
               eta = ( dltub-tau ) / two
            ELSE
               eta = ( dltlb-tau ) / two
            END IF
         END IF
*
         prew = w
*
         DO 180 j = 1, n
            delta( j ) = delta( j ) - eta
  180    CONTINUE
*
*        Evaluate PSI and the derivative DPSI
*
         dpsi = zero
         psi = zero
         erretm = zero
         DO 190 j = 1, iim1
            temp = z( j ) / delta( j )
            psi = psi + z( j )*temp
            dpsi = dpsi + temp*temp
            erretm = erretm + psi
  190    CONTINUE
         erretm = abs( erretm )
*
*        Evaluate PHI and the derivative DPHI
*
         dphi = zero
         phi = zero
         DO 200 j = n, iip1, -1
            temp = z( j ) / delta( j )
            phi = phi + z( j )*temp
            dphi = dphi + temp*temp
            erretm = erretm + phi
  200    CONTINUE
*
*        TAU has not been advanced yet at this point (that happens
*        after the SWTCH test below), hence ABS( TAU+ETA ) in ERRETM.
*
         temp = z( ii ) / delta( ii )
         dw = dpsi + dphi + temp*temp
         temp = z( ii )*temp
         w = rhoinv + phi + psi + temp
         erretm = eight*( phi-psi ) + erretm + two*rhoinv +
     $            three*abs( temp ) + abs( tau+eta )*dw
*
*        SWTCH is turned on when the new W has the sign tested below
*        and exceeds one tenth of the previous magnitude.
*
         swtch = .false.
         IF( orgati ) THEN
            IF( -w.GT.abs( prew ) / ten )
     $         swtch = .true.
         ELSE
            IF( w.GT.abs( prew ) / ten )
     $         swtch = .true.
         END IF
*
         tau = tau + eta
*
*        Main loop to update the values of the array   DELTA
*
         iter = niter + 1
*
         DO 240 niter = iter, maxit
*
*           Test for convergence
*
            IF( abs( w ).LE.eps*erretm ) THEN
               IF( orgati ) THEN
                  dlam = d( i ) + tau
               ELSE
                  dlam = d( ip1 ) + tau
               END IF
               GO TO 250
            END IF
*
            IF( w.LE.zero ) THEN
               dltlb = max( dltlb, tau )
            ELSE
               dltub = min( dltub, tau )
            END IF
*
*           Calculate the new step
*
            IF( .NOT.swtch3 ) THEN
               IF( .NOT.swtch ) THEN
                  IF( orgati ) THEN
                     c = w - delta( ip1 )*dw -
     $                   ( d( i )-d( ip1 ) )*( z( i ) / delta( i ) )**2
                  ELSE
                     c = w - delta( i )*dw - ( d( ip1 )-d( i ) )*
     $                   ( z( ip1 ) / delta( ip1 ) )**2
                  END IF
               ELSE
*
*                 Alternative C: the II-th squared term is folded
*                 into DPSI (origin at I) or DPHI (origin at I+1).
*
                  temp = z( ii ) / delta( ii )
                  IF( orgati ) THEN
                     dpsi = dpsi + temp*temp
                  ELSE
                     dphi = dphi + temp*temp
                  END IF
                  c = w - delta( i )*dpsi - delta( ip1 )*dphi
               END IF
               a = ( delta( i )+delta( ip1 ) )*w -
     $             delta( i )*delta( ip1 )*dw
               b = delta( i )*delta( ip1 )*w
               IF( c.EQ.zero ) THEN
                  IF( a.EQ.zero ) THEN
                     IF( .NOT.swtch ) THEN
                        IF( orgati ) THEN
                           a = z( i )*z( i ) + delta( ip1 )*
     $                         delta( ip1 )*( dpsi+dphi )
                        ELSE
                           a = z( ip1 )*z( ip1 ) +
     $                         delta( i )*delta( i )*( dpsi+dphi )
                        END IF
                     ELSE
                        a = delta( i )*delta( i )*dpsi +
     $                      delta( ip1 )*delta( ip1 )*dphi
                     END IF
                  END IF
                  eta = b / a
               ELSE IF( a.LE.zero ) THEN
                  eta = ( a-sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
               ELSE
                  eta = two*b / ( a+sqrt( abs( a*a-four*b*c ) ) )
               END IF
            ELSE
*
*              Interpolation using THREE most relevant poles
*
*              Same DLAED6 argument mapping as in the first step;
*              SWTCH selects how C, ZZ(1) and ZZ(3) are formed.
*
               temp = rhoinv + psi + phi
               IF( swtch ) THEN
                  c = temp - delta( iim1 )*dpsi - delta( iip1 )*dphi
                  zz( 1 ) = delta( iim1 )*delta( iim1 )*dpsi
                  zz( 3 ) = delta( iip1 )*delta( iip1 )*dphi
               ELSE
                  IF( orgati ) THEN
                     temp1 = z( iim1 ) / delta( iim1 )
                     temp1 = temp1*temp1
                     c = temp - delta( iip1 )*( dpsi+dphi ) -
     $                   ( d( iim1 )-d( iip1 ) )*temp1
                     zz( 1 ) = z( iim1 )*z( iim1 )
                     zz( 3 ) = delta( iip1 )*delta( iip1 )*
     $                         ( ( dpsi-temp1 )+dphi )
                  ELSE
                     temp1 = z( iip1 ) / delta( iip1 )
                     temp1 = temp1*temp1
                     c = temp - delta( iim1 )*( dpsi+dphi ) -
     $                   ( d( iip1 )-d( iim1 ) )*temp1
                     zz( 1 ) = delta( iim1 )*delta( iim1 )*
     $                         ( dpsi+( dphi-temp1 ) )
                     zz( 3 ) = z( iip1 )*z( iip1 )
                  END IF
               END IF
               CALL dlaed6( niter, orgati, c, delta( iim1 ), zz, w, eta,
     $                      info )
               IF( info.NE.0 )
     $            GO TO 250
            END IF
*
*           Note, eta should be positive if w is negative, and
*           eta should be negative otherwise. However,
*           if for some reason caused by roundoff, eta*w > 0,
*           we simply use one Newton step instead. This way
*           will guarantee eta*w < 0.
*
            IF( w*eta.GE.zero )
     $         eta = -w / dw
            temp = tau + eta
            IF( temp.GT.dltub .OR. temp.LT.dltlb ) THEN
               IF( w.LT.zero ) THEN
                  eta = ( dltub-tau ) / two
               ELSE
                  eta = ( dltlb-tau ) / two
               END IF
            END IF
*
            DO 210 j = 1, n
               delta( j ) = delta( j ) - eta
  210       CONTINUE
*
            tau = tau + eta
            prew = w
*
*           Evaluate PSI and the derivative DPSI
*
            dpsi = zero
            psi = zero
            erretm = zero
            DO 220 j = 1, iim1
               temp = z( j ) / delta( j )
               psi = psi + z( j )*temp
               dpsi = dpsi + temp*temp
               erretm = erretm + psi
  220       CONTINUE
            erretm = abs( erretm )
*
*           Evaluate PHI and the derivative DPHI
*
            dphi = zero
            phi = zero
            DO 230 j = n, iip1, -1
               temp = z( j ) / delta( j )
               phi = phi + z( j )*temp
               dphi = dphi + temp*temp
               erretm = erretm + phi
  230       CONTINUE
*
            temp = z( ii ) / delta( ii )
            dw = dpsi + dphi + temp*temp
            temp = z( ii )*temp
            w = rhoinv + phi + psi + temp
            erretm = eight*( phi-psi ) + erretm + two*rhoinv +
     $               three*abs( temp ) + abs( tau )*dw
*
*           Flip SWTCH when W kept its sign and did not shrink below
*           one tenth of its previous magnitude.
*
            IF( w*prew.GT.zero .AND. abs( w ).GT.abs( prew ) / ten )
     $         swtch = .NOT.swtch
*
  240    CONTINUE
*
*        Return with INFO = 1, NITER = MAXIT and not converged
*
*        DLAM is still set from the last TAU and the chosen origin.
*
         info = 1
         IF( orgati ) THEN
            dlam = d( i ) + tau
         ELSE
            dlam = d( ip1 ) + tau
         END IF
*
      END IF
*
*     Common exit point for convergence, iteration-limit and DLAED6
*     failure paths.
*
  250 CONTINUE
*
      RETURN
*
*     End of DLAED4
*

◆ dlaed5()

subroutine dlaed5	(	integer	i,
		double precision, dimension( 2 )	d,
		double precision, dimension( 2 )	z,
		double precision, dimension( 2 )	delta,
		double precision	rho,
		double precision	dlam )

DLAED5 used by DSTEDC. Solves the 2-by-2 secular equation.

Download DLAED5 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> This subroutine computes the I-th eigenvalue of a symmetric rank-one
!> modification of a 2-by-2 diagonal matrix
!>
!>            diag( D )  +  RHO * Z * transpose(Z) .
!>
!> The diagonal elements in the array D are assumed to satisfy
!>
!>            D(i) < D(j)  for  i < j .
!>
!> We also assume RHO > 0 and that the Euclidean norm of the vector
!> Z is one.
!>

Parameters

[in]	I	!> I is INTEGER !> The index of the eigenvalue to be computed. I = 1 or I = 2. !>
[in]	D	!> D is DOUBLE PRECISION array, dimension (2) !> The original eigenvalues. We assume D(1) < D(2). !>
[in]	Z	!> Z is DOUBLE PRECISION array, dimension (2) !> The components of the updating vector. !>
[out]	DELTA	!> DELTA is DOUBLE PRECISION array, dimension (2) !> The vector DELTA contains the information necessary !> to construct the eigenvectors. !>
[in]	RHO	!> RHO is DOUBLE PRECISION !> The scalar in the symmetric updating formula. !>
[out]	DLAM	!> DLAM is DOUBLE PRECISION !> The computed lambda_I, the I-th updated eigenvalue. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Ren-Cang Li, Computer Science Division, University of California at Berkeley, USA

Definition at line 107 of file dlaed5.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Closed-form solution of the 2-by-2 secular equation.  DLAM is
*     returned as D(1)+SHIFT or D(2)+SHIFT depending on which pole is
*     taken as origin, and DELTA is returned scaled to unit 2-norm.
*
*     .. Scalar Arguments ..
      INTEGER            I
      DOUBLE PRECISION   DLAM, RHO
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   D( 2 ), DELTA( 2 ), Z( 2 )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE, TWO, FOUR
      parameter( zero = 0.0d0, one = 1.0d0, two = 2.0d0,
     $                   four = 4.0d0 )
*     ..
*     .. Local Scalars ..
*     ATLOW   .TRUE. when D(1) is used as the origin.
*     GAP     D(2) - D(1).
*     SHIFT   offset of the eigenvalue from the origin pole.
*     BQ, CQ  coefficients of the quadratic solved for SHIFT.
*     DISC    square root of its discriminant (origin at D(2) only).
*     WMID    quantity whose sign selects the origin when I = 1.
*     VNORM   2-norm of DELTA before scaling.
      LOGICAL            ATLOW
      DOUBLE PRECISION   BQ, CQ, DISC, GAP, SHIFT, VNORM, WMID
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, sqrt
*     ..
*     .. Executable Statements ..
*
      gap = d( 2 ) - d( 1 )
*
*     Only the first eigenvalue can have D(1) as origin, and only
*     when WMID is strictly positive.
*
      atlow = .false.
      IF( i.EQ.1 ) THEN
         wmid = one + two*rho*( z( 2 )*z( 2 )-z( 1 )*z( 1 ) ) / gap
         atlow = wmid.GT.zero
      END IF
*
      IF( atlow ) THEN
*
*        Origin at D(1).  BQ > ZERO, always
*
         bq = gap + rho*( z( 1 )*z( 1 )+z( 2 )*z( 2 ) )
         cq = rho*z( 1 )*z( 1 )*gap
         shift = two*cq / ( bq+sqrt( abs( bq*bq-four*cq ) ) )
         dlam = d( 1 ) + shift
         delta( 1 ) = -z( 1 ) / shift
         delta( 2 ) = z( 2 ) / ( gap-shift )
      ELSE
*
*        Origin at D(2).  The quadratic is the same for I = 1 and
*        I = 2; I = 1 takes its non-positive root and I = 2 the
*        non-negative one.
*
         bq = -gap + rho*( z( 1 )*z( 1 )+z( 2 )*z( 2 ) )
         cq = rho*z( 2 )*z( 2 )*gap
         disc = sqrt( bq*bq+four*cq )
         IF( i.EQ.1 ) THEN
            IF( bq.GT.zero ) THEN
               shift = -two*cq / ( bq+disc )
            ELSE
               shift = ( bq-disc ) / two
            END IF
         ELSE
            IF( bq.GT.zero ) THEN
               shift = ( bq+disc ) / two
            ELSE
               shift = two*cq / ( -bq+disc )
            END IF
         END IF
         dlam = d( 2 ) + shift
         delta( 1 ) = -z( 1 ) / ( gap+shift )
         delta( 2 ) = -z( 2 ) / shift
      END IF
*
*     Scale DELTA to unit Euclidean length (common to every case).
*
      vnorm = sqrt( delta( 1 )*delta( 1 )+delta( 2 )*delta( 2 ) )
      delta( 1 ) = delta( 1 ) / vnorm
      delta( 2 ) = delta( 2 ) / vnorm
      RETURN
*
*     End of DLAED5
*

◆ dlaed6()

subroutine dlaed6	(	integer	kniter,
		logical	orgati,
		double precision	rho,
		double precision, dimension( 3 )	d,
		double precision, dimension( 3 )	z,
		double precision	finit,
		double precision	tau,
		integer	info )

DLAED6 used by DSTEDC. Computes one Newton step in solution of the secular equation.

Download DLAED6 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAED6 computes the positive or negative root (closest to the origin)
!> of
!>                  z(1)        z(2)        z(3)
!> f(x) =   rho + --------- + ---------- + ---------
!>                 d(1)-x      d(2)-x      d(3)-x
!>
!> It is assumed that
!>
!>       if ORGATI = .true. the root is between d(2) and d(3);
!>       otherwise it is between d(1) and d(2)
!>
!> This routine will be called by DLAED4 when necessary. In most cases,
!> the root sought is the smallest in magnitude, though it might not be
!> in some extremely rare situations.
!>

Parameters

[in]	KNITER	!> KNITER is INTEGER !> Refer to DLAED4 for its significance. !>
[in]	ORGATI	!> ORGATI is LOGICAL !> If ORGATI is true, the needed root is between d(2) and !> d(3); otherwise it is between d(1) and d(2). See !> DLAED4 for further details. !>
[in]	RHO	!> RHO is DOUBLE PRECISION !> Refer to the equation f(x) above. !>
[in]	D	!> D is DOUBLE PRECISION array, dimension (3) !> D satisfies d(1) < d(2) < d(3). !>
[in]	Z	!> Z is DOUBLE PRECISION array, dimension (3) !> Each of the elements in z must be positive. !>
[in]	FINIT	!> FINIT is DOUBLE PRECISION !> The value of f at 0. It is more accurate than the one !> evaluated inside this routine (if someone wants to do !> so). !>
[out]	TAU	!> TAU is DOUBLE PRECISION !> The root of the equation f(x). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> > 0: if INFO = 1, failure to converge !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  10/02/03: This version has a few statements commented out for thread
!>  safety (machine parameters are computed on each entry). SJH.
!>
!>  05/10/06: Modified from a new version of Ren-Cang Li, use
!>     Gragg-Thornton-Warner cubic convergent scheme for better stability.
!>

Contributors: Ren-Cang Li, Computer Science Division, University of California at Berkeley, USA

Definition at line 139 of file dlaed6.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     DLAED6 solves the three-pole secular equation
*        f(x) = rho + z(1)/(d(1)-x) + z(2)/(d(2)-x) + z(3)/(d(3)-x) = 0
*     for the root TAU lying between d(2) and d(3) when ORGATI is
*     true and between d(1) and d(2) otherwise.  FINIT is the
*     caller's value of f(0).  INFO is 0 on a normal exit and 1 when
*     the iteration limit MAXIT is reached without meeting the
*     stopping test.
*
*     .. Scalar Arguments ..
      LOGICAL            ORGATI
      INTEGER            INFO, KNITER
      DOUBLE PRECISION   FINIT, RHO, TAU
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   D( 3 ), Z( 3 )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            MAXIT
      parameter( maxit = 40 )
      DOUBLE PRECISION   ZERO, ONE, TWO, THREE, FOUR, EIGHT
      parameter( zero = 0.0d0, one = 1.0d0, two = 2.0d0,
     $                   three = 3.0d0, four = 4.0d0, eight = 8.0d0 )
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           dlamch
*     ..
*     .. Local Arrays ..
      DOUBLE PRECISION   DSCALE( 3 ), ZSCALE( 3 )
*     ..
*     .. Local Scalars ..
      LOGICAL            SCALE
      INTEGER            I, ITER, NITER
      DOUBLE PRECISION   A, B, BASE, C, DDF, DF, EPS, ERRETM, ETA, F,
     $                   FC, SCLFAC, SCLINV, SMALL1, SMALL2, SMINV1,
     $                   SMINV2, TEMP, TEMP1, TEMP2, TEMP3, TEMP4,
     $                   LBD, UBD
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, int, log, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
      info = 0
*
*     Initial bracket [LBD, UBD] for the root: start from the two
*     poles that enclose it, then replace one end by zero according
*     to the sign of FINIT = f(0).
*
      IF( orgati ) THEN
         lbd = d(2)
         ubd = d(3)
      ELSE
         lbd = d(1)
         ubd = d(2)
      END IF
      IF( finit .LT. zero )THEN
         lbd = zero
      ELSE
         ubd = zero
      END IF
*
      niter = 1
      tau = zero
      IF( kniter.EQ.2 ) THEN
*
*        Build an initial guess for TAU as a root of the quadratic
*        with coefficients A, B, C.  The pole outside the bracket
*        is folded into the constant C, evaluated at the midpoint of
*        the two bracketing poles.
*
         IF( orgati ) THEN
            temp = ( d( 3 )-d( 2 ) ) / two
            c = rho + z( 1 ) / ( ( d( 1 )-d( 2 ) )-temp )
            a = c*( d( 2 )+d( 3 ) ) + z( 2 ) + z( 3 )
            b = c*d( 2 )*d( 3 ) + z( 2 )*d( 3 ) + z( 3 )*d( 2 )
         ELSE
            temp = ( d( 1 )-d( 2 ) ) / two
            c = rho + z( 3 ) / ( ( d( 3 )-d( 2 ) )-temp )
            a = c*( d( 1 )+d( 2 ) ) + z( 1 ) + z( 2 )
            b = c*d( 1 )*d( 2 ) + z( 1 )*d( 2 ) + z( 2 )*d( 1 )
         END IF
*
*        Normalize the coefficients by the largest magnitude before
*        forming A*A - 4*B*C.
*
         temp = max( abs( a ), abs( b ), abs( c ) )
         a = a / temp
         b = b / temp
         c = c / temp
*
*        Pick the form of the quadratic formula by the sign of A so
*        that A and the square root are never subtracted from each
*        other.
*
         IF( c.EQ.zero ) THEN
            tau = b / a
         ELSE IF( a.LE.zero ) THEN
            tau = ( a-sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
         ELSE
            tau = two*b / ( a+sqrt( abs( a*a-four*b*c ) ) )
         END IF
*
*        A guess outside the bracket is replaced by its midpoint.
*
         IF( tau .LT. lbd .OR. tau .GT. ubd )
     $      tau = ( lbd+ubd )/two
*
*        A guess that coincides with a pole is discarded.  Otherwise
*        f is evaluated at the guess (TEMP), the bracket is tightened
*        with it, and the guess is kept only if it reduces |f|
*        relative to |FINIT|.
*
         IF( d(1).EQ.tau .OR. d(2).EQ.tau .OR. d(3).EQ.tau ) THEN
            tau = zero
         ELSE
            temp = finit + tau*z(1)/( d(1)*( d( 1 )-tau ) ) +
     $                     tau*z(2)/( d(2)*( d( 2 )-tau ) ) +
     $                     tau*z(3)/( d(3)*( d( 3 )-tau ) )
            IF( temp .LE. zero )THEN
               lbd = tau
            ELSE
               ubd = tau
            END IF
            IF( abs( finit ).LE.abs( temp ) )
     $         tau = zero
         END IF
      END IF
*
*     get machine parameters for possible scaling to avoid overflow
*
*     modified by Sven: parameters SMALL1, SMINV1, SMALL2,
*     SMINV2, EPS are not SAVEd anymore between one call to the
*     others but recomputed at each call
*
*     SMALL1 is an integer power of BASE with exponent
*     int( log_BASE( SafMin ) / 3 ); SMALL2 is its square.
*
      eps = dlamch( 'Epsilon' )
      base = dlamch( 'Base' )
      small1 = base**( int( log( dlamch( 'SafMin' ) ) / log( base ) /
     $         three ) )
      sminv1 = one / small1
      small2 = small1*small1
      sminv2 = sminv1*sminv1
*
*     Determine if scaling of inputs necessary to avoid overflow
*     when computing 1/TEMP**3
*
*     TEMP is the distance from TAU to the nearer bracketing pole.
*
      IF( orgati ) THEN
         temp = min( abs( d( 2 )-tau ), abs( d( 3 )-tau ) )
      ELSE
         temp = min( abs( d( 1 )-tau ), abs( d( 2 )-tau ) )
      END IF
      scale = .false.
      IF( temp.LE.small1 ) THEN
         scale = .true.
         IF( temp.LE.small2 ) THEN
*
*        Scale up by power of radix nearest 1/SAFMIN**(2/3)
*
            sclfac = sminv2
            sclinv = small2
         ELSE
*
*        Scale up by power of radix nearest 1/SAFMIN**(1/3)
*
            sclfac = sminv1
            sclinv = small1
         END IF
*
*        Scaling up safe because D, Z, TAU scaled elsewhere to be O(1)
*
*        The bracket ends are scaled together with TAU so that the
*        safeguards below stay consistent.
*
         DO 10 i = 1, 3
            dscale( i ) = d( i )*sclfac
            zscale( i ) = z( i )*sclfac
   10    CONTINUE
         tau = tau*sclfac
         lbd = lbd*sclfac
         ubd = ubd*sclfac
      ELSE
*
*        Copy D and Z to DSCALE and ZSCALE
*
         DO 20 i = 1, 3
            dscale( i ) = d( i )
            zscale( i ) = z( i )
   20    CONTINUE
      END IF
*
*     Evaluate f and its derivative sums at the starting TAU:
*        FC  = sum z(i) / ( d(i)*( d(i)-tau ) )
*        DF  = sum z(i) / ( d(i)-tau )**2
*        DDF = sum z(i) / ( d(i)-tau )**3
*     using the (possibly scaled) copies, so that f = FINIT + TAU*FC.
*     Unlike loop 40 below, this pass does not test for
*     DSCALE( I ) = TAU.
*
      fc = zero
      df = zero
      ddf = zero
      DO 30 i = 1, 3
         temp = one / ( dscale( i )-tau )
         temp1 = zscale( i )*temp
         temp2 = temp1*temp
         temp3 = temp2*temp
         fc = fc + temp1 / dscale( i )
         df = df + temp2
         ddf = ddf + temp3
   30 CONTINUE
      f = finit + tau*fc
*
*     abs( f ).LE.zero holds only when f is exactly zero, in which
*     case the starting TAU is returned as the root.
*
      IF( abs( f ).LE.zero )
     $   GO TO 60
      IF( f .LE. zero )THEN
         lbd = tau
      ELSE
         ubd = tau
      END IF
*
*        Iteration begins -- Use Gragg-Thornton-Warner cubic convergent
*                            scheme
*
*     It is not hard to see that
*
*           1) Iterations will go up monotonically
*              if FINIT < 0;
*
*           2) Iterations will go down monotonically
*              if FINIT > 0.
*
*     NITER is still 1 here, so the loop counter runs from 2 to MAXIT.
*
      iter = niter + 1
*
      DO 50 niter = iter, maxit
*
*        TEMP1 and TEMP2 are the distances from TAU to the two poles
*        that bracket the root.
*
         IF( orgati ) THEN
            temp1 = dscale( 2 ) - tau
            temp2 = dscale( 3 ) - tau
         ELSE
            temp1 = dscale( 1 ) - tau
            temp2 = dscale( 2 ) - tau
         END IF
*
*        Quadratic for the correction ETA, normalized and solved
*        with the same sign-based formula choice as the initial
*        guess.
*
         a = ( temp1+temp2 )*f - temp1*temp2*df
         b = temp1*temp2*f
         c = f - ( temp1+temp2 )*df + temp1*temp2*ddf
         temp = max( abs( a ), abs( b ), abs( c ) )
         a = a / temp
         b = b / temp
         c = c / temp
         IF( c.EQ.zero ) THEN
            eta = b / a
         ELSE IF( a.LE.zero ) THEN
            eta = ( a-sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
         ELSE
            eta = two*b / ( a+sqrt( abs( a*a-four*b*c ) ) )
         END IF
*
*        If the correction does not have the sign opposite to f,
*        fall back to the Newton step -f/df.
*
         IF( f*eta.GE.zero ) THEN
            eta = -f / df
         END IF
*
*        Apply the correction; a TAU that leaves the bracket is
*        replaced by the bracket midpoint.
*
         tau = tau + eta
         IF( tau .LT. lbd .OR. tau .GT. ubd )
     $      tau = ( lbd + ubd )/two
*
*        Re-evaluate FC, DF and DDF at the new TAU.  ERRETM also
*        accumulates the magnitudes of the FC terms.  If TAU lands
*        exactly on a pole the routine exits through label 60 with
*        INFO still 0.
*
         fc = zero
         erretm = zero
         df = zero
         ddf = zero
         DO 40 i = 1, 3
            IF ( ( dscale( i )-tau ).NE.zero ) THEN
               temp = one / ( dscale( i )-tau )
               temp1 = zscale( i )*temp
               temp2 = temp1*temp
               temp3 = temp2*temp
               temp4 = temp1 / dscale( i )
               fc = fc + temp4
               erretm = erretm + abs( temp4 )
               df = df + temp2
               ddf = ddf + temp3
            ELSE
               GO TO 60
            END IF
   40    CONTINUE
         f = finit + tau*fc
*
*        Stop when |f| is within 4*EPS*ERRETM or when the bracket
*        width is within 4*EPS*|TAU|; otherwise tighten the bracket
*        with the sign of f and iterate again.
*
         erretm = eight*( abs( finit )+abs( tau )*erretm ) +
     $            abs( tau )*df
         IF( ( abs( f ).LE.four*eps*erretm ) .OR.
     $      ( (ubd-lbd).LE.four*eps*abs(tau) )  )
     $      GO TO 60
         IF( f .LE. zero )THEN
            lbd = tau
         ELSE
            ubd = tau
         END IF
   50 CONTINUE
*
*     Reached only when the loop ran to MAXIT without a GO TO 60.
*
      info = 1
   60 CONTINUE
*
*     Undo scaling
*
      IF( scale )
     $   tau = tau*sclinv
      RETURN
*
*     End of DLAED6
*

◆ dlaed7()

subroutine dlaed7	(	integer	icompq,
		integer	n,
		integer	qsiz,
		integer	tlvls,
		integer	curlvl,
		integer	curpbm,
		double precision, dimension( * )	d,
		double precision, dimension( ldq, * )	q,
		integer	ldq,
		integer, dimension( * )	indxq,
		double precision	rho,
		integer	cutpnt,
		double precision, dimension( * )	qstore,
		integer, dimension( * )	qptr,
		integer, dimension( * )	prmptr,
		integer, dimension( * )	perm,
		integer, dimension( * )	givptr,
		integer, dimension( 2, * )	givcol,
		double precision, dimension( 2, * )	givnum,
		double precision, dimension( * )	work,
		integer, dimension( * )	iwork,
		integer	info )

DLAED7 used by DSTEDC. Computes the updated eigensystem of a diagonal matrix after modification by a rank-one symmetric matrix. Used when the original matrix is dense.

Download DLAED7 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAED7 computes the updated eigensystem of a diagonal
!> matrix after modification by a rank-one symmetric matrix. This
!> routine is used only for the eigenproblem which requires all
!> eigenvalues and optionally eigenvectors of a dense symmetric matrix
!> that has been reduced to tridiagonal form.  DLAED1 handles
!> the case in which all eigenvalues and eigenvectors of a symmetric
!> tridiagonal matrix are desired.
!>
!>   T = Q(in) ( D(in) + RHO * Z*Z**T ) Q**T(in) = Q(out) * D(out) * Q**T(out)
!>
!>    where Z = Q**Tu, u is a vector of length N with ones in the
!>    CUTPNT and CUTPNT + 1 th elements and zeros elsewhere.
!>
!>    The eigenvectors of the original matrix are stored in Q, and the
!>    eigenvalues are in D.  The algorithm consists of three stages:
!>
!>       The first stage consists of deflating the size of the problem
!>       when there are multiple eigenvalues or if there is a zero in
!>       the Z vector.  For each such occurrence the dimension of the
!>       secular equation problem is reduced by one.  This stage is
!>       performed by the routine DLAED8.
!>
!>       The second stage consists of calculating the updated
!>       eigenvalues. This is done by finding the roots of the secular
!>       equation via the routine DLAED4 (as called by DLAED9).
!>       This routine also calculates the eigenvectors of the current
!>       problem.
!>
!>       The final stage consists of computing the updated eigenvectors
!>       directly using the updated eigenvalues.  The eigenvectors for
!>       the current problem are multiplied with the eigenvectors from
!>       the overall problem.
!>

Parameters

[in]	ICOMPQ	!> ICOMPQ is INTEGER !> = 0: Compute eigenvalues only. !> = 1: Compute eigenvectors of original dense symmetric matrix !> also. On entry, Q contains the orthogonal matrix used !> to reduce the original matrix to tridiagonal form. !>
[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in]	QSIZ	!> QSIZ is INTEGER !> The dimension of the orthogonal matrix used to reduce !> the full matrix to tridiagonal form. QSIZ >= N if ICOMPQ = 1. !>
[in]	TLVLS	!> TLVLS is INTEGER !> The total number of merging levels in the overall divide and !> conquer tree. !>
[in]	CURLVL	!> CURLVL is INTEGER !> The current level in the overall merge routine, !> 0 <= CURLVL <= TLVLS. !>
[in]	CURPBM	!> CURPBM is INTEGER !> The current problem in the current level in the overall !> merge routine (counting from upper left to lower right). !>
[in,out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> On entry, the eigenvalues of the rank-1-perturbed matrix. !> On exit, the eigenvalues of the repaired matrix. !>
[in,out]	Q	!> Q is DOUBLE PRECISION array, dimension (LDQ, N) !> On entry, the eigenvectors of the rank-1-perturbed matrix. !> On exit, the eigenvectors of the repaired tridiagonal matrix. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N). !>
[out]	INDXQ	!> INDXQ is INTEGER array, dimension (N) !> The permutation which will reintegrate the subproblem just !> solved back into sorted order, i.e., D( INDXQ( I = 1, N ) ) !> will be in ascending order. !>
[in]	RHO	!> RHO is DOUBLE PRECISION !> The subdiagonal element used to create the rank-1 !> modification. !>
[in]	CUTPNT	!> CUTPNT is INTEGER !> Contains the location of the last eigenvalue in the leading !> sub-matrix. min(1,N) <= CUTPNT <= N. !>
[in,out]	QSTORE	!> QSTORE is DOUBLE PRECISION array, dimension (N**2+1) !> Stores eigenvectors of submatrices encountered during !> divide and conquer, packed together. QPTR points to !> beginning of the submatrices. !>
[in,out]	QPTR	!> QPTR is INTEGER array, dimension (N+2) !> List of indices pointing to beginning of submatrices stored !> in QSTORE. The submatrices are numbered starting at the !> bottom left of the divide and conquer tree, from left to !> right and bottom to top. !>
[in,out]	PRMPTR	!> PRMPTR is INTEGER array, dimension (N lg N) !> Contains a list of pointers which indicate where in PERM a !> level's permutation is stored. PRMPTR(i+1) - PRMPTR(i) !> indicates the size of the permutation and also the size of !> the full, non-deflated problem. !>
[in]	PERM	!> PERM is INTEGER array, dimension (N lg N) !> Contains the permutations (from deflation and sorting) to be !> applied to each eigenblock. !>
[in,out]	GIVPTR	!> GIVPTR is INTEGER array, dimension (N lg N) !> Contains a list of pointers which indicate where in GIVCOL a !> level's Givens rotations are stored. GIVPTR(i+1) - GIVPTR(i) !> indicates the number of Givens rotations. !>
[in]	GIVCOL	!> GIVCOL is INTEGER array, dimension (2, N lg N) !> Each pair of numbers indicates a pair of columns to take place !> in a Givens rotation. !>
[in]	GIVNUM	!> GIVNUM is DOUBLE PRECISION array, dimension (2, N lg N) !> Each number indicates the S value to be used in the !> corresponding Givens rotation. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (3N+2QSIZ*N) !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (4*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: if INFO = 1, an eigenvalue did not converge !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA

Definition at line 256 of file dlaed7.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     DLAED7 performs one merge of the dense-matrix divide and conquer
*     eigensolver: it forms the z-vector (DLAEDA), deflates (DLAED8),
*     solves the secular equation (DLAED9), optionally multiplies the
*     eigenvector blocks (DGEMM) and builds the sorting permutation
*     INDXQ (DLAMRG).  INFO is negative for an illegal argument and
*     otherwise carries the status returned by the last routine
*     called.
*
*     .. Scalar Arguments ..
      INTEGER            CURLVL, CURPBM, CUTPNT, ICOMPQ, INFO, LDQ, N,
     $                   QSIZ, TLVLS
      DOUBLE PRECISION   RHO
*     ..
*     .. Array Arguments ..
      INTEGER            GIVCOL( 2, * ), GIVPTR( * ), INDXQ( * ),
     $                   IWORK( * ), PERM( * ), PRMPTR( * ), QPTR( * )
      DOUBLE PRECISION   D( * ), GIVNUM( 2, * ), Q( LDQ, * ),
     $                   QSTORE( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, ZERO
      parameter( one = 1.0d0, zero = 0.0d0 )
*     ..
*     .. Local Scalars ..
      INTEGER            CURR, IDLMDA, INDX, INDXP, IQ2, IS, IW, IZ,
     $                   J, K, LDQ2, LVL
*     ..
*     .. External Subroutines ..
      EXTERNAL           dgemm, dlaed8, dlaed9, dlaeda, dlamrg, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Argument validation.  The first failing test decides INFO,
*     which is minus the position of the offending argument.
*
      info = 0
      IF( icompq.NE.0 .AND. icompq.NE.1 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( icompq.EQ.1 .AND. qsiz.LT.n ) THEN
         info = -3
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -9
      ELSE IF( cutpnt.LT.min( 1, n ) .OR. cutpnt.GT.n ) THEN
         info = -12
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DLAED7', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty problem.
*
      IF( n.EQ.0 ) RETURN
*
*     Leading dimension of the Q2 scratch matrix kept in WORK:
*     QSIZ when eigenvectors are wanted, N otherwise.
*
      ldq2 = n
      IF( icompq.EQ.1 ) ldq2 = qsiz
*
*     Offsets of the sub-arrays of WORK handed to DLAED8 and DLAED9,
*     laid out as  z | dlamda | w | q2 | s.
*
      iz = 1
      idlmda = iz + n
      iw = idlmda + n
      iq2 = iw + n
      is = iq2 + n*ldq2
*
*     Offsets into IWORK: INDX comes first and INDXP starts three
*     blocks of length N later.
*
      indx = 1
      indxp = indx + 3*n
*
*     CURR is the slot of the current subproblem in the pointer
*     arrays QPTR, PRMPTR and GIVPTR.
*
      curr = 1 + 2**tlvls
      DO lvl = 1, curlvl - 1
         curr = curr + 2**( tlvls-lvl )
      END DO
      curr = curr + curpbm
*
*     Form the z-vector (last row of Q_1 and first row of Q_2) in
*     WORK( IZ ); the N entries starting at WORK( IDLMDA ) serve as
*     scratch for DLAEDA.
*
      CALL dlaeda( n, tlvls, curlvl, curpbm, prmptr, perm, givptr,
     $             givcol, givnum, qstore, qptr, work( iz ),
     $             work( idlmda ), info )
*
*     On the final merge the stored data is no longer needed, so this
*     level's output is written over the start of the storage.
*
      IF( curlvl.EQ.tlvls ) THEN
         qptr( curr ) = 1
         prmptr( curr ) = 1
         givptr( curr ) = 1
      END IF
*
*     Sort and deflate.  DLAED8 returns its rotation count in
*     GIVPTR( CURR+1 ); adding GIVPTR( CURR ) afterwards turns that
*     count into the next pointer.
*
      CALL dlaed8( icompq, k, n, qsiz, d, q, ldq, indxq, rho, cutpnt,
     $             work( iz ), work( idlmda ), work( iq2 ), ldq2,
     $             work( iw ), perm( prmptr( curr ) ), givptr( curr+1 ),
     $             givcol( 1, givptr( curr ) ),
     $             givnum( 1, givptr( curr ) ), iwork( indxp ),
     $             iwork( indx ), info )
      prmptr( curr+1 ) = prmptr( curr ) + n
      givptr( curr+1 ) = givptr( curr+1 ) + givptr( curr )
*
*     Everything deflated: no secular equation is left, the stored
*     eigenvector block is empty and INDXQ is the identity.
*
      IF( k.EQ.0 ) THEN
         qptr( curr+1 ) = qptr( curr )
         DO j = 1, n
            indxq( j ) = j
         END DO
         RETURN
      END IF
*
*     Solve the secular equation of order K.  On failure return at
*     once with the INFO set by DLAED9.
*
      CALL dlaed9( k, 1, k, n, d, work( is ), k, rho, work( idlmda ),
     $             work( iw ), qstore( qptr( curr ) ), k, info )
      IF( info.NE.0 ) RETURN
*
*     Multiply the saved columns in Q2 by the K-by-K block that
*     DLAED9 stored in QSTORE and place the product in Q.
*
      IF( icompq.EQ.1 ) THEN
         CALL dgemm( 'N', 'N', qsiz, k, k, one, work( iq2 ), ldq2,
     $               qstore( qptr( curr ) ), k, zero, q, ldq )
      END IF
      qptr( curr+1 ) = qptr( curr ) + k**2
*
*     Prepare the INDXQ sorting permutation by merging the first K
*     entries of D with the remaining N-K entries, the latter taken
*     with stride -1.
*
      CALL dlamrg( k, n-k, d, 1, -1, indxq )
      RETURN
*
*     End of DLAED7
*

◆ dlaed8()

subroutine dlaed8	(	integer	icompq,
		integer	k,
		integer	n,
		integer	qsiz,
		double precision, dimension( * )	d,
		double precision, dimension( ldq, * )	q,
		integer	ldq,
		integer, dimension( * )	indxq,
		double precision	rho,
		integer	cutpnt,
		double precision, dimension( * )	z,
		double precision, dimension( * )	dlamda,
		double precision, dimension( ldq2, * )	q2,
		integer	ldq2,
		double precision, dimension( * )	w,
		integer, dimension( * )	perm,
		integer	givptr,
		integer, dimension( 2, * )	givcol,
		double precision, dimension( 2, * )	givnum,
		integer, dimension( * )	indxp,
		integer, dimension( * )	indx,
		integer	info )

DLAED8 used by DSTEDC. Merges eigenvalues and deflates secular equation. Used when the original matrix is dense.

Download DLAED8 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAED8 merges the two sets of eigenvalues together into a single
!> sorted set.  Then it tries to deflate the size of the problem.
!> There are two ways in which deflation can occur:  when two or more
!> eigenvalues are close together or if there is a tiny element in the
!> Z vector.  For each such occurrence the order of the related secular
!> equation problem is reduced by one.
!>

Parameters

[in]	ICOMPQ	!> ICOMPQ is INTEGER !> = 0: Compute eigenvalues only. !> = 1: Compute eigenvectors of original dense symmetric matrix !> also. On entry, Q contains the orthogonal matrix used !> to reduce the original matrix to tridiagonal form. !>
[out]	K	!> K is INTEGER !> The number of non-deflated eigenvalues, and the order of the !> related secular equation. !>
[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in]	QSIZ	!> QSIZ is INTEGER !> The dimension of the orthogonal matrix used to reduce !> the full matrix to tridiagonal form. QSIZ >= N if ICOMPQ = 1. !>
[in,out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> On entry, the eigenvalues of the two submatrices to be !> combined. On exit, the trailing (N-K) updated eigenvalues !> (those which were deflated) sorted into increasing order. !>
[in,out]	Q	!> Q is DOUBLE PRECISION array, dimension (LDQ,N) !> If ICOMPQ = 0, Q is not referenced. Otherwise, !> on entry, Q contains the eigenvectors of the partially solved !> system which has been previously updated in matrix !> multiplies with other partially solved eigensystems. !> On exit, Q contains the trailing (N-K) updated eigenvectors !> (those which were deflated) in its last N-K columns. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N). !>
[in]	INDXQ	!> INDXQ is INTEGER array, dimension (N) !> The permutation which separately sorts the two sub-problems !> in D into ascending order. Note that elements in the second !> half of this permutation must first have CUTPNT added to !> their values in order to be accurate. !>
[in,out]	RHO	!> RHO is DOUBLE PRECISION !> On entry, the off-diagonal element associated with the rank-1 !> cut which originally split the two submatrices which are now !> being recombined. !> On exit, RHO has been modified to the value required by !> DLAED9. !>
[in]	CUTPNT	!> CUTPNT is INTEGER !> The location of the last eigenvalue in the leading !> sub-matrix. min(1,N) <= CUTPNT <= N. !>
[in]	Z	!> Z is DOUBLE PRECISION array, dimension (N) !> On entry, Z contains the updating vector (the last row of !> the first sub-eigenvector matrix and the first row of the !> second sub-eigenvector matrix). !> On exit, the contents of Z are destroyed by the updating !> process. !>
[out]	DLAMDA	!> DLAMDA is DOUBLE PRECISION array, dimension (N) !> A copy of the first K eigenvalues which will be used by !> DLAED9 to form the secular equation. !>
[out]	Q2	!> Q2 is DOUBLE PRECISION array, dimension (LDQ2,N) !> If ICOMPQ = 0, Q2 is not referenced. Otherwise, !> a copy of the first K eigenvectors which will be used by !> DLAED7 in a matrix multiply (DGEMM) to update the new !> eigenvectors. !>
[in]	LDQ2	!> LDQ2 is INTEGER !> The leading dimension of the array Q2. LDQ2 >= max(1,N). !>
[out]	W	!> W is DOUBLE PRECISION array, dimension (N) !> The first k values of the final deflation-altered z-vector and !> will be passed to DLAED9. !>
[out]	PERM	!> PERM is INTEGER array, dimension (N) !> The permutations (from deflation and sorting) to be applied !> to each eigenblock. !>
[out]	GIVPTR	!> GIVPTR is INTEGER !> The number of Givens rotations which took place in this !> subproblem. !>
[out]	GIVCOL	!> GIVCOL is INTEGER array, dimension (2, N) !> Each pair of numbers indicates a pair of columns to take place !> in a Givens rotation. !>
[out]	GIVNUM	!> GIVNUM is DOUBLE PRECISION array, dimension (2, N) !> Each number indicates the S value to be used in the !> corresponding Givens rotation. !>
[out]	INDXP	!> INDXP is INTEGER array, dimension (N) !> The permutation used to place deflated values of D at the end !> of the array. INDXP(1:K) points to the nondeflated D-values !> and INDXP(K+1:N) points to the deflated eigenvalues. !>
[out]	INDX	!> INDX is INTEGER array, dimension (N) !> The permutation used to sort the contents of D into ascending !> order. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA

Definition at line 240 of file dlaed8.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     DLAED8 merges the two sorted eigenvalue sets in D into one
*     sorted set and deflates the problem wherever a component of Z
*     is negligible or two eigenvalues are close enough.  K returns
*     the number of non-deflated eigenvalues; their D and Z values
*     are returned in DLAMDA( 1:K ) and W( 1:K ).  Each rotation used
*     for deflation is recorded in GIVCOL / GIVNUM and counted in
*     GIVPTR.
*
*     .. Scalar Arguments ..
      INTEGER            CUTPNT, GIVPTR, ICOMPQ, INFO, K, LDQ, LDQ2, N,
     $                   QSIZ
      DOUBLE PRECISION   RHO
*     ..
*     .. Array Arguments ..
      INTEGER            GIVCOL( 2, * ), INDX( * ), INDXP( * ),
     $                   INDXQ( * ), PERM( * )
      DOUBLE PRECISION   D( * ), DLAMDA( * ), GIVNUM( 2, * ),
     $                   Q( LDQ, * ), Q2( LDQ2, * ), W( * ), Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   MONE, ZERO, ONE, TWO, EIGHT
      parameter( mone = -1.0d0, zero = 0.0d0, one = 1.0d0,
     $                   two = 2.0d0, eight = 8.0d0 )
*     ..
*     .. Local Scalars ..
*
      INTEGER            I, IMAX, J, JLAM, JMAX, JP, K2, N1, N1P1, N2
      DOUBLE PRECISION   C, EPS, S, T, TAU, TOL
*     ..
*     .. External Functions ..
      INTEGER            IDAMAX
      DOUBLE PRECISION   DLAMCH, DLAPY2
      EXTERNAL           idamax, dlamch, dlapy2
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dlacpy, dlamrg, drot, dscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
      IF( icompq.LT.0 .OR. icompq.GT.1 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( icompq.EQ.1 .AND. qsiz.LT.n ) THEN
         info = -4
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -7
      ELSE IF( cutpnt.LT.min( 1, n ) .OR. cutpnt.GT.n ) THEN
         info = -10
      ELSE IF( ldq2.LT.max( 1, n ) ) THEN
         info = -14
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DLAED8', -info )
         RETURN
      END IF
*
*     GIVPTR must be initialized to 0 here in case of a quick exit,
*     to prevent unspecified behavior (usually a segfault) when the
*     IWORK array on entry to *stedc is not zeroed (or at least the
*     IWORK entries which are used in *laed7 for GIVPTR).
*
      givptr = 0
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     N1 and N2 are the sizes of the leading and trailing
*     subproblems; N1P1 is the first index of the trailing one.
*
      n1 = cutpnt
      n2 = n - n1
      n1p1 = n1 + 1
*
*     For negative RHO the trailing part of z is negated; RHO itself
*     is replaced by abs( 2*RHO ) below.
*
      IF( rho.LT.zero ) THEN
         CALL dscal( n2, mone, z( n1p1 ), 1 )
      END IF
*
*     Normalize z so that norm(z) = 1
*
*     z is multiplied by 1/sqrt(2) and RHO becomes abs( 2*RHO ).
*     INDX starts out as the identity permutation.
*
      t = one / sqrt( two )
      DO 10 j = 1, n
         indx( j ) = j
   10 CONTINUE
      CALL dscal( n, t, z, 1 )
      rho = abs( two*rho )
*
*     Sort the eigenvalues into increasing order
*
*     The trailing entries of INDXQ are shifted by CUTPNT so that
*     they index the whole of D; D and z are then gathered through
*     INDXQ into DLAMDA and W.
*
      DO 20 i = cutpnt + 1, n
         indxq( i ) = indxq( i ) + cutpnt
   20 CONTINUE
      DO 30 i = 1, n
         dlamda( i ) = d( indxq( i ) )
         w( i ) = z( indxq( i ) )
   30 CONTINUE
*
*     The two assignments below are never read: I and J are both
*     reassigned as DO-loop indices before their next use.
*
      i = 1
      j = cutpnt + 1
      CALL dlamrg( n1, n2, dlamda, 1, 1, indx )
*
*     Write the merged order back into D and z.
*
      DO 40 i = 1, n
         d( i ) = dlamda( indx( i ) )
         z( i ) = w( indx( i ) )
   40 CONTINUE
*
*     Calculate the allowable deflation tolerance
*
*     TOL is 8*EPS times the largest magnitude in D.
*
      imax = idamax( n, z, 1 )
      jmax = idamax( n, d, 1 )
      eps = dlamch( 'Epsilon' )
      tol = eight*eps*abs( d( jmax ) )
*
*     If the rank-1 modifier is small enough, no more needs to be done
*     except to reorganize Q so that its columns correspond with the
*     elements in D.
*
*     In that case K = 0 is returned and PERM maps each sorted
*     position back to its original column of Q.
*
      IF( rho*abs( z( imax ) ).LE.tol ) THEN
         k = 0
         IF( icompq.EQ.0 ) THEN
            DO 50 j = 1, n
               perm( j ) = indxq( indx( j ) )
   50       CONTINUE
         ELSE
            DO 60 j = 1, n
               perm( j ) = indxq( indx( j ) )
               CALL dcopy( qsiz, q( 1, perm( j ) ), 1, q2( 1, j ), 1 )
   60       CONTINUE
            CALL dlacpy( 'A', qsiz, n, q2( 1, 1 ), ldq2, q( 1, 1 ),
     $                   ldq )
         END IF
         RETURN
      END IF
*
*     If there are multiple eigenvalues then the problem deflates.  Here
*     the number of equal eigenvalues are found.  As each equal
*     eigenvalue is found, a Givens rotation is computed to rotate
*     the corresponding eigensubspace so that the corresponding
*     components of Z are zero in this new basis.
*
*     K counts the non-deflated entries, stored from the front of
*     INDXP.  K2 is the front of the deflated entries, stored from
*     the back of INDXP.
*
      k = 0
      k2 = n + 1
*
*     Skip over leading entries with a negligible z component.  The
*     first entry that is not negligible becomes the candidate JLAM.
*
      DO 70 j = 1, n
         IF( rho*abs( z( j ) ).LE.tol ) THEN
*
*           Deflate due to small z component.
*
            k2 = k2 - 1
            indxp( k2 ) = j
*
*           Every entry was deflated: leave with K = 0.
*
            IF( j.EQ.n )
     $         GO TO 110
         ELSE
            jlam = j
            GO TO 80
         END IF
   70 CONTINUE
*
*     Main scan, written as a GO TO loop over the remaining J.  Each
*     new entry J is compared with the current candidate JLAM.
*
   80 CONTINUE
      j = j + 1
      IF( j.GT.n )
     $   GO TO 100
      IF( rho*abs( z( j ) ).LE.tol ) THEN
*
*        Deflate due to small z component.
*
         k2 = k2 - 1
         indxp( k2 ) = j
      ELSE
*
*        Check if eigenvalues are close enough to allow deflation.
*
         s = z( jlam )
         c = z( j )
*
*        Find sqrt(a**2+b**2) without overflow or
*        destructive underflow.
*
         tau = dlapy2( c, s )
         t = d( j ) - d( jlam )
         c = c / tau
         s = -s / tau
         IF( abs( t*c*s ).LE.tol ) THEN
*
*           Deflation is possible.
*
*           The whole z weight moves to entry J and entry JLAM
*           becomes the deflated one.
*
            z( j ) = tau
            z( jlam ) = zero
*
*           Record the appropriate Givens rotation
*
            givptr = givptr + 1
            givcol( 1, givptr ) = indxq( indx( jlam ) )
            givcol( 2, givptr ) = indxq( indx( j ) )
            givnum( 1, givptr ) = c
            givnum( 2, givptr ) = s
            IF( icompq.EQ.1 ) THEN
               CALL drot( qsiz, q( 1, indxq( indx( jlam ) ) ), 1,
     $                    q( 1, indxq( indx( j ) ) ), 1, c, s )
            END IF
*
*           Update the two eigenvalues; T holds the new D( JLAM )
*           until D( J ) has been formed from the old values.
*
            t = d( jlam )*c*c + d( j )*s*s
            d( j ) = d( jlam )*s*s + d( j )*c*c
            d( jlam ) = t
*
*           Insert JLAM into INDXP( K2:N ): entries whose D value
*           is larger than D( JLAM ) are moved one slot toward the
*           front and JLAM is stored behind them.
*
            k2 = k2 - 1
            i = 1
   90       CONTINUE
            IF( k2+i.LE.n ) THEN
               IF( d( jlam ).LT.d( indxp( k2+i ) ) ) THEN
                  indxp( k2+i-1 ) = indxp( k2+i )
                  indxp( k2+i ) = jlam
                  i = i + 1
                  GO TO 90
               ELSE
                  indxp( k2+i-1 ) = jlam
               END IF
            ELSE
               indxp( k2+i-1 ) = jlam
            END IF
            jlam = j
         ELSE
*
*           No deflation: JLAM is kept as the next non-deflated
*           entry and J becomes the new candidate.
*
            k = k + 1
            w( k ) = z( jlam )
            dlamda( k ) = d( jlam )
            indxp( k ) = jlam
            jlam = j
         END IF
      END IF
      GO TO 80
  100 CONTINUE
*
*     Record the last eigenvalue.
*
      k = k + 1
      w( k ) = z( jlam )
      dlamda( k ) = d( jlam )
      indxp( k ) = jlam
*
  110 CONTINUE
*
*     Sort the eigenvalues and corresponding eigenvectors into DLAMDA
*     and Q2 respectively.  The eigenvalues/vectors which were not
*     deflated go into the first K slots of DLAMDA and Q2 respectively,
*     while those which were deflated go into the last N - K slots.
*
*     PERM( J ) is the original column of Q that ends up in slot J.
*
      IF( icompq.EQ.0 ) THEN
         DO 120 j = 1, n
            jp = indxp( j )
            dlamda( j ) = d( jp )
            perm( j ) = indxq( indx( jp ) )
  120    CONTINUE
      ELSE
         DO 130 j = 1, n
            jp = indxp( j )
            dlamda( j ) = d( jp )
            perm( j ) = indxq( indx( jp ) )
            CALL dcopy( qsiz, q( 1, perm( j ) ), 1, q2( 1, j ), 1 )
  130    CONTINUE
      END IF
*
*     The deflated eigenvalues and their corresponding vectors go back
*     into the last N - K slots of D and Q respectively.
*
      IF( k.LT.n ) THEN
         IF( icompq.EQ.0 ) THEN
            CALL dcopy( n-k, dlamda( k+1 ), 1, d( k+1 ), 1 )
         ELSE
            CALL dcopy( n-k, dlamda( k+1 ), 1, d( k+1 ), 1 )
            CALL dlacpy( 'A', qsiz, n-k, q2( 1, k+1 ), ldq2,
     $                   q( 1, k+1 ), ldq )
         END IF
      END IF
*
      RETURN
*
*     End of DLAED8
*

◆ dlaed9()

subroutine dlaed9	(	integer	k,
		integer	kstart,
		integer	kstop,
		integer	n,
		double precision, dimension( * )	d,
		double precision, dimension( ldq, * )	q,
		integer	ldq,
		double precision	rho,
		double precision, dimension( * )	dlamda,
		double precision, dimension( * )	w,
		double precision, dimension( lds, * )	s,
		integer	lds,
		integer	info )

DLAED9 used by DSTEDC. Finds the roots of the secular equation and updates the eigenvectors. Used when the original matrix is dense.

Download DLAED9 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAED9 finds the roots of the secular equation, as defined by the
!> values in D, Z, and RHO, between KSTART and KSTOP.  It makes the
!> appropriate calls to DLAED4 and then stores the new matrix of
!> eigenvectors for use in calculating the next level of Z vectors.
!>

Parameters

[in]	K	!> K is INTEGER !> The number of terms in the rational function to be solved by !> DLAED4. K >= 0. !>
[in]	KSTART	!> KSTART is INTEGER !>
[in]	KSTOP	!> KSTOP is INTEGER !> The updated eigenvalues Lambda(I), KSTART <= I <= KSTOP !> are to be computed. 1 <= KSTART <= KSTOP <= K. !>
[in]	N	!> N is INTEGER !> The number of rows and columns in the Q matrix. !> N >= K (deflation may result in N > K). !>
[out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> D(I) contains the updated eigenvalues !> for KSTART <= I <= KSTOP. !>
[out]	Q	!> Q is DOUBLE PRECISION array, dimension (LDQ,N) !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max( 1, N ). !>
[in]	RHO	!> RHO is DOUBLE PRECISION !> The value of the parameter in the rank one update equation. !> RHO >= 0 required. !>
[in]	DLAMDA	!> DLAMDA is DOUBLE PRECISION array, dimension (K) !> The first K elements of this array contain the old roots !> of the deflated updating problem. These are the poles !> of the secular equation. !>
[in]	W	!> W is DOUBLE PRECISION array, dimension (K) !> The first K elements of this array contain the components !> of the deflation-adjusted updating vector. !>
[out]	S	!> S is DOUBLE PRECISION array, dimension (LDS, K) !> Will contain the eigenvectors of the repaired matrix which !> will be stored for subsequent Z vector calculation and !> multiplied by the previously accumulated eigenvectors !> to update the system. !>
[in]	LDS	!> LDS is INTEGER !> The leading dimension of S. LDS >= max( 1, K ). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: if INFO = 1, an eigenvalue did not converge !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA

Definition at line 154 of file dlaed9.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Outline of the body below:
*    1. Validate K, KSTART, KSTOP, N, LDQ and LDS; on failure INFO is
*       set to minus the argument position, XERBLA is called and the
*       routine returns.
*    2. Condition DLAMDA(1:K) through DLAMC3.
*    3. For J = KSTART..KSTOP call DLAED4; the root is returned in
*       D(J) and column Q(1,J) is passed as DLAED4's DELTA argument.
*       A nonzero INFO from DLAED4 ends the routine immediately.
*    4. For K = 1 or 2 copy the leading K-by-K part of Q into S.
*       Otherwise recompute W from Q and DLAMDA, overwrite Q(I,J) by
*       W(I)/Q(I,J) and store each column, scaled by its 2-norm, in S.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, KSTART, KSTOP, LDQ, LDS, N
      DOUBLE PRECISION   RHO
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   D( * ), DLAMDA( * ), Q( LDQ, * ), S( LDS, * ),
     $                   W( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            I, J
      DOUBLE PRECISION   TEMP
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMC3, DNRM2
      EXTERNAL           dlamc3, dnrm2
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dlaed4, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, sign, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
*     NOTE(review): LDQ is checked against max(1,K) here although the
*     parameter description states LDQ >= max(1,N) - confirm which
*     bound is intended.  Only rows and columns 1..K of Q are
*     referenced below.
*
      info = 0
*
      IF( k.LT.0 ) THEN
         info = -1
      ELSE IF( kstart.LT.1 .OR. kstart.GT.max( 1, k ) ) THEN
         info = -2
      ELSE IF( max( 1, kstop ).LT.kstart .OR. kstop.GT.max( 1, k ) )
     $          THEN
         info = -3
      ELSE IF( n.LT.k ) THEN
         info = -4
      ELSE IF( ldq.LT.max( 1, k ) ) THEN
         info = -7
      ELSE IF( lds.LT.max( 1, k ) ) THEN
         info = -12
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DLAED9', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( k.EQ.0 )
     $   RETURN
*
*     Modify values DLAMDA(i) to make sure all DLAMDA(i)-DLAMDA(j) can
*     be computed with high relative accuracy (barring over/underflow).
*     This is a problem on machines without a guard digit in
*     add/subtract (Cray XMP, Cray YMP, Cray C 90 and Cray 2).
*     The following code replaces DLAMDA(I) by 2*DLAMDA(I)-DLAMDA(I),
*     which on any of these machines zeros out the bottommost
*     bit of DLAMDA(I) if it is 1; this makes the subsequent
*     subtractions DLAMDA(I)-DLAMDA(J) unproblematic when cancellation
*     occurs. On binary machines with a guard digit (almost all
*     machines) it does not change DLAMDA(I) at all. On hexadecimal
*     and decimal machines with a guard digit, it slightly
*     changes the bottommost bits of DLAMDA(I). It does not account
*     for hexadecimal or decimal machines without guard digits
*     (we know of none). We use a subroutine call to compute
*     2*DLAMDA(I) to prevent optimizing compilers from eliminating
*     this code.
*
*     Only DLAMDA(1:K) is touched: DLAMDA is documented with
*     dimension K and every later reference (DLAED4 with order K, the
*     differences DLAMDA(I)-DLAMDA(J) for I,J <= K) stays inside that
*     range, so running the loop to N could step past the array when
*     N > K.
*
      DO 10 i = 1, k
         dlamda( i ) = dlamc3( dlamda( i ), dlamda( i ) ) - dlamda( i )
   10 CONTINUE
*
*     Solve the secular equation for each requested root.  Column J of
*     Q is handed to DLAED4 as its DELTA work/output vector and D(J)
*     receives the computed root.
*
      DO 20 j = kstart, kstop
         CALL dlaed4( k, j, dlamda, w, q( 1, j ), rho, d( j ), info )
*
*        If the zero finder fails, the computation is terminated.
*
         IF( info.NE.0 )
     $      GO TO 120
   20 CONTINUE
*
*     For K = 1 or 2 the leading K-by-K block of Q is copied to S
*     unchanged and the routine returns.
*
      IF( k.EQ.1 .OR. k.EQ.2 ) THEN
         DO 40 i = 1, k
            DO 30 j = 1, k
               s( j, i ) = q( j, i )
   30       CONTINUE
   40    CONTINUE
         GO TO 120
      END IF
*
*     Compute updated W.
*
*     The incoming W is saved in the first column of S; only its signs
*     are used later (loop 80).
*
      CALL dcopy( k, w, 1, s, 1 )
*
*     Initialize W(I) = Q(I,I)
*
      CALL dcopy( k, q, ldq+1, w, 1 )
*
*     Accumulate in W(I) the product over all J .NE. I of
*     Q(I,J) / ( DLAMDA(I)-DLAMDA(J) ); the two inner loops skip the
*     diagonal term I = J.
*
      DO 70 j = 1, k
         DO 50 i = 1, j - 1
            w( i ) = w( i )*( q( i, j ) / ( dlamda( i )-dlamda( j ) ) )
   50    CONTINUE
         DO 60 i = j + 1, k
            w( i ) = w( i )*( q( i, j ) / ( dlamda( i )-dlamda( j ) ) )
   60    CONTINUE
   70 CONTINUE
*
*     W(I) becomes sqrt(-W(I)) carrying the sign of the saved input
*     W(I) held in S(I,1).
*
      DO 80 i = 1, k
         w( i ) = sign( sqrt( -w( i ) ), s( i, 1 ) )
   80 CONTINUE
*
*     Compute eigenvectors of the modified rank-1 modification.
*
*     Column J of Q is overwritten by W(I)/Q(I,J) and the same column
*     divided by its 2-norm is stored in S.
*
      DO 110 j = 1, k
         DO 90 i = 1, k
            q( i, j ) = w( i ) / q( i, j )
   90    CONTINUE
         temp = dnrm2( k, q( 1, j ), 1 )
         DO 100 i = 1, k
            s( i, j ) = q( i, j ) / temp
  100    CONTINUE
  110 CONTINUE
*
  120 CONTINUE
      RETURN
*
*     End of DLAED9
*

◆ dlaeda()

subroutine dlaeda	(	integer	n,
		integer	tlvls,
		integer	curlvl,
		integer	curpbm,
		integer, dimension( * )	prmptr,
		integer, dimension( * )	perm,
		integer, dimension( * )	givptr,
		integer, dimension( 2, * )	givcol,
		double precision, dimension( 2, * )	givnum,
		double precision, dimension( * )	q,
		integer, dimension( * )	qptr,
		double precision, dimension( * )	z,
		double precision, dimension( * )	ztemp,
		integer	info )

DLAEDA used by DSTEDC. Computes the Z vector determining the rank-one modification of the diagonal matrix. Used when the original matrix is dense.

Download DLAEDA + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAEDA computes the Z vector corresponding to the merge step in the
!> CURLVLth step of the merge process with TLVLS steps for the CURPBMth
!> problem.
!>

Parameters

[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in]	TLVLS	!> TLVLS is INTEGER !> The total number of merging levels in the overall divide and !> conquer tree. !>
[in]	CURLVL	!> CURLVL is INTEGER !> The current level in the overall merge routine, !> 0 <= curlvl <= tlvls. !>
[in]	CURPBM	!> CURPBM is INTEGER !> The current problem in the current level in the overall !> merge routine (counting from upper left to lower right). !>
[in]	PRMPTR	!> PRMPTR is INTEGER array, dimension (N lg N) !> Contains a list of pointers which indicate where in PERM a !> level's permutation is stored. PRMPTR(i+1) - PRMPTR(i) !> indicates the size of the permutation and incidentally the !> size of the full, non-deflated problem. !>
[in]	PERM	!> PERM is INTEGER array, dimension (N lg N) !> Contains the permutations (from deflation and sorting) to be !> applied to each eigenblock. !>
[in]	GIVPTR	!> GIVPTR is INTEGER array, dimension (N lg N) !> Contains a list of pointers which indicate where in GIVCOL a !> level's Givens rotations are stored. GIVPTR(i+1) - GIVPTR(i) !> indicates the number of Givens rotations. !>
[in]	GIVCOL	!> GIVCOL is INTEGER array, dimension (2, N lg N) !> Each pair of numbers indicates a pair of columns to take place !> in a Givens rotation. !>
[in]	GIVNUM	!> GIVNUM is DOUBLE PRECISION array, dimension (2, N lg N) !> Each number indicates the S value to be used in the !> corresponding Givens rotation. !>
[in]	Q	!> Q is DOUBLE PRECISION array, dimension (N**2) !> Contains the square eigenblocks from previous levels, the !> starting positions for blocks are given by QPTR. !>
[in]	QPTR	!> QPTR is INTEGER array, dimension (N+2) !> Contains a list of pointers which indicate where in Q an !> eigenblock is stored. SQRT( QPTR(i+1) - QPTR(i) ) indicates !> the size of the block. !>
[out]	Z	!> Z is DOUBLE PRECISION array, dimension (N) !> On output this vector contains the updating vector (the last !> row of the first sub-eigenvector matrix and the first row of !> the second sub-eigenvector matrix). !>
[out]	ZTEMP	!> ZTEMP is DOUBLE PRECISION array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA

Definition at line 164 of file dlaeda.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Outline of the body below:
*    1. Reject N < 0 through XERBLA; return at once for N = 0.
*    2. Build the initial Z: zeros, then one row taken from each of
*       the two eigenblocks located through QPTR(CURR) and
*       QPTR(CURR+1), then zeros again.
*    3. For K = 1..CURLVL-1 apply the stored Givens rotations and
*       permutation of that level to Z and multiply the result by the
*       transposed eigenblocks of that level.
*
*     .. Scalar Arguments ..
      INTEGER            CURLVL, CURPBM, INFO, N, TLVLS
*     ..
*     .. Array Arguments ..
      INTEGER            GIVCOL( 2, * ), GIVPTR( * ), PERM( * ),
     $                   PRMPTR( * ), QPTR( * )
      DOUBLE PRECISION   GIVNUM( 2, * ), Q( * ), Z( * ), ZTEMP( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, HALF, ONE
      parameter( zero = 0.0d0, half = 0.5d0, one = 1.0d0 )
*     ..
*     .. Local Scalars ..
      INTEGER            BSIZ1, BSIZ2, CURR, I, K, MID, PSIZ1, PSIZ2,
     $                   PTR, ZPTR1
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dgemv, drot, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          dble, int, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
*     Only N is validated; the remaining arguments are used as given.
*
      info = 0
*
      IF( n.LT.0 ) THEN
         info = -1
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DLAEDA', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Determine location of first number in second half.
*
      mid = n / 2 + 1
*
*     Gather last/first rows of appropriate eigenblocks into center of Z
*
      ptr = 1
*
*     Determine location of lowest level subproblem in the full storage
*     scheme
*
      curr = ptr + curpbm*2**curlvl + 2**( curlvl-1 ) - 1
*
*     Determine size of these matrices.  We add HALF to the value of
*     the SQRT in case the machine underestimates one of these square
*     roots.
*
      bsiz1 = int( half+sqrt( dble( qptr( curr+1 )-qptr( curr ) ) ) )
      bsiz2 = int( half+sqrt( dble( qptr( curr+2 )-qptr( curr+1 ) ) ) )
*
*     Z(1:MID-BSIZ1-1) is cleared.  The first DCOPY reads BSIZ1
*     elements of Q with stride BSIZ1 starting at offset BSIZ1-1 of
*     the first block (its last row when the block is stored as a
*     BSIZ1-by-BSIZ1 array) into Z(MID-BSIZ1:MID-1).  The second DCOPY
*     reads BSIZ2 elements with stride BSIZ2 from the start of the
*     second block (its first row) into Z(MID:MID+BSIZ2-1).  The rest
*     of Z up to N is cleared.
*
      DO 10 k = 1, mid - bsiz1 - 1
         z( k ) = zero
   10 CONTINUE
      CALL dcopy( bsiz1, q( qptr( curr )+bsiz1-1 ), bsiz1,
     $            z( mid-bsiz1 ), 1 )
      CALL dcopy( bsiz2, q( qptr( curr+1 ) ), bsiz2, z( mid ), 1 )
      DO 20 k = mid + bsiz2, n
         z( k ) = zero
   20 CONTINUE
*
*     Loop through remaining levels 1 -> CURLVL applying the Givens
*     rotations and permutation and then multiplying the center matrices
*     against the current Z.
*
*     PTR is the base index for the current level in the pointer
*     arrays; it starts at 2**TLVLS + 1 and is advanced by
*     2**(TLVLS-K) at the end of each pass.
*
      ptr = 2**tlvls + 1
      DO 70 k = 1, curlvl - 1
         curr = ptr + curpbm*2**( curlvl-k ) + 2**( curlvl-k-1 ) - 1
*
*        PSIZ1/PSIZ2 are the lengths of the two stored permutations;
*        ZPTR1 is where the first sub-vector starts inside Z.
*
         psiz1 = prmptr( curr+1 ) - prmptr( curr )
         psiz2 = prmptr( curr+2 ) - prmptr( curr+1 )
         zptr1 = mid - psiz1
*
*       Apply Givens at CURR and CURR+1
*
*        Each rotation acts on a single pair of Z entries (vector
*        length 1); GIVCOL holds the two positions relative to the
*        start of the sub-vector and GIVNUM the two rotation
*        coefficients passed to DROT.
*
         DO 30 i = givptr( curr ), givptr( curr+1 ) - 1
            CALL drot( 1, z( zptr1+givcol( 1, i )-1 ), 1,
     $                 z( zptr1+givcol( 2, i )-1 ), 1, givnum( 1, i ),
     $                 givnum( 2, i ) )
   30    CONTINUE
         DO 40 i = givptr( curr+1 ), givptr( curr+2 ) - 1
            CALL drot( 1, z( mid-1+givcol( 1, i ) ), 1,
     $                 z( mid-1+givcol( 2, i ) ), 1, givnum( 1, i ),
     $                 givnum( 2, i ) )
   40    CONTINUE
*
*        PSIZ1 and PSIZ2 are assigned again here with the same
*        expressions as above; neither CURR nor PRMPTR has changed in
*        between, so the values are identical.
*
         psiz1 = prmptr( curr+1 ) - prmptr( curr )
         psiz2 = prmptr( curr+2 ) - prmptr( curr+1 )
*
*        Gather the permuted entries of both sub-vectors of Z into
*        ZTEMP(1:PSIZ1) and ZTEMP(PSIZ1+1:PSIZ1+PSIZ2).
*
         DO 50 i = 0, psiz1 - 1
            ztemp( i+1 ) = z( zptr1+perm( prmptr( curr )+i )-1 )
   50    CONTINUE
         DO 60 i = 0, psiz2 - 1
            ztemp( psiz1+i+1 ) = z( mid+perm( prmptr( curr+1 )+i )-1 )
   60    CONTINUE
*
*        Multiply Blocks at CURR and CURR+1
*
*        Determine size of these matrices.  We add HALF to the value of
*        the SQRT in case the machine underestimates one of these
*        square roots.
*
         bsiz1 = int( half+sqrt( dble( qptr( curr+1 )-qptr( curr ) ) ) )
         bsiz2 = int( half+sqrt( dble( qptr( curr+2 )-qptr( curr+
     $           1 ) ) ) )
*
*        The leading BSIZ1 (resp. BSIZ2) entries of each half of ZTEMP
*        are multiplied by the transpose of the corresponding block
*        and written back to Z; the remaining PSIZ1-BSIZ1 (resp.
*        PSIZ2-BSIZ2) entries are copied back without multiplication.
*        DGEMV is skipped when a block has size zero.
*
         IF( bsiz1.GT.0 ) THEN
            CALL dgemv( 'T', bsiz1, bsiz1, one, q( qptr( curr ) ),
     $                  bsiz1, ztemp( 1 ), 1, zero, z( zptr1 ), 1 )
         END IF
         CALL dcopy( psiz1-bsiz1, ztemp( bsiz1+1 ), 1, z( zptr1+bsiz1 ),
     $               1 )
         IF( bsiz2.GT.0 ) THEN
            CALL dgemv( 'T', bsiz2, bsiz2, one, q( qptr( curr+1 ) ),
     $                  bsiz2, ztemp( psiz1+1 ), 1, zero, z( mid ), 1 )
         END IF
         CALL dcopy( psiz2-bsiz2, ztemp( psiz1+bsiz2+1 ), 1,
     $               z( mid+bsiz2 ), 1 )
*
         ptr = ptr + 2**( tlvls-k )
   70 CONTINUE
*
      RETURN
*
*     End of DLAEDA
*

◆ dlagtf()

subroutine dlagtf	(	integer	n,
		double precision, dimension( * )	a,
		double precision	lambda,
		double precision, dimension( * )	b,
		double precision, dimension( * )	c,
		double precision	tol,
		double precision, dimension( * )	d,
		integer, dimension( * )	in,
		integer	info )

DLAGTF computes an LU factorization of a matrix T-λI, where T is a general tridiagonal matrix, and λ a scalar, using partial pivoting with row interchanges.

Download DLAGTF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAGTF factorizes the matrix (T - lambda*I), where T is an n by n
!> tridiagonal matrix and lambda is a scalar, as
!>
!>    T - lambda*I = PLU,
!>
!> where P is a permutation matrix, L is a unit lower tridiagonal matrix
!> with at most one non-zero sub-diagonal element per column and U is
!> an upper triangular matrix with at most two non-zero super-diagonal
!> elements per column.
!>
!> The factorization is obtained by Gaussian elimination with partial
!> pivoting and implicit row scaling.
!>
!> The parameter LAMBDA is included in the routine so that DLAGTF may
!> be used, in conjunction with DLAGTS, to obtain eigenvectors of T by
!> inverse iteration.
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the matrix T. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (N) !> On entry, A must contain the diagonal elements of T. !> !> On exit, A is overwritten by the n diagonal elements of the !> upper triangular matrix U of the factorization of T. !>
[in]	LAMBDA	!> LAMBDA is DOUBLE PRECISION !> On entry, the scalar lambda. !>
[in,out]	B	!> B is DOUBLE PRECISION array, dimension (N-1) !> On entry, B must contain the (n-1) super-diagonal elements of !> T. !> !> On exit, B is overwritten by the (n-1) super-diagonal !> elements of the matrix U of the factorization of T. !>
[in,out]	C	!> C is DOUBLE PRECISION array, dimension (N-1) !> On entry, C must contain the (n-1) sub-diagonal elements of !> T. !> !> On exit, C is overwritten by the (n-1) sub-diagonal elements !> of the matrix L of the factorization of T. !>
[in]	TOL	!> TOL is DOUBLE PRECISION !> On entry, a relative tolerance used to indicate whether or !> not the matrix (T - lambda*I) is nearly singular. TOL should !> normally be chosen as approximately the largest relative error !> in the elements of T. For example, if the elements of T are !> correct to about 4 significant figures, then TOL should be !> set to about 5*10**(-4). If TOL is supplied as less than eps, !> where eps is the relative machine precision, then the value !> eps is used in place of TOL. !>
[out]	D	!> D is DOUBLE PRECISION array, dimension (N-2) !> On exit, D is overwritten by the (n-2) second super-diagonal !> elements of the matrix U of the factorization of T. !>
[out]	IN	!> IN is INTEGER array, dimension (N) !> On exit, IN contains details of the permutation matrix P. If !> an interchange occurred at the kth step of the elimination, !> then IN(k) = 1, otherwise IN(k) = 0. The element IN(n) !> returns the smallest positive integer j such that !> !> abs( u(j,j) ) <= norm( (T - lambda*I)(j) )*TOL, !> !> where norm( A(j) ) denotes the sum of the absolute values of !> the jth row of the matrix A. If no such j exists then IN(n) !> is returned as zero. If IN(n) is returned as positive, then a !> diagonal element of U is small, indicating that !> (T - lambda*I) is singular or nearly singular. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -k, the kth argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 155 of file dlagtf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Outline of the body below:
*    1. Reject N < 0 through XERBLA; return at once for N = 0.
*    2. Subtract LAMBDA from the diagonal A as the elimination
*       proceeds (A(1) up front, A(K+1) inside the loop).
*    3. For K = 1..N-1 eliminate C(K), choosing between row K and
*       row K+1 as pivot row by comparing their scaled pivots, and
*       record the choice in IN(K).
*    4. Record in IN(N) the first step at which the pivot is small
*       relative to TL = max( TOL, eps ).
*
*     .. Scalar Arguments ..
      INTEGER            INFO, N
      DOUBLE PRECISION   LAMBDA, TOL
*     ..
*     .. Array Arguments ..
      INTEGER            IN( * )
      DOUBLE PRECISION   A( * ), B( * ), C( * ), D( * )
*     ..
*
* =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO
      parameter( zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            K
      DOUBLE PRECISION   EPS, MULT, PIV1, PIV2, SCALE1, SCALE2, TEMP, TL
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           dlamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Executable Statements ..
*
*     Only N is validated.
*
      info = 0
      IF( n.LT.0 ) THEN
         info = -1
         CALL xerbla( 'DLAGTF', -info )
         RETURN
      END IF
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Shift the first diagonal entry and clear the singularity marker
*     IN(N).  For N = 1 the marker is IN(1); it is set to 1 when the
*     shifted entry is exactly zero.
*
      a( 1 ) = a( 1 ) - lambda
      in( n ) = 0
      IF( n.EQ.1 ) THEN
         IF( a( 1 ).EQ.zero )
     $      in( 1 ) = 1
         RETURN
      END IF
*
      eps = dlamch( 'Epsilon' )
*
*     TL is the effective tolerance: TOL, but never below eps.
*     SCALE1 is the sum of absolute values of the entries of the
*     current pivot row; SCALE2 plays the same role for row K+1.
*
      tl = max( tol, eps )
      scale1 = abs( a( 1 ) ) + abs( b( 1 ) )
      DO 10 k = 1, n - 1
         a( k+1 ) = a( k+1 ) - lambda
         scale2 = abs( c( k ) ) + abs( a( k+1 ) )
         IF( k.LT.( n-1 ) )
     $      scale2 = scale2 + abs( b( k+1 ) )
*
*        PIV1 is the scaled size of the candidate pivot in row K;
*        the explicit zero test avoids dividing by SCALE1 when A(K)
*        is zero.
*
         IF( a( k ).EQ.zero ) THEN
            piv1 = zero
         ELSE
            piv1 = abs( a( k ) ) / scale1
         END IF
         IF( c( k ).EQ.zero ) THEN
*
*           Nothing to eliminate in this column: no interchange,
*           second super-diagonal entry D(K) is zero.
*
            in( k ) = 0
            piv2 = zero
            scale1 = scale2
            IF( k.LT.( n-1 ) )
     $         d( k ) = zero
         ELSE
*
*           PIV2 is the scaled size of the candidate pivot in
*           row K+1.
*
            piv2 = abs( c( k ) ) / scale2
            IF( piv2.LE.piv1 ) THEN
*
*              No interchange: C(K) becomes the multiplier and
*              A(K+1) is updated with it.
*
               in( k ) = 0
               scale1 = scale2
               c( k ) = c( k ) / a( k )
               a( k+1 ) = a( k+1 ) - c( k )*b( k )
               IF( k.LT.( n-1 ) )
     $            d( k ) = zero
            ELSE
*
*              Interchange rows K and K+1: the old C(K) becomes the
*              pivot A(K), the old A(K+1) and B(K+1) move up into
*              B(K) and D(K), and C(K) stores the multiplier.
*              SCALE1 is left unchanged on this path.
*
               in( k ) = 1
               mult = a( k ) / c( k )
               a( k ) = c( k )
               temp = a( k+1 )
               a( k+1 ) = b( k ) - mult*temp
               IF( k.LT.( n-1 ) ) THEN
                  d( k ) = b( k+1 )
                  b( k+1 ) = -mult*d( k )
               END IF
               b( k ) = temp
               c( k ) = mult
            END IF
         END IF
*
*        Remember the first step whose larger scaled pivot does not
*        exceed TL; later steps never overwrite a nonzero IN(N).
*
         IF( ( max( piv1, piv2 ).LE.tl ) .AND. ( in( n ).EQ.0 ) )
     $      in( n ) = k
   10 CONTINUE
*
*     Final diagonal entry: flagged when small relative to SCALE1*TL
*     and no earlier step was flagged.
*
      IF( ( abs( a( n ) ).LE.scale1*tl ) .AND. ( in( n ).EQ.0 ) )
     $   in( n ) = n
*
      RETURN
*
*     End of DLAGTF
*

◆ dlamrg()

subroutine dlamrg	(	integer	n1,
		integer	n2,
		double precision, dimension( * )	a,
		integer	dtrd1,
		integer	dtrd2,
		integer, dimension( * )	index )

DLAMRG creates a permutation list to merge the entries of two independently sorted sets into a single set sorted in ascending order.

Download DLAMRG + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAMRG will create a permutation list which will merge the elements
!> of A (which is composed of two independently sorted sets) into a
!> single set which is sorted in ascending order.
!>

Parameters

[in]	N1	!> N1 is INTEGER !>
[in]	N2	!> N2 is INTEGER !> These arguments contain the respective lengths of the two !> sorted lists to be merged. !>
[in]	A	!> A is DOUBLE PRECISION array, dimension (N1+N2) !> The first N1 elements of A contain a list of numbers which !> are sorted in either ascending or descending order. Likewise !> for the final N2 elements. !>
[in]	DTRD1	!> DTRD1 is INTEGER !>
[in]	DTRD2	!> DTRD2 is INTEGER !> These are the strides to be taken through the array A. !> Allowable strides are 1 and -1. They indicate whether a !> subset of A is sorted in ascending (DTRDx = 1) or descending !> (DTRDx = -1) order. !>
[out]	INDEX	!> INDEX is INTEGER array, dimension (N1+N2) !> On exit this array will contain a permutation such that !> if B( I ) = A( INDEX( I ) ) for I=1,N1+N2, then B will be !> sorted in ascending order. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 98 of file dlamrg.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Two-way merge of the index ranges 1..N1 and N1+1..N1+N2 of A.
*  Each range is walked in the direction given by its stride
*  (DTRD1, DTRD2); at every step the position holding the smaller
*  value is appended to INDEX, ties going to the first range.  When
*  one range is exhausted the rest of the other is appended as is.
*
*     .. Scalar Arguments ..
      INTEGER            DTRD1, DTRD2, N1, N2
*     ..
*     .. Array Arguments ..
      INTEGER            INDEX( * )
      DOUBLE PRECISION   A( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            CNT, LEFT1, LEFT2, POS, PTR1, PTR2
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          merge
*     ..
*     .. Executable Statements ..
*
*     LEFT1/LEFT2 count the entries not yet consumed from each range.
*
      left1 = n1
      left2 = n2
*
*     A positive stride starts at the low end of the range, any other
*     stride at the high end.
*
      ptr1 = merge( 1, n1, dtrd1.GT.0 )
      ptr2 = merge( 1+n1, n1+n2, dtrd2.GT.0 )
*
*     POS is the last position written in INDEX.
*
      pos = 0
      DO WHILE( left1.GT.0 .AND. left2.GT.0 )
         pos = pos + 1
         IF( a( ptr1 ).LE.a( ptr2 ) ) THEN
            index( pos ) = ptr1
            ptr1 = ptr1 + dtrd1
            left1 = left1 - 1
         ELSE
            index( pos ) = ptr2
            ptr2 = ptr2 + dtrd2
            left2 = left2 - 1
         END IF
      END DO
*
*     Flush whichever range still has entries.
*
      IF( left1.EQ.0 ) THEN
         DO cnt = 1, left2
            pos = pos + 1
            index( pos ) = ptr2
            ptr2 = ptr2 + dtrd2
         END DO
      ELSE
*
*        Second range is exhausted (LEFT2 .EQ. 0).
*
         DO cnt = 1, left1
            pos = pos + 1
            index( pos ) = ptr1
            ptr1 = ptr1 + dtrd1
         END DO
      END IF
*
      RETURN
*
*     End of DLAMRG
*

◆ dlartgs()

subroutine dlartgs	(	double precision	x,
		double precision	y,
		double precision	sigma,
		double precision	cs,
		double precision	sn )

DLARTGS generates a plane rotation designed to introduce a bulge in implicit QR iteration for the bidiagonal SVD problem.

Download DLARTGS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLARTGS generates a plane rotation designed to introduce a bulge in
!> Golub-Reinsch-style implicit QR iteration for the bidiagonal SVD
!> problem. X and Y are the top-row entries, and SIGMA is the shift.
!> The computed CS and SN define a plane rotation satisfying
!>
!>    [  CS  SN  ]  .  [ X^2 - SIGMA^2 ]  =  [ R ],
!>    [ -SN  CS  ]     [     X * Y     ]     [ 0 ]
!>
!> with R nonnegative.  If X^2 - SIGMA^2 and X * Y are 0, then the
!> rotation is by PI/2.
!>

Parameters

[in]	X	!> X is DOUBLE PRECISION !> The (1,1) entry of an upper bidiagonal matrix. !>
[in]	Y	!> Y is DOUBLE PRECISION !> The (1,2) entry of an upper bidiagonal matrix. !>
[in]	SIGMA	!> SIGMA is DOUBLE PRECISION !> The shift. !>
[out]	CS	!> CS is DOUBLE PRECISION !> The cosine of the rotation. !>
[out]	SN	!> SN is DOUBLE PRECISION !> The sine of the rotation. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 89 of file dlartgs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Forms a two-component vector (V1,V2) from X, Y and SIGMA, choosing
*  among four cases so that neither component is computed from a
*  negligible X, and then lets DLARTGP produce the rotation.
*
*     .. Scalar Arguments ..
      DOUBLE PRECISION        CS, SIGMA, SN, X, Y
*     ..
*
*  ===================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION        NEGONE, ONE, ZERO
      parameter( negone = -1.0d0, one = 1.0d0, zero = 0.0d0 )
*     ..
*     .. Local Scalars ..
      LOGICAL                 NOSHFT, TINYX
      DOUBLE PRECISION        ABSX, EPS, RNRM, SGN, V1, V2
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlartgp
*     ..
*     .. External Functions ..
      DOUBLE PRECISION        DLAMCH
      EXTERNAL           dlamch
*     .. Executable Statements ..
*
*     EPS is the machine epsilon returned by DLAMCH; X counts as
*     negligible when its magnitude is below it.
*
      eps = dlamch('E')
      absx = abs( x )
      tinyx = absx.LT.eps
      noshft = sigma.EQ.zero
*
*     (V1,V2) is the first column of B**T*B - SIGMA^2*I, up to a
*     scale factor.
*
      IF( ( noshft .AND. tinyx ) .OR.
     $    ( absx.EQ.sigma .AND. y.EQ.zero ) ) THEN
*
*        Both components vanish.
*
         v1 = zero
         v2 = zero
      ELSE IF( noshft ) THEN
*
*        Zero shift: use (X,Y), negated when X is negative.
*
         IF( x.GE.zero ) THEN
            v1 = x
            v2 = y
         ELSE
            v1 = -x
            v2 = -y
         END IF
      ELSE IF( tinyx ) THEN
*
*        Negligible X with a nonzero shift.
*
         v1 = -sigma*sigma
         v2 = zero
      ELSE
*
*        General case; SGN is +1 for nonnegative X and -1 otherwise.
*
         sgn = negone
         IF( x.GE.zero )
     $      sgn = one
         v1 = sgn*( absx-sigma )*( sgn+sigma/x )
         v2 = sgn*y
      END IF
*
*     Generate the rotation.  The components and the CS/SN outputs
*     are deliberately passed to DLARTGP in swapped order: this
*     ensures that a zero V1 yields a rotation by PI/2.
*
      CALL dlartgp( v2, v1, sn, cs, rnrm )
*
      RETURN
*
*     End DLARTGS
*

◆ dlasq1()

subroutine dlasq1	(	integer	n,
		double precision, dimension( * )	d,
		double precision, dimension( * )	e,
		double precision, dimension( * )	work,
		integer	info )

DLASQ1 computes the singular values of a real square bidiagonal matrix. Used by dbdsqr.

Download DLASQ1 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLASQ1 computes the singular values of a real N-by-N bidiagonal
!> matrix with diagonal D and off-diagonal E. The singular values
!> are computed to high relative accuracy, in the absence of
!> denormalization, underflow and overflow. The algorithm was first
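!> presented in
!>
!> "Accurate singular values and differential qd algorithms" by K. V.
!> Fernando and B. N. Parlett, Numer. Math., Vol-67, No. 2, pp. 191-230,
!> 1994,
!>
!> and the present implementation is described in "An implementation of
!> the dqds Algorithm (Positive Case)", LAPACK Working Note.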
!>

Parameters

[in]	N	!> N is INTEGER !> The number of rows and columns in the matrix. N >= 0. !>
[in,out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> On entry, D contains the diagonal elements of the !> bidiagonal matrix whose SVD is desired. On normal exit, !> D contains the singular values in decreasing order. !>
[in,out]	E	!> E is DOUBLE PRECISION array, dimension (N) !> On entry, elements E(1:N-1) contain the off-diagonal elements !> of the bidiagonal matrix whose SVD is desired. !> On exit, E is overwritten. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (4*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: the algorithm failed !> = 1, a split was marked by a positive value in E !> = 2, current block of Z not diagonalized after 100*N !> iterations (in inner while loop) On exit D and E !> represent a matrix with the same singular values !> which the calling subroutine could use to finish the !> computation, or even feed back into DLASQ1 !> = 3, termination criterion of outer while loop not met !> (program created more than N unreduced blocks) !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 107 of file dlasq1.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Orders 0, 1 and 2 are settled directly.  For larger N the entries
*  of D and E are interleaved into WORK, scaled, squared and handed to
*  DLASQ2; the square roots of its results are scaled back into D
*  (and E when DLASQ2 returns INFO = 2).
*
*     .. Scalar Arguments ..
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   D( * ), E( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO
      parameter( zero = 0.0d0 )
*     ..
*     .. Local Scalars ..
      INTEGER            IERR, J
      DOUBLE PRECISION   BIG, PREC, SCL, SFMIN, SMALL
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dlas2, dlascl, dlasq2, dlasrt, xerbla
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           dlamch
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, sqrt
*     ..
*     .. Executable Statements ..
*
      info = 0
*
*     Invalid and trivial orders.
*
      SELECT CASE( n )
      CASE( :-1 )
         info = -1
         CALL xerbla( 'DLASQ1', -info )
         RETURN
      CASE( 0 )
         RETURN
      CASE( 1 )
         d( 1 ) = abs( d( 1 ) )
         RETURN
      CASE( 2 )
*
*        DLAS2 returns the smaller value in SMALL and the larger in
*        BIG; they are stored largest first.
*
         CALL dlas2( d( 1 ), e( 1 ), d( 2 ), small, big )
         d( 1 ) = big
         d( 2 ) = small
         RETURN
      END SELECT
*
*     Replace D by its absolute values and find the largest
*     off-diagonal magnitude.
*
      DO j = 1, n
         d( j ) = abs( d( j ) )
      END DO
      big = zero
      DO j = 1, n - 1
         big = max( big, abs( e( j ) ) )
      END DO
*
*     All off-diagonals zero: the matrix is already diagonal, so only
*     a sort of D into decreasing order is needed.
*
      IF( big.EQ.zero ) THEN
         CALL dlasrt( 'D', n, d, ierr )
         RETURN
      END IF
*
*     Extend the estimate of the largest singular value to cover the
*     diagonal as well.
*
      DO j = 1, n
         big = max( big, d( j ) )
      END DO
*
*     Interleave D and E into WORK (D in the odd positions, E in the
*     even ones) and scale from BIG to SCL.  Scaling is done before
*     squaring because squaring the input data makes scaling by a
*     power of the radix pointless.
*
      prec = dlamch( 'Precision' )
      sfmin = dlamch( 'Safe minimum' )
      scl = sqrt( prec / sfmin )
      CALL dcopy( n, d, 1, work( 1 ), 2 )
      CALL dcopy( n-1, e, 1, work( 2 ), 2 )
      CALL dlascl( 'G', 0, 0, big, scl, 2*n-1, 1, work, 2*n-1,
     $             ierr )
*
*     Square every entry to obtain the q's and e's; the final slot
*     WORK(2*N) is set to zero.
*
      DO j = 1, 2*n - 1
         work( j ) = work( j )**2
      END DO
      work( 2*n ) = zero
*
      CALL dlasq2( n, work, info )
*
      SELECT CASE( info )
      CASE( 0 )
*
*        Success: take square roots of the leading N results and undo
*        the scaling.
*
         DO j = 1, n
            d( j ) = sqrt( work( j ) )
         END DO
         CALL dlascl( 'G', 0, 0, scl, big, n, 1, d, n, ierr )
      CASE( 2 )
*
*        Maximum number of iterations exceeded.  Move the data from
*        WORK back into D and E, unscaled, so the calling subroutine
*        can try to finish.
*
         DO j = 1, n
            d( j ) = sqrt( work( 2*j-1 ) )
            e( j ) = sqrt( work( 2*j ) )
         END DO
         CALL dlascl( 'G', 0, 0, scl, big, n, 1, d, n, ierr )
         CALL dlascl( 'G', 0, 0, scl, big, n, 1, e, n, ierr )
      END SELECT
*
      RETURN
*
*     End of DLASQ1
*

◆ dlasq2()

subroutine dlasq2	(	integer	n,
		double precision, dimension( * )	z,
		integer	info )

DLASQ2 computes all the eigenvalues of the symmetric positive definite tridiagonal matrix associated with the qd Array Z to high relative accuracy. Used by dbdsqr and dstegr.

Download DLASQ2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLASQ2 computes all the eigenvalues of the symmetric positive
!> definite tridiagonal matrix associated with the qd array Z to high
!> relative accuracy, in the absence of denormalization, underflow
!> and overflow.
!>
!> To see the relation of Z to the tridiagonal matrix, let L be a
!> unit lower bidiagonal matrix with subdiagonals Z(2,4,6,...) and
!> let U be an upper bidiagonal matrix with 1's above and diagonal
!> Z(1,3,5,...). The tridiagonal is L*U or, if you prefer, the
!> symmetric tridiagonal to which it is similar.
!>
!> Note : DLASQ2 defines a logical variable, IEEE, which is true
!> on machines which follow ieee-754 floating-point standard in their
!> handling of infinities and NaNs, and false otherwise. This variable
!> is passed to DLASQ3.
!>

Parameters

[in]

N

!>          N is INTEGER
!>        The number of rows and columns in the matrix. N >= 0.
!>

[in,out]

Z

!>          Z is DOUBLE PRECISION array, dimension ( 4*N )
!>        On entry Z holds the qd array. On exit, entries 1 to N hold
!>        the eigenvalues in decreasing order, Z( 2*N+1 ) holds the
!>        trace, and Z( 2*N+2 ) holds the sum of the eigenvalues. If
!>        N > 2, then Z( 2*N+3 ) holds the iteration count, Z( 2*N+4 )
!>        holds NDIVS/NIN^2, and Z( 2*N+5 ) holds the percentage of
!>        shifts that failed.
!>

[out]

INFO

!>          INFO is INTEGER
!>        = 0: successful exit
!>        < 0: if the i-th argument is a scalar and had an illegal
!>             value, then INFO = -i, if the i-th argument is an
!>             array and the j-entry had an illegal value, then
!>             INFO = -(i*100+j)
!>        > 0: the algorithm failed
!>              = 1, a split was marked by a positive value in E
!>              = 2, current block of Z not diagonalized after 100*N
!>                   iterations (in inner while loop).  On exit Z holds
!>                   a qd array with the same eigenvalues as the given Z.
!>              = 3, termination criterion of outer while loop not met
!>                   (program created more than N unreduced blocks)
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  Local Variables: I0:N0 defines a current unreduced segment of Z.
!>  The shifts are accumulated in SIGMA. Iteration count is in ITER.
!>  Ping-pong is controlled by PP (alternates between 0 and 1).
!>

Definition at line 111 of file dlasq2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLASQ2( N, Z, INFO ).
*
*     Outline of what follows:
*       1. validate N and the sign of the entries of Z, handling
*          N = 0, 1 and 2 directly;
*       2. sum the q's and e's and exit early for diagonal or all-zero
*          data;
*       3. spread Z into the 4-entries-per-row working layout and run
*          two initial dqd sweeps with split checking;
*       4. outer loop (label 160): pick the last unreduced segment
*          I0:N0; inner loop (label 140): call DLASQ3 until the
*          segment is exhausted or the iteration budget runs out;
*       5. on success move the q's to the front of Z, sort them and
*          store summary statistics behind them.
*     INFO = -(200+k) flags a negative Z(k); INFO = 1, 2, 3 are the
*     failure codes set in the outer/inner loops below.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   CBIAS
      parameter( cbias = 1.50d0 )
      DOUBLE PRECISION   ZERO, HALF, ONE, TWO, FOUR, HUNDRD
      parameter( zero = 0.0d0, half = 0.5d0, one = 1.0d0,
     $                     two = 2.0d0, four = 4.0d0, hundrd = 100.0d0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            IEEE
      INTEGER            I0, I1, I4, IINFO, IPN4, ITER, IWHILA, IWHILB,
     $                   K, KMIN, N0, N1, NBIG, NDIV, NFAIL, PP, SPLT,
     $                   TTYPE
      DOUBLE PRECISION   D, DEE, DEEMIN, DESIG, DMIN, DMIN1, DMIN2, DN,
     $                   DN1, DN2, E, EMAX, EMIN, EPS, G, OLDEMN, QMAX,
     $                   QMIN, S, SAFMIN, SIGMA, T, TAU, TEMP, TOL,
     $                   TOL2, TRACE, ZMAX, TEMPE, TEMPQ
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlasq3, dlasrt, xerbla
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           dlamch, ilaenv
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, dble, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments.
*     (in case DLASQ2 is not called by DLASQ1)
*
      info = 0
      eps = dlamch( 'Precision' )
      safmin = dlamch( 'Safe minimum' )
*
*     TOL2 = ( 100*EPS )**2 is the relative threshold used by every
*     negligibility test in this routine.
*
      tol = eps*hundrd
      tol2 = tol**2
*
      IF( n.LT.0 ) THEN
         info = -1
         CALL xerbla( 'DLASQ2', 1 )
         RETURN
      ELSE IF( n.EQ.0 ) THEN
         RETURN
      ELSE IF( n.EQ.1 ) THEN
*
*        1-by-1 case.
*
         IF( z( 1 ).LT.zero ) THEN
            info = -201
            CALL xerbla( 'DLASQ2', 2 )
         END IF
         RETURN
      ELSE IF( n.EQ.2 ) THEN
*
*        2-by-2 case.
*
*        Reject negative entries, then order so that Z(1) >= Z(3).
*
         IF( z( 1 ).LT.zero ) THEN
            info = -201
            CALL xerbla( 'DLASQ2', 2 )
            RETURN
         ELSE IF( z( 2 ).LT.zero ) THEN
            info = -202
            CALL xerbla( 'DLASQ2', 2 )
            RETURN
         ELSE IF( z( 3 ).LT.zero ) THEN
           info = -203
           CALL xerbla( 'DLASQ2', 2 )
           RETURN
         ELSE IF( z( 3 ).GT.z( 1 ) ) THEN
            d = z( 3 )
            z( 3 ) = z( 1 )
            z( 1 ) = d
         END IF
*
*        Z(5) = Z(2*N+1): sum of the three input entries.
*
         z( 5 ) = z( 1 ) + z( 2 ) + z( 3 )
*
*        Only update Z(1) and Z(3) when Z(2) is not negligible
*        relative to Z(3).
*
         IF( z( 2 ).GT.z( 3 )*tol2 ) THEN
            t = half*( ( z( 1 )-z( 3 ) )+z( 2 ) )
            s = z( 3 )*( z( 2 ) / t )
            IF( s.LE.t ) THEN
               s = z( 3 )*( z( 2 ) / ( t*( one+sqrt( one+s / t ) ) ) )
            ELSE
               s = z( 3 )*( z( 2 ) / ( t+sqrt( t )*sqrt( t+s ) ) )
            END IF
            t = z( 1 ) + ( s+z( 2 ) )
            z( 3 ) = z( 3 )*( z( 1 ) / t )
            z( 1 ) = t
         END IF
*
*        Results go to Z(1:2); Z(6) = Z(2*N+2) holds their sum.
*
         z( 2 ) = z( 3 )
         z( 6 ) = z( 2 ) + z( 1 )
         RETURN
      END IF
*
*     Check for negative data and compute sums of q's and e's.
*
*     D accumulates the odd-indexed entries (q's), E the even-indexed
*     ones (e's).  The loop covers the first N-1 pairs; the last q,
*     Z(2*N-1), is handled after the loop.
*
      z( 2*n ) = zero
      emin = z( 2 )
      qmax = zero
      zmax = zero
      d = zero
      e = zero
*
      DO 10 k = 1, 2*( n-1 ), 2
         IF( z( k ).LT.zero ) THEN
            info = -( 200+k )
            CALL xerbla( 'DLASQ2', 2 )
            RETURN
         ELSE IF( z( k+1 ).LT.zero ) THEN
            info = -( 200+k+1 )
            CALL xerbla( 'DLASQ2', 2 )
            RETURN
         END IF
         d = d + z( k )
         e = e + z( k+1 )
         qmax = max( qmax, z( k ) )
         emin = min( emin, z( k+1 ) )
         zmax = max( qmax, zmax, z( k+1 ) )
   10 CONTINUE
      IF( z( 2*n-1 ).LT.zero ) THEN
         info = -( 200+2*n-1 )
         CALL xerbla( 'DLASQ2', 2 )
         RETURN
      END IF
      d = d + z( 2*n-1 )
      qmax = max( qmax, z( 2*n-1 ) )
      zmax = max( qmax, zmax )
*
*     Check for diagonality.
*
*     With all e's zero the q's are compacted into Z(1:N) and sorted
*     in decreasing order.
*     NOTE(review): this exit stores the sum D in Z( 2*N-1 ), whereas
*     the normal exit at the end of the routine stores TRACE in
*     Z( 2*N+1 ) -- confirm which slot callers rely on.
*
      IF( e.EQ.zero ) THEN
         DO 20 k = 2, n
            z( k ) = z( 2*k-1 )
   20    CONTINUE
         CALL dlasrt( 'D', n, z, iinfo )
         z( 2*n-1 ) = d
         RETURN
      END IF
*
      trace = d + e
*
*     Check for zero data.
*
      IF( trace.EQ.zero ) THEN
         z( 2*n-1 ) = zero
         RETURN
      END IF
*
*     Check whether the machine is IEEE conformable.
*
*     The flag is only forwarded to DLASQ3 in the inner loop below.
*
      ieee = ( ilaenv( 10, 'DLASQ2', 'N', 1, 2, 3, 4 ).EQ.1 )
*
*     Rearrange data for locality: Z=(q1,qq1,e1,ee1,q2,qq2,e2,ee2,...).
*
*     K runs downwards so that each source entry Z(K), Z(K-1) is read
*     before the expanded layout overwrites it.
*
      DO 30 k = 2*n, 2, -2
         z( 2*k ) = zero
         z( 2*k-1 ) = z( k )
         z( 2*k-2 ) = zero
         z( 2*k-3 ) = z( k-1 )
   30 CONTINUE
*
      i0 = 1
      n0 = n
*
*     Reverse the qd-array, if warranted.
*
*     Reversal is triggered when the last q exceeds CBIAS times the
*     first q; only the ping entries (offsets -3 and -1) are swapped.
*
      IF( cbias*z( 4*i0-3 ).LT.z( 4*n0-3 ) ) THEN
         ipn4 = 4*( i0+n0 )
         DO 40 i4 = 4*i0, 2*( i0+n0-1 ), 4
            temp = z( i4-3 )
            z( i4-3 ) = z( ipn4-i4-3 )
            z( ipn4-i4-3 ) = temp
            temp = z( i4-1 )
            z( i4-1 ) = z( ipn4-i4-5 )
            z( ipn4-i4-5 ) = temp
   40    CONTINUE
      END IF
*
*     Initial split checking via dqd and Li's test.
*
*     The loop on K runs twice, once with PP = 0 and once with PP = 1.
*
      pp = 0
*
      DO 80 k = 1, 2
*
*        Backward sweep: mark negligible e's (stored as -ZERO).
*
         d = z( 4*n0+pp-3 )
         DO 50 i4 = 4*( n0-1 ) + pp, 4*i0 + pp, -4
            IF( z( i4-1 ).LE.tol2*d ) THEN
               z( i4-1 ) = -zero
               d = z( i4-3 )
            ELSE
               d = z( i4-3 )*( d / ( d+z( i4-1 ) ) )
            END IF
   50    CONTINUE
*
*        dqd maps Z to ZZ plus Li's test.
*
*        The middle branch forms the ratio TEMP only when both
*        SAFMIN-scaled comparisons hold; otherwise the quotients are
*        grouped differently.
*
         emin = z( 4*i0+pp+1 )
         d = z( 4*i0+pp-3 )
         DO 60 i4 = 4*i0 + pp, 4*( n0-1 ) + pp, 4
            z( i4-2*pp-2 ) = d + z( i4-1 )
            IF( z( i4-1 ).LE.tol2*d ) THEN
               z( i4-1 ) = -zero
               z( i4-2*pp-2 ) = d
               z( i4-2*pp ) = zero
               d = z( i4+1 )
            ELSE IF( safmin*z( i4+1 ).LT.z( i4-2*pp-2 ) .AND.
     $               safmin*z( i4-2*pp-2 ).LT.z( i4+1 ) ) THEN
               temp = z( i4+1 ) / z( i4-2*pp-2 )
               z( i4-2*pp ) = z( i4-1 )*temp
               d = d*temp
            ELSE
               z( i4-2*pp ) = z( i4+1 )*( z( i4-1 ) / z( i4-2*pp-2 ) )
               d = z( i4+1 )*( d / z( i4-2*pp-2 ) )
            END IF
            emin = min( emin, z( i4-2*pp ) )
   60    CONTINUE
         z( 4*n0-pp-2 ) = d
*
*        Now find qmax.
*
         qmax = z( 4*i0-pp-2 )
         DO 70 i4 = 4*i0 - pp + 2, 4*n0 - pp - 2, 4
            qmax = max( qmax, z( i4 ) )
   70    CONTINUE
*
*        Prepare for the next iteration on K.
*
         pp = 1 - pp
   80 CONTINUE
*
*     Initialise variables to pass to DLASQ3.
*
      ttype = 0
      dmin1 = zero
      dmin2 = zero
      dn    = zero
      dn1   = zero
      dn2   = zero
      g     = zero
      tau   = zero
*
*     ITER starts at 2 and NDIV at 2*( N0-I0 ); both are updated by
*     DLASQ3 and reported in Z on successful exit.
*
      iter = 2
      nfail = 0
      ndiv = 2*( n0-i0 )
*
*     Outer loop: at most N+1 passes.  Leaving it through label 170
*     means success; running it to completion yields INFO = 3.
*
      DO 160 iwhila = 1, n + 1
         IF( n0.LT.1 )
     $      GO TO 170
*
*        While array unfinished do
*
*        E(N0) holds the value of SIGMA when submatrix in I0:N0
*        splits from the rest of the array, but is negated.
*
         desig = zero
         IF( n0.EQ.n ) THEN
            sigma = zero
         ELSE
            sigma = -z( 4*n0-1 )
         END IF
*
*        A negative SIGMA here means the split marker was positive.
*
         IF( sigma.LT.zero ) THEN
            info = 1
            RETURN
         END IF
*
*        Find last unreduced submatrix's top index I0, find QMAX and
*        EMIN. Find Gershgorin-type bound if Q's much greater than E's.
*
         emax = zero
         IF( n0.GT.i0 ) THEN
            emin = abs( z( 4*n0-5 ) )
         ELSE
            emin = zero
         END IF
         qmin = z( 4*n0-3 )
         qmax = qmin
*
*        Scan upwards from N0; a non-positive e (jump to 100) marks
*        the top of the segment.  If none is found, I4 = 4 gives
*        I0 = 1.
*
         DO 90 i4 = 4*n0, 8, -4
            IF( z( i4-5 ).LE.zero )
     $         GO TO 100
            IF( qmin.GE.four*emax ) THEN
               qmin = min( qmin, z( i4-3 ) )
               emax = max( emax, z( i4-5 ) )
            END IF
            qmax = max( qmax, z( i4-7 )+z( i4-5 ) )
            emin = min( emin, z( i4-5 ) )
   90    CONTINUE
         i4 = 4
*
  100    CONTINUE
         i0 = i4 / 4
         pp = 0
*
*        For segments with more than two rows, locate the row KMIN
*        with the smallest DEE value and flip the segment when KMIN
*        lies in the upper part and DEEMIN <= HALF*Z( 4*N0-3 ).
*
         IF( n0-i0.GT.1 ) THEN
            dee = z( 4*i0-3 )
            deemin = dee
            kmin = i0
            DO 110 i4 = 4*i0+1, 4*n0-3, 4
               dee = z( i4 )*( dee /( dee+z( i4-2 ) ) )
               IF( dee.LE.deemin ) THEN
                  deemin = dee
                  kmin = ( i4+3 )/4
               END IF
  110       CONTINUE
            IF( (kmin-i0)*2.LT.n0-kmin .AND.
     $         deemin.LE.half*z(4*n0-3) ) THEN
               ipn4 = 4*( i0+n0 )
               pp = 2
               DO 120 i4 = 4*i0, 2*( i0+n0-1 ), 4
                  temp = z( i4-3 )
                  z( i4-3 ) = z( ipn4-i4-3 )
                  z( ipn4-i4-3 ) = temp
                  temp = z( i4-2 )
                  z( i4-2 ) = z( ipn4-i4-2 )
                  z( ipn4-i4-2 ) = temp
                  temp = z( i4-1 )
                  z( i4-1 ) = z( ipn4-i4-5 )
                  z( ipn4-i4-5 ) = temp
                  temp = z( i4 )
                  z( i4 ) = z( ipn4-i4-4 )
                  z( ipn4-i4-4 ) = temp
  120          CONTINUE
            END IF
         END IF
*
*        Put -(initial shift) into DMIN.
*
         dmin = -max( zero, qmin-two*sqrt( qmin )*sqrt( emax ) )
*
*        Now I0:N0 is unreduced.
*        PP = 0 for ping, PP = 1 for pong.
*        PP = 2 indicates that flipping was applied to the Z array
*               and that the tests for deflation upon entry in DLASQ3
*               should not be performed.
*
*        Iteration budget: 100 calls to DLASQ3 per row of the segment.
*
         nbig = 100*( n0-i0+1 )
         DO 140 iwhilb = 1, nbig
            IF( i0.GT.n0 )
     $         GO TO 150
*
*           While submatrix unfinished take a good dqds step.
*
            CALL dlasq3( i0, n0, z, pp, dmin, sigma, desig, qmax, nfail,
     $                   iter, ndiv, ieee, ttype, dmin1, dmin2, dn, dn1,
     $                   dn2, g, tau )
*
            pp = 1 - pp
*
*           When EMIN is very small check for splits.
*
*           On a split the marker slot Z( I4-1 ) receives -SIGMA and
*           I0 moves just below the last split found.
*
            IF( pp.EQ.0 .AND. n0-i0.GE.3 ) THEN
               IF( z( 4*n0 ).LE.tol2*qmax .OR.
     $             z( 4*n0-1 ).LE.tol2*sigma ) THEN
                  splt = i0 - 1
                  qmax = z( 4*i0-3 )
                  emin = z( 4*i0-1 )
                  oldemn = z( 4*i0 )
                  DO 130 i4 = 4*i0, 4*( n0-3 ), 4
                     IF( z( i4 ).LE.tol2*z( i4-3 ) .OR.
     $                   z( i4-1 ).LE.tol2*sigma ) THEN
                        z( i4-1 ) = -sigma
                        splt = i4 / 4
                        qmax = zero
                        emin = z( i4+3 )
                        oldemn = z( i4+4 )
                     ELSE
                        qmax = max( qmax, z( i4+1 ) )
                        emin = min( emin, z( i4-1 ) )
                        oldemn = min( oldemn, z( i4 ) )
                     END IF
  130             CONTINUE
                  z( 4*n0-1 ) = emin
                  z( 4*n0 ) = oldemn
                  i0 = splt + 1
               END IF
            END IF
*
  140    CONTINUE
*
*        Falling out of loop 140 means the budget NBIG was used up.
*
         info = 2
*
*        Maximum number of iterations exceeded, restore the shift
*        SIGMA and place the new d's and e's in a qd array.
*        This might need to be done for several blocks
*
         i1 = i0
         n1 = n0
  145    CONTINUE
         tempq = z( 4*i0-3 )
         z( 4*i0-3 ) = z( 4*i0-3 ) + sigma
         DO k = i0+1, n0
            tempe = z( 4*k-5 )
            z( 4*k-5 ) = z( 4*k-5 ) * (tempq / z( 4*k-7 ))
            tempq = z( 4*k-3 )
            z( 4*k-3 ) = z( 4*k-3 ) + sigma + tempe - z( 4*k-5 )
         END DO
*
*        Prepare to do this on the previous block if there is one
*
         IF( i1.GT.1 ) THEN
            n1 = i1-1
            DO WHILE( ( i1.GE.2 ) .AND. ( z(4*i1-5).GE.zero ) )
               i1 = i1 - 1
            END DO
            sigma = -z(4*n1-1)
            GO TO 145
         END IF
*
*        Compress the 4-per-row layout back to the 2-per-row qd
*        layout in Z( 1:2*N ).
*
         DO k = 1, n
            z( 2*k-1 ) = z( 4*k-3 )
*
*        Only the block 1..N0 is unfinished.  The rest of the e's
*        must be essentially zero, although sometimes other data
*        has been stored in them.
*
            IF( k.LT.n0 ) THEN
               z( 2*k ) = z( 4*k-1 )
            ELSE
               z( 2*k ) = 0
            END IF
         END DO
         RETURN
*
*        end IWHILB
*
  150    CONTINUE
*
  160 CONTINUE
*
      info = 3
      RETURN
*
*     end IWHILA
*
  170 CONTINUE
*
*     Move q's to the front.
*
      DO 180 k = 2, n
         z( k ) = z( 4*k-3 )
  180 CONTINUE
*
*     Sort and compute sum of eigenvalues.
*
      CALL dlasrt( 'D', n, z, iinfo )
*
*     The sum runs from K = N down to 1, i.e. smallest value first
*     after the decreasing sort.
*
      e = zero
      DO 190 k = n, 1, -1
         e = e + z( k )
  190 CONTINUE
*
*     Store trace, sum(eigenvalues) and information on performance.
*
      z( 2*n+1 ) = trace
      z( 2*n+2 ) = e
      z( 2*n+3 ) = dble( iter )
      z( 2*n+4 ) = dble( ndiv ) / dble( n**2 )
      z( 2*n+5 ) = hundrd*nfail / dble( iter )
      RETURN
*
*     End of DLASQ2
*

◆ dlasq3()

subroutine dlasq3	(	integer	i0,
		integer	n0,
		double precision, dimension( * )	z,
		integer	pp,
		double precision	dmin,
		double precision	sigma,
		double precision	desig,
		double precision	qmax,
		integer	nfail,
		integer	iter,
		integer	ndiv,
		logical	ieee,
		integer	ttype,
		double precision	dmin1,
		double precision	dmin2,
		double precision	dn,
		double precision	dn1,
		double precision	dn2,
		double precision	g,
		double precision	tau )

DLASQ3 checks for deflation, computes a shift and calls dqds. Used by dbdsqr.

Download DLASQ3 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLASQ3 checks for deflation, computes a shift (TAU) and calls dqds.
!> In case of failure it changes shifts, and tries again until output
!> is positive.
!>

Parameters

[in]	I0	!> I0 is INTEGER !> First index. !>
[in,out]	N0	!> N0 is INTEGER !> Last index. !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, dimension ( 4*N0 ) !> Z holds the qd array. !>
[in,out]	PP	!> PP is INTEGER !> PP=0 for ping, PP=1 for pong. !> PP=2 indicates that flipping was applied to the Z array !> and that the initial tests for deflation should not be !> performed. !>
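[in,out]	DMIN	!> DMIN is DOUBLE PRECISION !> Minimum value of d. The value on entry is tested when deciding whether to reverse the qd array and is passed to DLASQ4. !>
[in,out]	SIGMA	!> SIGMA is DOUBLE PRECISION !> Sum of shifts used in current segment. The value on entry is used in the deflation tests and is increased by the shift TAU on exit. !>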
[in,out]	DESIG	!> DESIG is DOUBLE PRECISION !> Lower order part of SIGMA !>
[in,out]	QMAX	!> QMAX is DOUBLE PRECISION !> Maximum value of q. Updated when the qd array is reversed. !>
[in,out]	NFAIL	!> NFAIL is INTEGER !> Increment NFAIL by 1 each time the shift was too big. !>
[in,out]	ITER	!> ITER is INTEGER !> Increment ITER by 1 for each iteration. !>
[in,out]	NDIV	!> NDIV is INTEGER !> Increment NDIV by 1 for each division. !>
[in]	IEEE	!> IEEE is LOGICAL !> Flag for IEEE or non IEEE arithmetic (passed to DLASQ5). !>
[in,out]	TTYPE	!> TTYPE is INTEGER !> Shift type. !>
[in,out]	DMIN1	!> DMIN1 is DOUBLE PRECISION !>
[in,out]	DMIN2	!> DMIN2 is DOUBLE PRECISION !>
[in,out]	DN	!> DN is DOUBLE PRECISION !>
[in,out]	DN1	!> DN1 is DOUBLE PRECISION !>
[in,out]	DN2	!> DN2 is DOUBLE PRECISION !>
[in,out]	G	!> G is DOUBLE PRECISION !>
[in,out]	TAU	!> TAU is DOUBLE PRECISION !> !> These are passed as arguments in order to save their values !> between calls to DLASQ3. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 179 of file dlasq3.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLASQ3.
*
*     Flow by statement label:
*       10      top of the deflation loop (re-entered after each
*               deflation); returns once N0 < I0
*       20      deflate one eigenvalue   ( N0 := N0 - 1 )
*       30      test whether two eigenvalues can be deflated
*       40      deflate two eigenvalues  ( N0 := N0 - 2 )
*       50      no deflation possible: optional reversal, then DLASQ4
*               chooses the shift TAU
*       70      dqds step via DLASQ5; retried with a new TAU while the
*               step fails
*       80      fallback step via DLASQ6 with TAU = 0
*       90      add TAU to SIGMA, carrying the rounding remainder in
*               DESIG
*
*     .. Scalar Arguments ..
      LOGICAL            IEEE
      INTEGER            I0, ITER, N0, NDIV, NFAIL, PP
      DOUBLE PRECISION   DESIG, DMIN, DMIN1, DMIN2, DN, DN1, DN2, G,
     $                   QMAX, SIGMA, TAU
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   CBIAS
      parameter( cbias = 1.50d0 )
      DOUBLE PRECISION   ZERO, QURTR, HALF, ONE, TWO, HUNDRD
      parameter( zero = 0.0d0, qurtr = 0.250d0, half = 0.5d0,
     $                     one = 1.0d0, two = 2.0d0, hundrd = 100.0d0 )
*     ..
*     .. Local Scalars ..
*     NOTE(review): TTYPE is typed here among the locals, but the
*     routine's argument list documents TTYPE as an [in,out] argument;
*     this declaration therefore types the dummy argument.
      INTEGER            IPN4, J4, N0IN, NN, TTYPE
      DOUBLE PRECISION   EPS, S, T, TEMP, TOL, TOL2
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlasq4, dlasq5, dlasq6
*     ..
*     .. External Function ..
      DOUBLE PRECISION   DLAMCH
      LOGICAL            DISNAN
      EXTERNAL           disnan, dlamch
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     N0IN remembers N0 on entry so that later code (and DLASQ4) can
*     tell whether any eigenvalue was deflated during this call.
*
      n0in = n0
      eps = dlamch( 'Precision' )
      tol = eps*hundrd
      tol2 = tol**2
*
*     Check for deflation.
*
   10 CONTINUE
*
      IF( n0.LT.i0 )
     $   RETURN
      IF( n0.EQ.i0 )
     $   GO TO 20
      nn = 4*n0 + pp
      IF( n0.EQ.( i0+1 ) )
     $   GO TO 40
*
*     Check whether E(N0-1) is negligible, 1 eigenvalue.
*
      IF( z( nn-5 ).GT.tol2*( sigma+z( nn-3 ) ) .AND.
     $    z( nn-2*pp-4 ).GT.tol2*z( nn-7 ) )
     $   GO TO 30
*
   20 CONTINUE
*
*     Store the converged value (current entry plus accumulated shift)
*     in the ping slot of row N0 and shrink the segment by one.
*
      z( 4*n0-3 ) = z( 4*n0+pp-3 ) + sigma
      n0 = n0 - 1
      GO TO 10
*
*     Check  whether E(N0-2) is negligible, 2 eigenvalues.
*
   30 CONTINUE
*
      IF( z( nn-9 ).GT.tol2*sigma .AND.
     $    z( nn-2*pp-8 ).GT.tol2*z( nn-11 ) )
     $   GO TO 50
*
   40 CONTINUE
*
*     Trailing 2-by-2 block: order so that Z( NN-7 ) >= Z( NN-3 ),
*     update the pair when the coupling Z( NN-5 ) is not negligible
*     (and T is nonzero), then store both values shifted by SIGMA.
*
      IF( z( nn-3 ).GT.z( nn-7 ) ) THEN
         s = z( nn-3 )
         z( nn-3 ) = z( nn-7 )
         z( nn-7 ) = s
      END IF
      t = half*( ( z( nn-7 )-z( nn-3 ) )+z( nn-5 ) )
      IF( z( nn-5 ).GT.z( nn-3 )*tol2.AND.t.NE.zero ) THEN
         s = z( nn-3 )*( z( nn-5 ) / t )
         IF( s.LE.t ) THEN
            s = z( nn-3 )*( z( nn-5 ) /
     $          ( t*( one+sqrt( one+s / t ) ) ) )
         ELSE
            s = z( nn-3 )*( z( nn-5 ) / ( t+sqrt( t )*sqrt( t+s ) ) )
         END IF
         t = z( nn-7 ) + ( s+z( nn-5 ) )
         z( nn-3 ) = z( nn-3 )*( z( nn-7 ) / t )
         z( nn-7 ) = t
      END IF
      z( 4*n0-7 ) = z( nn-7 ) + sigma
      z( 4*n0-3 ) = z( nn-3 ) + sigma
      n0 = n0 - 2
      GO TO 10
*
   50 CONTINUE
*
*     PP = 2 (array was flipped by the caller) is mapped back to
*     ping (PP = 0) before any dqds step is taken.
*
      IF( pp.EQ.2 )
     $   pp = 0
*
*     Reverse the qd-array, if warranted.
*
*     Considered only after a failed/zero DMIN or a deflation in this
*     call, and performed when the last q exceeds CBIAS times the
*     first q.  All four entries of each row are swapped.
*
      IF( dmin.LE.zero .OR. n0.LT.n0in ) THEN
         IF( cbias*z( 4*i0+pp-3 ).LT.z( 4*n0+pp-3 ) ) THEN
            ipn4 = 4*( i0+n0 )
            DO 60 j4 = 4*i0, 2*( i0+n0-1 ), 4
               temp = z( j4-3 )
               z( j4-3 ) = z( ipn4-j4-3 )
               z( ipn4-j4-3 ) = temp
               temp = z( j4-2 )
               z( j4-2 ) = z( ipn4-j4-2 )
               z( ipn4-j4-2 ) = temp
               temp = z( j4-1 )
               z( j4-1 ) = z( ipn4-j4-5 )
               z( ipn4-j4-5 ) = temp
               temp = z( j4 )
               z( j4 ) = z( ipn4-j4-4 )
               z( ipn4-j4-4 ) = temp
   60       CONTINUE
            IF( n0-i0.LE.4 ) THEN
               z( 4*n0+pp-1 ) = z( 4*i0+pp-1 )
               z( 4*n0-pp ) = z( 4*i0-pp )
            END IF
            dmin2 = min( dmin2, z( 4*n0+pp-1 ) )
            z( 4*n0+pp-1 ) = min( z( 4*n0+pp-1 ), z( 4*i0+pp-1 ),
     $                            z( 4*i0+pp+3 ) )
            z( 4*n0-pp ) = min( z( 4*n0-pp ), z( 4*i0-pp ),
     $                          z( 4*i0-pp+4 ) )
            qmax = max( qmax, z( 4*i0+pp-3 ), z( 4*i0+pp+1 ) )
            dmin = -zero
         END IF
      END IF
*
*     Choose a shift.
*
      CALL dlasq4( i0, n0, z, pp, n0in, dmin, dmin1, dmin2, dn, dn1,
     $             dn2, tau, ttype, g )
*
*     Call dqds until DMIN > 0.
*
   70 CONTINUE
*
      CALL dlasq5( i0, n0, z, pp, tau, sigma, dmin, dmin1, dmin2, dn,
     $             dn1, dn2, ieee, eps )
*
*     Book-keeping: N0-I0+2 is added to NDIV and ITER is incremented
*     for every step, including failed ones.
*
      ndiv = ndiv + ( n0-i0+2 )
      iter = iter + 1
*
*     Check status.
*
      IF( dmin.GE.zero .AND. dmin1.GE.zero ) THEN
*
*        Success.
*
         GO TO 90
*
      ELSE IF( dmin.LT.zero .AND. dmin1.GT.zero .AND.
     $         z( 4*( n0-1 )-pp ).LT.tol*( sigma+dn1 ) .AND.
     $         abs( dn ).LT.tol*sigma ) THEN
*
*        Convergence hidden by negative DN.
*
         z( 4*( n0-1 )-pp+2 ) = zero
         dmin = zero
         GO TO 90
      ELSE IF( dmin.LT.zero ) THEN
*
*        TAU too big. Select new TAU and try again.
*
*        TTYPE is decreased by 11 or 12 on each retry, so
*        TTYPE < -22 can only hold after at least two retries.
*
         nfail = nfail + 1
         IF( ttype.LT.-22 ) THEN
*
*           Failed twice. Play it safe.
*
            tau = zero
         ELSE IF( dmin1.GT.zero ) THEN
*
*           Late failure. Gives excellent shift.
*
            tau = ( tau+dmin )*( one-two*eps )
            ttype = ttype - 11
         ELSE
*
*           Early failure. Divide by 4.
*
            tau = qurtr*tau
            ttype = ttype - 12
         END IF
         GO TO 70
      ELSE IF( disnan( dmin ) ) THEN
*
*        NaN.
*
*        Retry once with a zero shift; if the shift was already zero
*        fall through to the DLASQ6 step at label 80.
*
         IF( tau.EQ.zero ) THEN
            GO TO 80
         ELSE
            tau = zero
            GO TO 70
         END IF
      ELSE
*
*        Possible underflow. Play it safe.
*
         GO TO 80
      END IF
*
*     Risk of underflow.
*
   80 CONTINUE
      CALL dlasq6( i0, n0, z, pp, dmin, dmin1, dmin2, dn, dn1, dn2 )
      ndiv = ndiv + ( n0-i0+2 )
      iter = iter + 1
      tau = zero
*
   90 CONTINUE
*
*     Accumulate the shift: SIGMA := SIGMA + TAU, with DESIG holding
*     the low-order part that is lost when the sum is rounded.  The
*     two branches differ in which of TAU and SIGMA is the smaller
*     addend.
*
      IF( tau.LT.sigma ) THEN
         desig = desig + tau
         t = sigma + desig
         desig = desig - ( t-sigma )
      ELSE
         t = sigma + tau
         desig = sigma - ( t-tau ) + desig
      END IF
      sigma = t
*
      RETURN
*
*     End of DLASQ3
*

◆ dlasq4()

subroutine dlasq4	(	integer	i0,
		integer	n0,
		double precision, dimension( * )	z,
		integer	pp,
		integer	n0in,
		double precision	dmin,
		double precision	dmin1,
		double precision	dmin2,
		double precision	dn,
		double precision	dn1,
		double precision	dn2,
		double precision	tau,
		integer	ttype,
		double precision	g )

DLASQ4 computes an approximation to the smallest eigenvalue using values of d from the previous transform. Used by dbdsqr.

Download DLASQ4 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLASQ4 computes an approximation TAU to the smallest eigenvalue
!> using values of d from the previous transform.
!>

Parameters

[in]	I0	!> I0 is INTEGER !> First index. !>
[in]	N0	!> N0 is INTEGER !> Last index. !>
[in]	Z	!> Z is DOUBLE PRECISION array, dimension ( 4*N0 ) !> Z holds the qd array. !>
[in]	PP	!> PP is INTEGER !> PP=0 for ping, PP=1 for pong. !>
[in]	N0IN	!> N0IN is INTEGER !> The value of N0 at start of EIGTEST. !>
[in]	DMIN	!> DMIN is DOUBLE PRECISION !> Minimum value of d. !>
[in]	DMIN1	!> DMIN1 is DOUBLE PRECISION !> Minimum value of d, excluding D( N0 ). !>
[in]	DMIN2	!> DMIN2 is DOUBLE PRECISION !> Minimum value of d, excluding D( N0 ) and D( N0-1 ). !>
[in]	DN	!> DN is DOUBLE PRECISION !> d(N) !>
[in]	DN1	!> DN1 is DOUBLE PRECISION !> d(N-1) !>
[in]	DN2	!> DN2 is DOUBLE PRECISION !> d(N-2) !>
[out]	TAU	!> TAU is DOUBLE PRECISION !> This is the shift. !>
[in,out]	TTYPE	!> TTYPE is INTEGER !> Shift type. The value on entry is examined in case 6 (no information to guide the shift) to update G. !>
[in,out]	G	!> G is DOUBLE PRECISION !> G is passed as an argument in order to save its value between !> calls to DLASQ4. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  CNST1 = 9/16 (coded as the rounded value 0.563)
!>

Definition at line 149 of file dlasq4.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            I0, N0, N0IN, PP, TTYPE
      DOUBLE PRECISION   DMIN, DMIN1, DMIN2, DN, DN1, DN2, G, TAU
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   CNST1, CNST2, CNST3
      parameter( cnst1 = 0.5630d0, cnst2 = 1.010d0,
     $                   cnst3 = 1.050d0 )
      DOUBLE PRECISION   QURTR, THIRD, HALF, ZERO, ONE, TWO, HUNDRD
      parameter( qurtr = 0.250d0, third = 0.3330d0,
     $                   half = 0.50d0, zero = 0.0d0, one = 1.0d0,
     $                   two = 2.0d0, hundrd = 100.0d0 )
*     ..
*     .. Local Scalars ..
      INTEGER            I4, NN, NP
      DOUBLE PRECISION   A2, B1, B2, GAM, GAP1, GAP2, S
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     A negative DMIN forces the shift to take that absolute value
*     TTYPE records the type of shift.
*
      IF( dmin.LE.zero ) THEN
         tau = -dmin
         ttype = -1
         RETURN
      END IF
*
      nn = 4*n0 + pp
      IF( n0in.EQ.n0 ) THEN
*
*        No eigenvalues deflated.
*
         IF( dmin.EQ.dn .OR. dmin.EQ.dn1 ) THEN
*
            b1 = sqrt( z( nn-3 ) )*sqrt( z( nn-5 ) )
            b2 = sqrt( z( nn-7 ) )*sqrt( z( nn-9 ) )
            a2 = z( nn-7 ) + z( nn-5 )
*
*           Cases 2 and 3.
*
            IF( dmin.EQ.dn .AND. dmin1.EQ.dn1 ) THEN
               gap2 = dmin2 - a2 - dmin2*qurtr
               IF( gap2.GT.zero .AND. gap2.GT.b2 ) THEN
                  gap1 = a2 - dn - ( b2 / gap2 )*b2
               ELSE
                  gap1 = a2 - dn - ( b1+b2 )
               END IF
               IF( gap1.GT.zero .AND. gap1.GT.b1 ) THEN
                  s = max( dn-( b1 / gap1 )*b1, half*dmin )
                  ttype = -2
               ELSE
                  s = zero
                  IF( dn.GT.b1 )
     $               s = dn - b1
                  IF( a2.GT.( b1+b2 ) )
     $               s = min( s, a2-( b1+b2 ) )
                  s = max( s, third*dmin )
                  ttype = -3
               END IF
            ELSE
*
*              Case 4.
*
               ttype = -4
               s = qurtr*dmin
               IF( dmin.EQ.dn ) THEN
                  gam = dn
                  a2 = zero
                  IF( z( nn-5 ) .GT. z( nn-7 ) )
     $               RETURN
                  b2 = z( nn-5 ) / z( nn-7 )
                  np = nn - 9
               ELSE
                  np = nn - 2*pp
                  gam = dn1
                  IF( z( np-4 ) .GT. z( np-2 ) )
     $               RETURN
                  a2 = z( np-4 ) / z( np-2 )
                  IF( z( nn-9 ) .GT. z( nn-11 ) )
     $               RETURN
                  b2 = z( nn-9 ) / z( nn-11 )
                  np = nn - 13
               END IF
*
*              Approximate contribution to norm squared from I < NN-1.
*
               a2 = a2 + b2
               DO 10 i4 = np, 4*i0 - 1 + pp, -4
                  IF( b2.EQ.zero )
     $               GO TO 20
                  b1 = b2
                  IF( z( i4 ) .GT. z( i4-2 ) )
     $               RETURN
                  b2 = b2*( z( i4 ) / z( i4-2 ) )
                  a2 = a2 + b2
                  IF( hundrd*max( b2, b1 ).LT.a2 .OR. cnst1.LT.a2 )
     $               GO TO 20
   10          CONTINUE
   20          CONTINUE
               a2 = cnst3*a2
*
*              Rayleigh quotient residual bound.
*
               IF( a2.LT.cnst1 )
     $            s = gam*( one-sqrt( a2 ) ) / ( one+a2 )
            END IF
         ELSE IF( dmin.EQ.dn2 ) THEN
*
*           Case 5.
*
            ttype = -5
            s = qurtr*dmin
*
*           Compute contribution to norm squared from I > NN-2.
*
            np = nn - 2*pp
            b1 = z( np-2 )
            b2 = z( np-6 )
            gam = dn2
            IF( z( np-8 ).GT.b2 .OR. z( np-4 ).GT.b1 )
     $         RETURN
            a2 = ( z( np-8 ) / b2 )*( one+z( np-4 ) / b1 )
*
*           Approximate contribution to norm squared from I < NN-2.
*
            IF( n0-i0.GT.2 ) THEN
               b2 = z( nn-13 ) / z( nn-15 )
               a2 = a2 + b2
               DO 30 i4 = nn - 17, 4*i0 - 1 + pp, -4
                  IF( b2.EQ.zero )
     $               GO TO 40
                  b1 = b2
                  IF( z( i4 ) .GT. z( i4-2 ) )
     $               RETURN
                  b2 = b2*( z( i4 ) / z( i4-2 ) )
                  a2 = a2 + b2
                  IF( hundrd*max( b2, b1 ).LT.a2 .OR. cnst1.LT.a2 )
     $               GO TO 40
   30          CONTINUE
   40          CONTINUE
               a2 = cnst3*a2
            END IF
*
            IF( a2.LT.cnst1 )
     $         s = gam*( one-sqrt( a2 ) ) / ( one+a2 )
         ELSE
*
*           Case 6, no information to guide us.
*
            IF( ttype.EQ.-6 ) THEN
               g = g + third*( one-g )
            ELSE IF( ttype.EQ.-18 ) THEN
               g = qurtr*third
            ELSE
               g = qurtr
            END IF
            s = g*dmin
            ttype = -6
         END IF
*
      ELSE IF( n0in.EQ.( n0+1 ) ) THEN
*
*        One eigenvalue just deflated. Use DMIN1, DN1 for DMIN and DN.
*
         IF( dmin1.EQ.dn1 .AND. dmin2.EQ.dn2 ) THEN
*
*           Cases 7 and 8.
*
            ttype = -7
            s = third*dmin1
            IF( z( nn-5 ).GT.z( nn-7 ) )
     $         RETURN
            b1 = z( nn-5 ) / z( nn-7 )
            b2 = b1
            IF( b2.EQ.zero )
     $         GO TO 60
            DO 50 i4 = 4*n0 - 9 + pp, 4*i0 - 1 + pp, -4
               a2 = b1
               IF( z( i4 ).GT.z( i4-2 ) )
     $            RETURN
               b1 = b1*( z( i4 ) / z( i4-2 ) )
               b2 = b2 + b1
               IF( hundrd*max( b1, a2 ).LT.b2 )
     $            GO TO 60
   50       CONTINUE
   60       CONTINUE
            b2 = sqrt( cnst3*b2 )
            a2 = dmin1 / ( one+b2**2 )
            gap2 = half*dmin2 - a2
            IF( gap2.GT.zero .AND. gap2.GT.b2*a2 ) THEN
               s = max( s, a2*( one-cnst2*a2*( b2 / gap2 )*b2 ) )
            ELSE
               s = max( s, a2*( one-cnst2*b2 ) )
               ttype = -8
            END IF
         ELSE
*
*           Case 9.
*
            s = qurtr*dmin1
            IF( dmin1.EQ.dn1 )
     $         s = half*dmin1
            ttype = -9
         END IF
*
      ELSE IF( n0in.EQ.( n0+2 ) ) THEN
*
*        Two eigenvalues deflated. Use DMIN2, DN2 for DMIN and DN.
*
*        Cases 10 and 11.
*
         IF( dmin2.EQ.dn2 .AND. two*z( nn-5 ).LT.z( nn-7 ) ) THEN
            ttype = -10
            s = third*dmin2
            IF( z( nn-5 ).GT.z( nn-7 ) )
     $         RETURN
            b1 = z( nn-5 ) / z( nn-7 )
            b2 = b1
            IF( b2.EQ.zero )
     $         GO TO 80
            DO 70 i4 = 4*n0 - 9 + pp, 4*i0 - 1 + pp, -4
               IF( z( i4 ).GT.z( i4-2 ) )
     $            RETURN
               b1 = b1*( z( i4 ) / z( i4-2 ) )
               b2 = b2 + b1
               IF( hundrd*b1.LT.b2 )
     $            GO TO 80
   70       CONTINUE
   80       CONTINUE
            b2 = sqrt( cnst3*b2 )
            a2 = dmin2 / ( one+b2**2 )
            gap2 = z( nn-7 ) + z( nn-9 ) -
     $             sqrt( z( nn-11 ) )*sqrt( z( nn-9 ) ) - a2
            IF( gap2.GT.zero .AND. gap2.GT.b2*a2 ) THEN
               s = max( s, a2*( one-cnst2*a2*( b2 / gap2 )*b2 ) )
            ELSE
               s = max( s, a2*( one-cnst2*b2 ) )
            END IF
         ELSE
            s = qurtr*dmin2
            ttype = -11
         END IF
      ELSE IF( n0in.GT.( n0+2 ) ) THEN
*
*        Case 12, more than two eigenvalues deflated. No information.
*
         s = zero
         ttype = -12
      END IF
*
      tau = s
      RETURN
*
*     End of DLASQ4
*

◆ dlasq5()

subroutine dlasq5	(	integer	i0,
		integer	n0,
		double precision, dimension( * )	z,
		integer	pp,
		double precision	tau,
		double precision	sigma,
		double precision	dmin,
		double precision	dmin1,
		double precision	dmin2,
		double precision	dn,
		double precision	dnm1,
		double precision	dnm2,
		logical	ieee,
		double precision	eps )

DLASQ5 computes one dqds transform in ping-pong form. Used by sbdsqr and sstegr.

Download DLASQ5 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLASQ5 computes one dqds transform in ping-pong form, one
!> version for IEEE machines another for non IEEE machines.
!>

Parameters

[in]	I0	!> I0 is INTEGER !> First index. !>
[in]	N0	!> N0 is INTEGER !> Last index. !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, dimension ( 4*N ) !> Z holds the qd array; it is updated in place by the transform. On exit, EMIN is stored in Z(4*N0-PP) to avoid !> an extra argument. !>
[in]	PP	!> PP is INTEGER !> PP=0 for ping, PP=1 for pong. !>
[in,out]	TAU	!> TAU is DOUBLE PRECISION !> This is the shift. On exit, TAU has been reset to zero if it was smaller than EPS*(SIGMA+TAU)/2 on entry. !>
[in]	SIGMA	!> SIGMA is DOUBLE PRECISION !> This is the accumulated shift up to this step. !>
[out]	DMIN	!> DMIN is DOUBLE PRECISION !> Minimum value of d. !>
[out]	DMIN1	!> DMIN1 is DOUBLE PRECISION !> Minimum value of d, excluding D( N0 ). !>
[out]	DMIN2	!> DMIN2 is DOUBLE PRECISION !> Minimum value of d, excluding D( N0 ) and D( N0-1 ). !>
[out]	DN	!> DN is DOUBLE PRECISION !> d(N0), the last value of d. !>
[out]	DNM1	!> DNM1 is DOUBLE PRECISION !> d(N0-1). !>
[out]	DNM2	!> DNM2 is DOUBLE PRECISION !> d(N0-2). !>
[in]	IEEE	!> IEEE is LOGICAL !> Flag for IEEE or non IEEE arithmetic. !>
[in]	EPS	!> EPS is DOUBLE PRECISION !> This is the value of epsilon used. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 142 of file dlasq5.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of DLASQ5: one shifted qd sweep over the interleaved array Z
*  for indices I0..N0.  With PP = 0 the sweep reads Z(J4-1), Z(J4+1)
*  and writes Z(J4-2), Z(J4); with PP = 1 it reads Z(J4), Z(J4+2) and
*  writes Z(J4-3), Z(J4-1).  While sweeping it tracks the running
*  minimum of the d values (DMIN, DMIN1, DMIN2) and of the newly
*  written off-diagonal-type entries (EMIN).
*
*  The same sweep is written out four times: for TAU /= 0 and for
*  TAU = 0 (the latter additionally flushes small d to zero), each in
*  an IEEE and a non-IEEE variant.
*
*     .. Scalar Arguments ..
      LOGICAL            IEEE
      INTEGER            I0, N0, PP
      DOUBLE PRECISION   DMIN, DMIN1, DMIN2, DN, DNM1, DNM2, TAU,
     $                   SIGMA, EPS
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameter ..
      DOUBLE PRECISION   ZERO, HALF
      parameter( zero = 0.0d0, half = 0.5 )
*     ..
*     .. Local Scalars ..
      INTEGER            J4, J4P2
      DOUBLE PRECISION   D, EMIN, TEMP, DTHRESH
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          min
*     ..
*     .. Executable Statements ..
*
*     Quick return: when N0-I0 <= 1 no argument is touched.
*
      IF( ( n0-i0-1 ).LE.0 )
     $   RETURN
*
*     DTHRESH is the flush-to-zero threshold used by the TAU = 0
*     variant.  A shift smaller than half of it is replaced by zero;
*     note that this overwrites the caller's TAU.
*
      dthresh = eps*(sigma+tau)
      IF( tau.LT.dthresh*half ) tau = zero
      IF( tau.NE.zero ) THEN
*
*     Start-up: J4 addresses the first entry of the set being read.
*     DMIN1 is given a provisional value here; it is overwritten
*     during the unrolled steps and keeps this value only if the
*     non-IEEE code returns early before reaching them.
*
      j4 = 4*i0 + pp - 3
      emin = z( j4+4 )
      d = z( j4 ) - tau
      dmin = d
      dmin1 = -z( j4 )
*
      IF( ieee ) THEN
*
*        Code for IEEE arithmetic.
*        No sign test is made on D and the quotient is formed
*        unconditionally.
*        NOTE(review): presumably relies on IEEE Inf/NaN propagation
*        so the caller can detect a failed sweep from the outputs -
*        confirm against the caller.
*
         IF( pp.EQ.0 ) THEN
            DO 10 j4 = 4*i0, 4*( n0-3 ), 4
               z( j4-2 ) = d + z( j4-1 )
               temp = z( j4+1 ) / z( j4-2 )
               d = d*temp - tau
               dmin = min( dmin, d )
               z( j4 ) = z( j4-1 )*temp
               emin = min( z( j4 ), emin )
   10       CONTINUE
         ELSE
            DO 20 j4 = 4*i0, 4*( n0-3 ), 4
               z( j4-3 ) = d + z( j4 )
               temp = z( j4+2 ) / z( j4-3 )
               d = d*temp - tau
               dmin = min( dmin, d )
               z( j4-1 ) = z( j4 )*temp
               emin = min( z( j4-1 ), emin )
   20       CONTINUE
         END IF
*
*        Unroll last two steps.
*        J4 and J4P2 are set so that the same statements address the
*        correct read/write entries for both PP = 0 and PP = 1.
*        EMIN is not updated in these two steps.
*
         dnm2 = d
         dmin2 = dmin
         j4 = 4*( n0-2 ) - pp
         j4p2 = j4 + 2*pp - 1
         z( j4-2 ) = dnm2 + z( j4p2 )
         z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
         dnm1 = z( j4p2+2 )*( dnm2 / z( j4-2 ) ) - tau
         dmin = min( dmin, dnm1 )
*
         dmin1 = dmin
         j4 = j4 + 4
         j4p2 = j4 + 2*pp - 1
         z( j4-2 ) = dnm1 + z( j4p2 )
         z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
         dn = z( j4p2+2 )*( dnm1 / z( j4-2 ) ) - tau
         dmin = min( dmin, dn )
*
      ELSE
*
*        Code for non IEEE arithmetic.
*        Each step tests the current d before dividing and returns
*        at once if it is negative.  At that point the sum has
*        already been stored in Z, DMIN already includes the negative
*        value, and outputs assigned later in the routine are left
*        unset.
*
         IF( pp.EQ.0 ) THEN
            DO 30 j4 = 4*i0, 4*( n0-3 ), 4
               z( j4-2 ) = d + z( j4-1 )
               IF( d.LT.zero ) THEN
                  RETURN
               ELSE
                  z( j4 ) = z( j4+1 )*( z( j4-1 ) / z( j4-2 ) )
                  d = z( j4+1 )*( d / z( j4-2 ) ) - tau
               END IF
               dmin = min( dmin, d )
               emin = min( emin, z( j4 ) )
   30       CONTINUE
         ELSE
            DO 40 j4 = 4*i0, 4*( n0-3 ), 4
               z( j4-3 ) = d + z( j4 )
               IF( d.LT.zero ) THEN
                  RETURN
               ELSE
                  z( j4-1 ) = z( j4+2 )*( z( j4 ) / z( j4-3 ) )
                  d = z( j4+2 )*( d / z( j4-3 ) ) - tau
               END IF
               dmin = min( dmin, d )
               emin = min( emin, z( j4-1 ) )
   40       CONTINUE
         END IF
*
*        Unroll last two steps.
*
         dnm2 = d
         dmin2 = dmin
         j4 = 4*( n0-2 ) - pp
         j4p2 = j4 + 2*pp - 1
         z( j4-2 ) = dnm2 + z( j4p2 )
         IF( dnm2.LT.zero ) THEN
            RETURN
         ELSE
            z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
            dnm1 = z( j4p2+2 )*( dnm2 / z( j4-2 ) ) - tau
         END IF
         dmin = min( dmin, dnm1 )
*
         dmin1 = dmin
         j4 = j4 + 4
         j4p2 = j4 + 2*pp - 1
         z( j4-2 ) = dnm1 + z( j4p2 )
         IF( dnm1.LT.zero ) THEN
            RETURN
         ELSE
            z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
            dn = z( j4p2+2 )*( dnm1 / z( j4-2 ) ) - tau
         END IF
         dmin = min( dmin, dn )
*
      END IF
      ELSE
*     This is the version that sets d's to zero if they are small enough
*     It is reached only when TAU is zero, so the "- tau" terms below
*     subtract zero.  Inside the main loops any d below DTHRESH is
*     replaced by zero; the two unrolled steps apply no threshold.
         j4 = 4*i0 + pp - 3
         emin = z( j4+4 )
         d = z( j4 ) - tau
         dmin = d
         dmin1 = -z( j4 )
         IF( ieee ) THEN
*
*     Code for IEEE arithmetic.
*
            IF( pp.EQ.0 ) THEN
               DO 50 j4 = 4*i0, 4*( n0-3 ), 4
                  z( j4-2 ) = d + z( j4-1 )
                  temp = z( j4+1 ) / z( j4-2 )
                  d = d*temp - tau
                  IF( d.LT.dthresh ) d = zero
                  dmin = min( dmin, d )
                  z( j4 ) = z( j4-1 )*temp
                  emin = min( z( j4 ), emin )
 50            CONTINUE
            ELSE
               DO 60 j4 = 4*i0, 4*( n0-3 ), 4
                  z( j4-3 ) = d + z( j4 )
                  temp = z( j4+2 ) / z( j4-3 )
                  d = d*temp - tau
                  IF( d.LT.dthresh ) d = zero
                  dmin = min( dmin, d )
                  z( j4-1 ) = z( j4 )*temp
                  emin = min( z( j4-1 ), emin )
 60            CONTINUE
            END IF
*
*     Unroll last two steps.
*
            dnm2 = d
            dmin2 = dmin
            j4 = 4*( n0-2 ) - pp
            j4p2 = j4 + 2*pp - 1
            z( j4-2 ) = dnm2 + z( j4p2 )
            z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
            dnm1 = z( j4p2+2 )*( dnm2 / z( j4-2 ) ) - tau
            dmin = min( dmin, dnm1 )
*
            dmin1 = dmin
            j4 = j4 + 4
            j4p2 = j4 + 2*pp - 1
            z( j4-2 ) = dnm1 + z( j4p2 )
            z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
            dn = z( j4p2+2 )*( dnm1 / z( j4-2 ) ) - tau
            dmin = min( dmin, dn )
*
         ELSE
*
*     Code for non IEEE arithmetic.
*     The negative-d test is made before the division; the DTHRESH
*     flush is applied to the freshly computed d afterwards.
*
            IF( pp.EQ.0 ) THEN
               DO 70 j4 = 4*i0, 4*( n0-3 ), 4
                  z( j4-2 ) = d + z( j4-1 )
                  IF( d.LT.zero ) THEN
                     RETURN
                  ELSE
                     z( j4 ) = z( j4+1 )*( z( j4-1 ) / z( j4-2 ) )
                     d = z( j4+1 )*( d / z( j4-2 ) ) - tau
                  END IF
                  IF( d.LT.dthresh) d = zero
                  dmin = min( dmin, d )
                  emin = min( emin, z( j4 ) )
 70            CONTINUE
            ELSE
               DO 80 j4 = 4*i0, 4*( n0-3 ), 4
                  z( j4-3 ) = d + z( j4 )
                  IF( d.LT.zero ) THEN
                     RETURN
                  ELSE
                     z( j4-1 ) = z( j4+2 )*( z( j4 ) / z( j4-3 ) )
                     d = z( j4+2 )*( d / z( j4-3 ) ) - tau
                  END IF
                  IF( d.LT.dthresh) d = zero
                  dmin = min( dmin, d )
                  emin = min( emin, z( j4-1 ) )
 80            CONTINUE
            END IF
*
*     Unroll last two steps.
*
            dnm2 = d
            dmin2 = dmin
            j4 = 4*( n0-2 ) - pp
            j4p2 = j4 + 2*pp - 1
            z( j4-2 ) = dnm2 + z( j4p2 )
            IF( dnm2.LT.zero ) THEN
               RETURN
            ELSE
               z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
               dnm1 = z( j4p2+2 )*( dnm2 / z( j4-2 ) ) - tau
            END IF
            dmin = min( dmin, dnm1 )
*
            dmin1 = dmin
            j4 = j4 + 4
            j4p2 = j4 + 2*pp - 1
            z( j4-2 ) = dnm1 + z( j4p2 )
            IF( dnm1.LT.zero ) THEN
               RETURN
            ELSE
               z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
               dn = z( j4p2+2 )*( dnm1 / z( j4-2 ) ) - tau
            END IF
            dmin = min( dmin, dn )
*
         END IF
      END IF
*
*     Normal exit only (the early RETURNs above skip this): store the
*     last d at Z(4*N0-PP-2) and the minimum off-diagonal-type entry
*     at Z(4*N0-PP).
*
      z( j4+2 ) = dn
      z( 4*n0-pp ) = emin
      RETURN
*
*     End of DLASQ5
*

◆ dlasq6()

subroutine dlasq6	(	integer	i0,
		integer	n0,
		double precision, dimension( * )	z,
		integer	pp,
		double precision	dmin,
		double precision	dmin1,
		double precision	dmin2,
		double precision	dn,
		double precision	dnm1,
		double precision	dnm2 )

DLASQ6 computes one dqd transform in ping-pong form. Used by sbdsqr and sstegr.

Download DLASQ6 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLASQ6 computes one dqd (shift equal to zero) transform in
!> ping-pong form, with protection against underflow and overflow.
!>

Parameters

[in]	I0	!> I0 is INTEGER !> First index. !>
[in]	N0	!> N0 is INTEGER !> Last index. !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, dimension ( 4*N ) !> Z holds the qd array; it is updated in place by the transform. On exit, EMIN is stored in Z(4*N0-PP) to avoid !> an extra argument. !>
[in]	PP	!> PP is INTEGER !> PP=0 for ping, PP=1 for pong. !>
[out]	DMIN	!> DMIN is DOUBLE PRECISION !> Minimum value of d. !>
[out]	DMIN1	!> DMIN1 is DOUBLE PRECISION !> Minimum value of d, excluding D( N0 ). !>
[out]	DMIN2	!> DMIN2 is DOUBLE PRECISION !> Minimum value of d, excluding D( N0 ) and D( N0-1 ). !>
[out]	DN	!> DN is DOUBLE PRECISION !> d(N0), the last value of d. !>
[out]	DNM1	!> DNM1 is DOUBLE PRECISION !> d(N0-1). !>
[out]	DNM2	!> DNM2 is DOUBLE PRECISION !> d(N0-2). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 117 of file dlasq6.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of DLASQ6: one zero-shift qd sweep over the interleaved array
*  Z for indices I0..N0.  With PP = 0 the sweep reads Z(J4-1), Z(J4+1)
*  and writes Z(J4-2), Z(J4); with PP = 1 it reads Z(J4), Z(J4+2) and
*  writes Z(J4-3), Z(J4-1).  DMIN, DMIN1, DMIN2 track the running
*  minimum of d; EMIN tracks the minimum of the entries written to
*  Z(J4) (PP = 0) or Z(J4-1) (PP = 1) in the main loop.
*
*  Every step has three cases:
*    1. the new sum is exactly zero: the written entry is set to
*       zero, d restarts from the next input entry, DMIN is reset to
*       that value and EMIN is set to zero;
*    2. the numerator and denominator are within a factor 1/SAFMIN of
*       each other: a single quotient TEMP is formed and reused;
*    3. otherwise: each result is formed as value*(ratio), with the
*       division done inside the parentheses.
*  NOTE(review): cases 2 and 3 are presumably the "protection against
*  underflow and overflow" mentioned in the routine description.
*
*     .. Scalar Arguments ..
      INTEGER            I0, N0, PP
      DOUBLE PRECISION   DMIN, DMIN1, DMIN2, DN, DNM1, DNM2
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameter ..
      DOUBLE PRECISION   ZERO
      parameter( zero = 0.0d0 )
*     ..
*     .. Local Scalars ..
      INTEGER            J4, J4P2
      DOUBLE PRECISION   D, EMIN, SAFMIN, TEMP
*     ..
*     .. External Function ..
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           dlamch
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          min
*     ..
*     .. Executable Statements ..
*
*     Quick return: when N0-I0 <= 1 no argument is touched.
*
      IF( ( n0-i0-1 ).LE.0 )
     $   RETURN
*
*     Start-up: J4 addresses the first entry of the set being read.
*
      safmin = dlamch( 'Safe minimum' )
      j4 = 4*i0 + pp - 3
      emin = z( j4+4 )
      d = z( j4 )
      dmin = d
*
      IF( pp.EQ.0 ) THEN
         DO 10 j4 = 4*i0, 4*( n0-3 ), 4
            z( j4-2 ) = d + z( j4-1 )
            IF( z( j4-2 ).EQ.zero ) THEN
               z( j4 ) = zero
               d = z( j4+1 )
               dmin = d
               emin = zero
            ELSE IF( safmin*z( j4+1 ).LT.z( j4-2 ) .AND.
     $               safmin*z( j4-2 ).LT.z( j4+1 ) ) THEN
               temp = z( j4+1 ) / z( j4-2 )
               z( j4 ) = z( j4-1 )*temp
               d = d*temp
            ELSE
               z( j4 ) = z( j4+1 )*( z( j4-1 ) / z( j4-2 ) )
               d = z( j4+1 )*( d / z( j4-2 ) )
            END IF
            dmin = min( dmin, d )
            emin = min( emin, z( j4 ) )
   10    CONTINUE
      ELSE
         DO 20 j4 = 4*i0, 4*( n0-3 ), 4
            z( j4-3 ) = d + z( j4 )
            IF( z( j4-3 ).EQ.zero ) THEN
               z( j4-1 ) = zero
               d = z( j4+2 )
               dmin = d
               emin = zero
            ELSE IF( safmin*z( j4+2 ).LT.z( j4-3 ) .AND.
     $               safmin*z( j4-3 ).LT.z( j4+2 ) ) THEN
               temp = z( j4+2 ) / z( j4-3 )
               z( j4-1 ) = z( j4 )*temp
               d = d*temp
            ELSE
               z( j4-1 ) = z( j4+2 )*( z( j4 ) / z( j4-3 ) )
               d = z( j4+2 )*( d / z( j4-3 ) )
            END IF
            dmin = min( dmin, d )
            emin = min( emin, z( j4-1 ) )
   20    CONTINUE
      END IF
*
*     Unroll last two steps.
*     J4 and J4P2 are set so that the same statements address the
*     correct read/write entries for both PP = 0 and PP = 1.  In
*     these steps EMIN is only changed by the zero-sum case.
*
      dnm2 = d
      dmin2 = dmin
      j4 = 4*( n0-2 ) - pp
      j4p2 = j4 + 2*pp - 1
      z( j4-2 ) = dnm2 + z( j4p2 )
      IF( z( j4-2 ).EQ.zero ) THEN
         z( j4 ) = zero
         dnm1 = z( j4p2+2 )
         dmin = dnm1
         emin = zero
      ELSE IF( safmin*z( j4p2+2 ).LT.z( j4-2 ) .AND.
     $         safmin*z( j4-2 ).LT.z( j4p2+2 ) ) THEN
         temp = z( j4p2+2 ) / z( j4-2 )
         z( j4 ) = z( j4p2 )*temp
         dnm1 = dnm2*temp
      ELSE
         z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
         dnm1 = z( j4p2+2 )*( dnm2 / z( j4-2 ) )
      END IF
      dmin = min( dmin, dnm1 )
*
      dmin1 = dmin
      j4 = j4 + 4
      j4p2 = j4 + 2*pp - 1
      z( j4-2 ) = dnm1 + z( j4p2 )
      IF( z( j4-2 ).EQ.zero ) THEN
         z( j4 ) = zero
         dn = z( j4p2+2 )
         dmin = dn
         emin = zero
      ELSE IF( safmin*z( j4p2+2 ).LT.z( j4-2 ) .AND.
     $         safmin*z( j4-2 ).LT.z( j4p2+2 ) ) THEN
         temp = z( j4p2+2 ) / z( j4-2 )
         z( j4 ) = z( j4p2 )*temp
         dn = dnm1*temp
      ELSE
         z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
         dn = z( j4p2+2 )*( dnm1 / z( j4-2 ) )
      END IF
      dmin = min( dmin, dn )
*
*     Store the last d at Z(4*N0-PP-2) and EMIN at Z(4*N0-PP).
*
      z( j4+2 ) = dn
      z( 4*n0-pp ) = emin
      RETURN
*
*     End of DLASQ6
*

◆ dlasrt()

subroutine dlasrt	(	character	id,
		integer	n,
		double precision, dimension( * )	d,
		integer	info )

DLASRT sorts numbers in increasing or decreasing order.

Download DLASRT + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> Sort the numbers in D in increasing order (if ID = 'I') or
!> in decreasing order (if ID = 'D' ).
!>
!> Use Quick Sort, reverting to Insertion sort on arrays of
!> size <= 20. Dimension of STACK limits N to about 2**32.
!>

Parameters

[in]	ID	!> ID is CHARACTER*1 !> = 'I': sort D in increasing order; !> = 'D': sort D in decreasing order. !>
[in]	N	!> N is INTEGER !> The length of the array D. !>
[in,out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> On entry, the array to be sorted. !> On exit, D has been sorted into increasing order !> (D(1) <= ... <= D(N) ) or into decreasing order !> (D(1) >= ... >= D(N) ), depending on ID. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 87 of file dlasrt.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of DLASRT: sorts D(1:N) in place, decreasing if ID = 'D' and
*  increasing if ID = 'I'.
*
*  Method: non-recursive quicksort driven by an explicit stack of
*  (START, ENDD) sub-ranges.  A popped range with
*  0 < ENDD-START <= SELECT is finished by insertion sort; a longer
*  range is partitioned about the median of its first, middle and
*  last entries and both parts are pushed, the larger part first so
*  that the smaller part is popped and processed next.  Ranges with
*  ENDD = START need no work and are simply dropped.
*
*  On an invalid ID or a negative N, INFO is set to -1 or -2
*  respectively, XERBLA is called and D is left untouched.
*
*     .. Scalar Arguments ..
      CHARACTER          ID
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   D( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            SELECT
      parameter( SELECT = 20 )
*     ..
*     .. Local Scalars ..
      INTEGER            DIR, ENDD, I, J, START, STKPNT
      DOUBLE PRECISION   D1, D2, D3, DMNMX, TMP
*     ..
*     .. Local Arrays ..
      INTEGER            STACK( 2, 32 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*     DIR encodes the direction: 0 = decreasing, 1 = increasing,
*     -1 = ID not recognised.
*
      info = 0
      dir = -1
      IF( lsame( id, 'D' ) ) THEN
         dir = 0
      ELSE IF( lsame( id, 'I' ) ) THEN
         dir = 1
      END IF
      IF( dir.EQ.-1 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DLASRT', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.LE.1 )
     $   RETURN
*
*     Seed the stack with the whole range, then loop: pop one range
*     per pass through label 10 until the stack is empty.
*
      stkpnt = 1
      stack( 1, 1 ) = 1
      stack( 2, 1 ) = n
   10 CONTINUE
      start = stack( 1, stkpnt )
      endd = stack( 2, stkpnt )
      stkpnt = stkpnt - 1
      IF( endd-start.LE.SELECT .AND. endd-start.GT.0 ) THEN
*
*        Do Insertion sort on D( START:ENDD )
*        Each new entry is bubbled towards START until it meets an
*        entry that is already in order with it.
*
         IF( dir.EQ.0 ) THEN
*
*           Sort into decreasing order
*
            DO 30 i = start + 1, endd
               DO 20 j = i, start + 1, -1
                  IF( d( j ).GT.d( j-1 ) ) THEN
                     dmnmx = d( j )
                     d( j ) = d( j-1 )
                     d( j-1 ) = dmnmx
                  ELSE
                     GO TO 30
                  END IF
   20          CONTINUE
   30       CONTINUE
*
         ELSE
*
*           Sort into increasing order
*
            DO 50 i = start + 1, endd
               DO 40 j = i, start + 1, -1
                  IF( d( j ).LT.d( j-1 ) ) THEN
                     dmnmx = d( j )
                     d( j ) = d( j-1 )
                     d( j-1 ) = dmnmx
                  ELSE
                     GO TO 50
                  END IF
   40          CONTINUE
   50       CONTINUE
*
         END IF
*
      ELSE IF( endd-start.GT.SELECT ) THEN
*
*        Partition D( START:ENDD ) and stack parts, largest one first
*
*        Choose partition entry as median of 3
*
*        The midpoint is formed as START + (ENDD-START)/2 rather than
*        (START+ENDD)/2: both give the same index, but the sum
*        START+ENDD can exceed the largest default INTEGER when N is
*        very large, whereas ENDD-START cannot.
*
         d1 = d( start )
         d2 = d( endd )
         i = start + ( endd-start ) / 2
         d3 = d( i )
         IF( d1.LT.d2 ) THEN
            IF( d3.LT.d1 ) THEN
               dmnmx = d1
            ELSE IF( d3.LT.d2 ) THEN
               dmnmx = d3
            ELSE
               dmnmx = d2
            END IF
         ELSE
            IF( d3.LT.d2 ) THEN
               dmnmx = d2
            ELSE IF( d3.LT.d1 ) THEN
               dmnmx = d3
            ELSE
               dmnmx = d1
            END IF
         END IF
*
         IF( dir.EQ.0 ) THEN
*
*           Sort into decreasing order
*
*           Two-pointer partition about DMNMX: J scans down past
*           entries smaller than the pivot, I scans up past entries
*           larger than it, and the pair is swapped while I < J.
*           On exit D(START:J) and D(J+1:ENDD) are the two parts.
*
            i = start - 1
            j = endd + 1
   60       CONTINUE
   70       CONTINUE
            j = j - 1
            IF( d( j ).LT.dmnmx )
     $         GO TO 70
   80       CONTINUE
            i = i + 1
            IF( d( i ).GT.dmnmx )
     $         GO TO 80
            IF( i.LT.j ) THEN
               tmp = d( i )
               d( i ) = d( j )
               d( j ) = tmp
               GO TO 60
            END IF
*
*           Push the larger part first so the smaller one is on top
*           of the stack and is processed next.
*
            IF( j-start.GT.endd-j-1 ) THEN
               stkpnt = stkpnt + 1
               stack( 1, stkpnt ) = start
               stack( 2, stkpnt ) = j
               stkpnt = stkpnt + 1
               stack( 1, stkpnt ) = j + 1
               stack( 2, stkpnt ) = endd
            ELSE
               stkpnt = stkpnt + 1
               stack( 1, stkpnt ) = j + 1
               stack( 2, stkpnt ) = endd
               stkpnt = stkpnt + 1
               stack( 1, stkpnt ) = start
               stack( 2, stkpnt ) = j
            END IF
         ELSE
*
*           Sort into increasing order
*
*           Same partition with the comparisons reversed: J scans
*           down past entries larger than the pivot, I scans up past
*           entries smaller than it.
*
            i = start - 1
            j = endd + 1
   90       CONTINUE
  100       CONTINUE
            j = j - 1
            IF( d( j ).GT.dmnmx )
     $         GO TO 100
  110       CONTINUE
            i = i + 1
            IF( d( i ).LT.dmnmx )
     $         GO TO 110
            IF( i.LT.j ) THEN
               tmp = d( i )
               d( i ) = d( j )
               d( j ) = tmp
               GO TO 90
            END IF
            IF( j-start.GT.endd-j-1 ) THEN
               stkpnt = stkpnt + 1
               stack( 1, stkpnt ) = start
               stack( 2, stkpnt ) = j
               stkpnt = stkpnt + 1
               stack( 1, stkpnt ) = j + 1
               stack( 2, stkpnt ) = endd
            ELSE
               stkpnt = stkpnt + 1
               stack( 1, stkpnt ) = j + 1
               stack( 2, stkpnt ) = endd
               stkpnt = stkpnt + 1
               stack( 1, stkpnt ) = start
               stack( 2, stkpnt ) = j
            END IF
         END IF
      END IF
*
*     Continue while any sub-range is still waiting on the stack.
*
      IF( stkpnt.GT.0 )
     $   GO TO 10
      RETURN
*
*     End of DLASRT
*

◆ dstebz()

subroutine dstebz	(	character	range,
		character	order,
		integer	n,
		double precision	vl,
		double precision	vu,
		integer	il,
		integer	iu,
		double precision	abstol,
		double precision, dimension( * )	d,
		double precision, dimension( * )	e,
		integer	m,
		integer	nsplit,
		double precision, dimension( * )	w,
		integer, dimension( * )	iblock,
		integer, dimension( * )	isplit,
		double precision, dimension( * )	work,
		integer, dimension( * )	iwork,
		integer	info )

DSTEBZ

Download DSTEBZ + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DSTEBZ computes the eigenvalues of a symmetric tridiagonal
!> matrix T.  The user may ask for all eigenvalues, all eigenvalues
!> in the half-open interval (VL, VU], or the IL-th through IU-th
!> eigenvalues.
!>
!> To avoid overflow, the matrix must be scaled so that its
!> largest element is no greater than overflow**(1/2) * underflow**(1/4) in absolute value, and for greatest
!> accuracy, it should not be much smaller than that.
!>
!> See W. Kahan , Report CS41, Computer Science Dept., Stanford
!> University, July 21, 1966.
!>

Parameters

[in]	RANGE	!> RANGE is CHARACTER*1 !> = 'A': ("All") all eigenvalues will be found. !> = 'V': ("Value") all eigenvalues in the half-open interval !> (VL, VU] will be found. !> = 'I': ("Index") the IL-th through IU-th eigenvalues (of the !> entire matrix) will be found. !>
[in]	ORDER	!> ORDER is CHARACTER*1 !> = 'B': ("By Block") the eigenvalues will be grouped by !> split-off block (see IBLOCK, ISPLIT) and !> ordered from smallest to largest within !> the block. !> = 'E': ("Entire matrix") !> the eigenvalues for the entire matrix !> will be ordered from smallest to !> largest. !>
[in]	N	!> N is INTEGER !> The order of the tridiagonal matrix T. N >= 0. !>
[in]	VL	!> VL is DOUBLE PRECISION !> !> If RANGE='V', the lower bound of the interval to !> be searched for eigenvalues. Eigenvalues less than or equal !> to VL, or greater than VU, will not be returned. VL < VU. !> Not referenced if RANGE = 'A' or 'I'. !>
[in]	VU	!> VU is DOUBLE PRECISION !> !> If RANGE='V', the upper bound of the interval to !> be searched for eigenvalues. Eigenvalues less than or equal !> to VL, or greater than VU, will not be returned. VL < VU. !> Not referenced if RANGE = 'A' or 'I'. !>
[in]	IL	!> IL is INTEGER !> !> If RANGE='I', the index of the !> smallest eigenvalue to be returned. !> 1 <= IL <= IU <= N, if N > 0; IL = 1 and IU = 0 if N = 0. !> Not referenced if RANGE = 'A' or 'V'. !>
[in]	IU	!> IU is INTEGER !> !> If RANGE='I', the index of the !> largest eigenvalue to be returned. !> 1 <= IL <= IU <= N, if N > 0; IL = 1 and IU = 0 if N = 0. !> Not referenced if RANGE = 'A' or 'V'. !>
[in]	ABSTOL	!> ABSTOL is DOUBLE PRECISION !> The absolute tolerance for the eigenvalues. An eigenvalue !> (or cluster) is considered to be located if it has been !> determined to lie in an interval whose width is ABSTOL or !> less. If ABSTOL is less than or equal to zero, then ULP*|T| !> will be used, where |T| means the 1-norm of T. !> !> Eigenvalues will be computed most accurately when ABSTOL is !> set to twice the underflow threshold 2*DLAMCH('S'), not zero. !>
[in]	D	!> D is DOUBLE PRECISION array, dimension (N) !> The n diagonal elements of the tridiagonal matrix T. !>
[in]	E	!> E is DOUBLE PRECISION array, dimension (N-1) !> The (n-1) off-diagonal elements of the tridiagonal matrix T. !>
[out]	M	!> M is INTEGER !> The actual number of eigenvalues found. 0 <= M <= N. !> (See also the description of INFO=2,3.) !>
[out]	NSPLIT	!> NSPLIT is INTEGER !> The number of diagonal blocks in the matrix T. !> 1 <= NSPLIT <= N. !>
[out]	W	!> W is DOUBLE PRECISION array, dimension (N) !> On exit, the first M elements of W will contain the !> eigenvalues. (DSTEBZ may use the remaining N-M elements as !> workspace.) !>
[out]	IBLOCK	!> IBLOCK is INTEGER array, dimension (N) !> At each row/column j where E(j) is zero or small, the !> matrix T is considered to split into a block diagonal !> matrix. On exit, if INFO = 0, IBLOCK(i) specifies to which !> block (from 1 to the number of blocks) the eigenvalue W(i) !> belongs. (DSTEBZ may use the remaining N-M elements as !> workspace.) !>
[out]	ISPLIT	!> ISPLIT is INTEGER array, dimension (N) !> The splitting points, at which T breaks up into submatrices. !> The first submatrix consists of rows/columns 1 to ISPLIT(1), !> the second of rows/columns ISPLIT(1)+1 through ISPLIT(2), !> etc., and the NSPLIT-th consists of rows/columns !> ISPLIT(NSPLIT-1)+1 through ISPLIT(NSPLIT)=N. !> (Only the first NSPLIT elements will actually be used, but !> since the user cannot know a priori what value NSPLIT will !> have, N words must be reserved for ISPLIT.) !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (4*N) !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (3*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: some or all of the eigenvalues failed to converge or !> were not computed: !> =1 or 3: Bisection failed to converge for some !> eigenvalues; these eigenvalues are flagged by a !> negative block number. The effect is that the !> eigenvalues may not be as accurate as the !> absolute and relative tolerances. This is !> generally caused by unexpectedly inaccurate !> arithmetic. !> =2 or 3: RANGE='I' only: Not all of the eigenvalues !> IL:IU were found. !> Effect: M < IU+1-IL !> Cause: non-monotonic arithmetic, causing the !> Sturm sequence to be non-monotonic. !> Cure: recalculate, using RANGE='A', and pick !> out eigenvalues IL:IU. In some cases, !> increasing the PARAMETER "FUDGE" may !> make things work. !> = 4: RANGE='I', and the Gershgorin interval !> initially used was too small. No eigenvalues !> were computed. !> Probable cause: your machine has sloppy !> floating-point arithmetic. !> Cure: Increase the PARAMETER "FUDGE", !> recompile, and try again. !>

Internal Parameters:

!>  RELFAC  DOUBLE PRECISION, default = 2.0e0
!>          The relative tolerance.  An interval (a,b] lies within
!>          "relative tolerance" if  b-a < RELFAC*ulp*max(|a|,|b|),
!>          where "ulp" is the machine precision (distance from 1 to
!>          the next larger floating point number.)
!>
!>  FUDGE   DOUBLE PRECISION, default = 2.1
!>          A "fudge factor" to widen the Gershgorin intervals.  Ideally,
!>          a value of 1 should work, but on machines with sloppy
!>          arithmetic, this needs to be larger.  The default for
!>          publicly released versions should be large enough to handle
!>          the worst machine around.  Note that this has no effect
!>          on accuracy of the solution.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 270 of file dstebz.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DSTEBZ.  Flow of the code below:
*       1. decode and validate RANGE, ORDER, N and the VL/VU or IL/IU
*          selectors;
*       2. split the tridiagonal matrix (D,E) into independent blocks
*          wherever an off-diagonal entry is negligible;
*       3. for RANGE='I', bracket eigenvalues IL..IU by a value
*          interval (WL,WU] using DLAEBZ on the whole matrix;
*       4. for every block, count and refine the eigenvalues inside
*          the target interval with DLAEBZ and store them in W, with
*          the owning block number in IBLOCK;
*       5. for RANGE='I', discard surplus eigenvalues;
*       6. for ORDER='E', sort W (and IBLOCK) ascending;
*       7. encode non-convergence (+1) and too-few-found (+2) in INFO.
*
*     .. Scalar Arguments ..
      CHARACTER          ORDER, RANGE
      INTEGER            IL, INFO, IU, M, N, NSPLIT
      DOUBLE PRECISION   ABSTOL, VL, VU
*     ..
*     .. Array Arguments ..
      INTEGER            IBLOCK( * ), ISPLIT( * ), IWORK( * )
      DOUBLE PRECISION   D( * ), E( * ), W( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     FUDGE widens every Gershgorin interval computed below; RELFAC
*     multiplies ULP to form the relative tolerance RTOLI.
      DOUBLE PRECISION   ZERO, ONE, TWO, HALF
      parameter( zero = 0.0d0, one = 1.0d0, two = 2.0d0,
     $                   half = 1.0d0 / two )
      DOUBLE PRECISION   FUDGE, RELFAC
      parameter( fudge = 2.1d0, relfac = 2.0d0 )
*     ..
*     .. Local Scalars ..
*     NCNVRG / TOOFEW are the two failure flags folded into INFO at
*     the very end of the routine.
      LOGICAL            NCNVRG, TOOFEW
      INTEGER            IB, IBEGIN, IDISCL, IDISCU, IE, IEND, IINFO,
     $                   IM, IN, IOFF, IORDER, IOUT, IRANGE, ITMAX,
     $                   ITMP1, IW, IWOFF, J, JB, JDISC, JE, NB, NWL,
     $                   NWU
      DOUBLE PRECISION   ATOLI, BNORM, GL, GU, PIVMIN, RTOLI, SAFEMN,
     $                   TMP1, TMP2, TNORM, ULP, WKILL, WL, WLU, WU, WUL
*     ..
*     .. Local Arrays ..
*     IDUMMA is a length-1 integer array passed to DLAEBZ in the
*     per-block calls, in the argument position that the RANGE='I'
*     call fills with IWORK( 5 ).
      INTEGER            IDUMMA( 1 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           lsame, ilaenv, dlamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlaebz, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, int, log, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
      info = 0
*
*     Decode RANGE
*     IRANGE: 1 = 'A', 2 = 'V', 3 = 'I', 0 = unrecognised.
*
      IF( lsame( range, 'A' ) ) THEN
         irange = 1
      ELSE IF( lsame( range, 'V' ) ) THEN
         irange = 2
      ELSE IF( lsame( range, 'I' ) ) THEN
         irange = 3
      ELSE
         irange = 0
      END IF
*
*     Decode ORDER
*     IORDER: 2 = 'B', 1 = 'E', 0 = unrecognised.
*
      IF( lsame( order, 'B' ) ) THEN
         iorder = 2
      ELSE IF( lsame( order, 'E' ) ) THEN
         iorder = 1
      ELSE
         iorder = 0
      END IF
*
*     Check for Errors
*     The negative INFO value set here is negated and passed to
*     XERBLA below.  VL/VU are only checked for RANGE='V'
*     and IL/IU only for RANGE='I'.
*
      IF( irange.LE.0 ) THEN
         info = -1
      ELSE IF( iorder.LE.0 ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( irange.EQ.2 ) THEN
         IF( vl.GE.vu )
     $      info = -5
      ELSE IF( irange.EQ.3 .AND. ( il.LT.1 .OR. il.GT.max( 1, n ) ) )
     $          THEN
         info = -6
      ELSE IF( irange.EQ.3 .AND. ( iu.LT.min( n, il ) .OR. iu.GT.n ) )
     $          THEN
         info = -7
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DSTEBZ', -info )
         RETURN
      END IF
*
*     Initialize error flags
*
      info = 0
      ncnvrg = .false.
      toofew = .false.
*
*     Quick return if possible
*     M is zeroed first so that every early RETURN below reports
*     "no eigenvalues found" unless M is set explicitly.
*
      m = 0
      IF( n.EQ.0 )
     $   RETURN
*
*     Simplifications:
*     asking for indices 1..N is the same as asking for all of them.
*
      IF( irange.EQ.3 .AND. il.EQ.1 .AND. iu.EQ.n )
     $   irange = 1
*
*     Get machine constants
*     NB is the minimum vector length for vector bisection, or 0
*     if only scalar is to be done.
*     RTOLI = ULP*RELFAC is the relative tolerance handed to every
*     DLAEBZ call.
*
      safemn = dlamch( 'S' )
      ulp = dlamch( 'P' )
      rtoli = ulp*relfac
      nb = ilaenv( 1, 'DSTEBZ', ' ', n, -1, -1, -1 )
      IF( nb.LE.1 )
     $   nb = 0
*
*     Special Case when N=1
*     The only eigenvalue is D(1).  For RANGE='V' it is reported only
*     when VL < D(1) <= VU; otherwise it is always reported.
*
      IF( n.EQ.1 ) THEN
         nsplit = 1
         isplit( 1 ) = 1
         IF( irange.EQ.2 .AND. ( vl.GE.d( 1 ) .OR. vu.LT.d( 1 ) ) ) THEN
            m = 0
         ELSE
            w( 1 ) = d( 1 )
            iblock( 1 ) = 1
            m = 1
         END IF
         RETURN
      END IF
*
*     Compute Splitting Points
*     WORK(1:N-1) receives E(j)**2, or zero where the matrix is split
*     (E(j)**2 below |D(j)*D(j+1)|*ULP**2 + SAFEMN); WORK(N) is zero.
*     ISPLIT(k) records the last row of block k.  PIVMIN ends up as
*     SAFEMN * max( 1, largest retained E(j)**2 ).
*
      nsplit = 1
      work( n ) = zero
      pivmin = one
*
      DO 10 j = 2, n
         tmp1 = e( j-1 )**2
         IF( abs( d( j )*d( j-1 ) )*ulp**2+safemn.GT.tmp1 ) THEN
            isplit( nsplit ) = j - 1
            nsplit = nsplit + 1
            work( j-1 ) = zero
         ELSE
            work( j-1 ) = tmp1
            pivmin = max( pivmin, tmp1 )
         END IF
   10 CONTINUE
      isplit( nsplit ) = n
      pivmin = pivmin*safemn
*
*     Compute Interval and ATOLI
*
      IF( irange.EQ.3 ) THEN
*
*        RANGE='I': Compute the interval containing eigenvalues
*                   IL through IU.
*
*        Compute Gershgorin interval for entire (split) matrix
*        and use it as the initial interval
*        SQRT( WORK(j) ) is |E(j)| with split entries treated as zero.
*
         gu = d( 1 )
         gl = d( 1 )
         tmp1 = zero
*
         DO 20 j = 1, n - 1
            tmp2 = sqrt( work( j ) )
            gu = max( gu, d( j )+tmp1+tmp2 )
            gl = min( gl, d( j )-tmp1-tmp2 )
            tmp1 = tmp2
   20    CONTINUE
*
*        Widen the interval by FUDGE-scaled rounding allowances.  The
*        lower end uses 2*PIVMIN while the upper end uses PIVMIN.
*
         gu = max( gu, d( n )+tmp1 )
         gl = min( gl, d( n )-tmp1 )
         tnorm = max( abs( gl ), abs( gu ) )
         gl = gl - fudge*tnorm*ulp*n - fudge*two*pivmin
         gu = gu + fudge*tnorm*ulp*n + fudge*pivmin
*
*        Compute Iteration parameters
*        ITMAX = INT( log2( (TNORM+PIVMIN)/PIVMIN ) ) + 2.
*        ATOLI defaults to ULP*TNORM when ABSTOL is not positive.
*
         itmax = int( ( log( tnorm+pivmin )-log( pivmin ) ) /
     $           log( two ) ) + 2
         IF( abstol.LE.zero ) THEN
            atoli = ulp*tnorm
         ELSE
            atoli = abstol
         END IF
*
*        Seed two search intervals, both equal to [GL,GU]:
*        WORK(N+1:N+2) lower ends, WORK(N+3:N+4) upper ends,
*        WORK(N+5:N+6) initial trial points; IWORK(1:2) / IWORK(3:4)
*        the counts at the lower / upper ends (-1 and N+1 are outside
*        the valid range 0..N); IWORK(5:6) the target counts IL-1 and
*        IU.
*
         work( n+1 ) = gl
         work( n+2 ) = gl
         work( n+3 ) = gu
         work( n+4 ) = gu
         work( n+5 ) = gl
         work( n+6 ) = gu
         iwork( 1 ) = -1
         iwork( 2 ) = -1
         iwork( 3 ) = n + 1
         iwork( 4 ) = n + 1
         iwork( 5 ) = il - 1
         iwork( 6 ) = iu
*
*        DLAEBZ with first argument 3 -- presumably its mode that
*        searches for points with prescribed eigenvalue counts;
*        confirm against the DLAEBZ documentation.
*
         CALL dlaebz( 3, itmax, n, 2, 2, nb, atoli, rtoli, pivmin, d, e,
     $                work, iwork( 5 ), work( n+1 ), work( n+5 ), iout,
     $                iwork, w, iblock, iinfo )
*
*        Pick WL/WU, their counts NWL/NWU and the neighbouring bounds
*        WLU/WUL from the two returned intervals.  Which slot holds
*        which depends on whether IWORK(6) still equals IU.
*
         IF( iwork( 6 ).EQ.iu ) THEN
            wl = work( n+1 )
            wlu = work( n+3 )
            nwl = iwork( 1 )
            wu = work( n+4 )
            wul = work( n+2 )
            nwu = iwork( 4 )
         ELSE
            wl = work( n+2 )
            wlu = work( n+4 )
            nwl = iwork( 2 )
            wu = work( n+3 )
            wul = work( n+1 )
            nwu = iwork( 3 )
         END IF
*
*        Counts outside their valid range: give up with INFO = 4.
*        M is still 0 at this point.
*
         IF( nwl.LT.0 .OR. nwl.GE.n .OR. nwu.LT.1 .OR. nwu.GT.n ) THEN
            info = 4
            RETURN
         END IF
      ELSE
*
*        RANGE='A' or 'V' -- Set ATOLI
*        TNORM is the largest row sum |D(j)| + |E(j-1)| + |E(j)|.
*
         tnorm = max( abs( d( 1 ) )+abs( e( 1 ) ),
     $           abs( d( n ) )+abs( e( n-1 ) ) )
*
         DO 30 j = 2, n - 1
            tnorm = max( tnorm, abs( d( j ) )+abs( e( j-1 ) )+
     $              abs( e( j ) ) )
   30    CONTINUE
*
         IF( abstol.LE.zero ) THEN
            atoli = ulp*tnorm
         ELSE
            atoli = abstol
         END IF
*
*        For RANGE='A' WL and WU are only placeholders: every use of
*        them below is bypassed when IRANGE = 1.
*
         IF( irange.EQ.2 ) THEN
            wl = vl
            wu = vu
         ELSE
            wl = zero
            wu = zero
         END IF
      END IF
*
*     Find Eigenvalues -- Loop Over Blocks and recompute NWL and NWU.
*     NWL accumulates the number of eigenvalues .le. WL,
*     NWU accumulates the number of eigenvalues .le. WU
*
      m = 0
      iend = 0
      info = 0
      nwl = 0
      nwu = 0
*
      DO 70 jb = 1, nsplit
*
*        Block JB occupies rows IBEGIN..IEND and has order IN.
*
         ioff = iend
         ibegin = ioff + 1
         iend = isplit( jb )
         in = iend - ioff
*
         IF( in.EQ.1 ) THEN
*
*           Special Case -- IN=1
*           The block's eigenvalue is D(IBEGIN); it is compared with
*           WL and WU after subtracting PIVMIN.
*
            IF( irange.EQ.1 .OR. wl.GE.d( ibegin )-pivmin )
     $         nwl = nwl + 1
            IF( irange.EQ.1 .OR. wu.GE.d( ibegin )-pivmin )
     $         nwu = nwu + 1
            IF( irange.EQ.1 .OR. ( wl.LT.d( ibegin )-pivmin .AND. wu.GE.
     $          d( ibegin )-pivmin ) ) THEN
               m = m + 1
               w( m ) = d( ibegin )
               iblock( m ) = jb
            END IF
         ELSE
*
*           General Case -- IN > 1
*
*           Compute Gershgorin Interval
*           and use it as the initial interval
*
            gu = d( ibegin )
            gl = d( ibegin )
            tmp1 = zero
*
            DO 40 j = ibegin, iend - 1
               tmp2 = abs( e( j ) )
               gu = max( gu, d( j )+tmp1+tmp2 )
               gl = min( gl, d( j )-tmp1-tmp2 )
               tmp1 = tmp2
   40       CONTINUE
*
            gu = max( gu, d( iend )+tmp1 )
            gl = min( gl, d( iend )-tmp1 )
            bnorm = max( abs( gl ), abs( gu ) )
            gl = gl - fudge*bnorm*ulp*in - fudge*pivmin
            gu = gu + fudge*bnorm*ulp*in + fudge*pivmin
*
*           Compute ATOLI for the current submatrix
*
            IF( abstol.LE.zero ) THEN
               atoli = ulp*max( abs( gl ), abs( gu ) )
            ELSE
               atoli = abstol
            END IF
*
*           For RANGE='V' or 'I', clip the block interval to (WL,WU].
*           A block lying entirely below WL adds all IN eigenvalues to
*           both running counts and is skipped; a block whose clipped
*           interval is empty is skipped without changing the counts.
*
            IF( irange.GT.1 ) THEN
               IF( gu.LT.wl ) THEN
                  nwl = nwl + in
                  nwu = nwu + in
                  GO TO 70
               END IF
               gl = max( gl, wl )
               gu = min( gu, wu )
               IF( gl.GE.gu )
     $            GO TO 70
            END IF
*
*           Set Up Initial Interval
*           WORK(N+1) and WORK(N+IN+1) hold the interval ends.  After
*           this DLAEBZ call (first argument 1) the code reads
*           IWORK(1) and IWORK(IN+1) as eigenvalue counts at GL and GU
*           and IM as the number of eigenvalues to append to W.
*
            work( n+1 ) = gl
            work( n+in+1 ) = gu
            CALL dlaebz( 1, 0, in, in, 1, nb, atoli, rtoli, pivmin,
     $                   d( ibegin ), e( ibegin ), work( ibegin ),
     $                   idumma, work( n+1 ), work( n+2*in+1 ), im,
     $                   iwork, w( m+1 ), iblock( m+1 ), iinfo )
*
*           IWOFF converts a block-local eigenvalue count into a
*           position in W.
*
            nwl = nwl + iwork( 1 )
            nwu = nwu + iwork( in+1 )
            iwoff = m - iwork( 1 )
*
*           Compute Eigenvalues
*           ITMAX = INT( log2( (GU-GL+PIVMIN)/PIVMIN ) ) + 2.
*
            itmax = int( ( log( gu-gl+pivmin )-log( pivmin ) ) /
     $              log( two ) ) + 2
            CALL dlaebz( 2, itmax, in, in, 1, nb, atoli, rtoli, pivmin,
     $                   d( ibegin ), e( ibegin ), work( ibegin ),
     $                   idumma, work( n+1 ), work( n+2*in+1 ), iout,
     $                   iwork, w( m+1 ), iblock( m+1 ), iinfo )
*
*           Copy Eigenvalues Into W and IBLOCK
*           Use -JB for block number for unconverged eigenvalues.
*           Interval J contributes its midpoint for the eigenvalue
*           positions IWORK(J)+1 .. IWORK(J+IN), shifted by IWOFF.
*           The last IINFO of the IOUT intervals are treated as
*           unconverged.
*
            DO 60 j = 1, iout
               tmp1 = half*( work( j+n )+work( j+in+n ) )
*
*              Flag non-convergence.
*
               IF( j.GT.iout-iinfo ) THEN
                  ncnvrg = .true.
                  ib = -jb
               ELSE
                  ib = jb
               END IF
               DO 50 je = iwork( j ) + 1 + iwoff,
     $                 iwork( j+in ) + iwoff
                  w( je ) = tmp1
                  iblock( je ) = ib
   50          CONTINUE
   60       CONTINUE
*
            m = m + im
         END IF
   70 CONTINUE
*
*     If RANGE='I', then (WL,WU) contains eigenvalues NWL+1,...,NWU
*     If NWL+1 < IL or NWU > IU, discard extra eigenvalues.
*     IDISCL / IDISCU are the numbers of surplus eigenvalues at the
*     low / high end; negative values mean too few were found.
*
      IF( irange.EQ.3 ) THEN
         im = 0
         idiscl = il - 1 - nwl
         idiscu = nwu - iu
*
*        First pass: drop values at or below WLU (low surplus) or at
*        or above WUL (high surplus), compacting W and IBLOCK in
*        place.
*
         IF( idiscl.GT.0 .OR. idiscu.GT.0 ) THEN
            DO 80 je = 1, m
               IF( w( je ).LE.wlu .AND. idiscl.GT.0 ) THEN
                  idiscl = idiscl - 1
               ELSE IF( w( je ).GE.wul .AND. idiscu.GT.0 ) THEN
                  idiscu = idiscu - 1
               ELSE
                  im = im + 1
                  w( im ) = w( je )
                  iblock( im ) = iblock( je )
               END IF
   80       CONTINUE
            m = im
         END IF
         IF( idiscl.GT.0 .OR. idiscu.GT.0 ) THEN
*
*           Code to deal with effects of bad arithmetic:
*           Some low eigenvalues to be discarded are not in (WL,WLU],
*           or high eigenvalues to be discarded are not in (WUL,WU]
*           so just kill off the smallest IDISCL/largest IDISCU
*           eigenvalues, by simply finding the smallest/largest
*           eigenvalue(s).
*
*           (If N(w) is monotone non-decreasing, this should never
*               happen.)
*
*           An entry is marked for removal by zeroing its IBLOCK;
*           the compaction loop 130 then drops the marked entries.
*
            IF( idiscl.GT.0 ) THEN
               wkill = wu
               DO 100 jdisc = 1, idiscl
                  iw = 0
                  DO 90 je = 1, m
                     IF( iblock( je ).NE.0 .AND.
     $                   ( w( je ).LT.wkill .OR. iw.EQ.0 ) ) THEN
                        iw = je
                        wkill = w( je )
                     END IF
   90             CONTINUE
                  iblock( iw ) = 0
  100          CONTINUE
            END IF
            IF( idiscu.GT.0 ) THEN
*
               wkill = wl
               DO 120 jdisc = 1, idiscu
                  iw = 0
                  DO 110 je = 1, m
                     IF( iblock( je ).NE.0 .AND.
     $                   ( w( je ).GT.wkill .OR. iw.EQ.0 ) ) THEN
                        iw = je
                        wkill = w( je )
                     END IF
  110             CONTINUE
                  iblock( iw ) = 0
  120          CONTINUE
            END IF
            im = 0
            DO 130 je = 1, m
               IF( iblock( je ).NE.0 ) THEN
                  im = im + 1
                  w( im ) = w( je )
                  iblock( im ) = iblock( je )
               END IF
  130       CONTINUE
            m = im
         END IF
*
*        A negative surplus means fewer eigenvalues than requested
*        were located; reported through INFO (+2) below.
*
         IF( idiscl.LT.0 .OR. idiscu.LT.0 ) THEN
            toofew = .true.
         END IF
      END IF
*
*     If ORDER='B', do nothing -- the eigenvalues are already sorted
*        by block.
*     If ORDER='E', sort the eigenvalues from smallest to largest
*     (selection sort that moves IBLOCK along with W; skipped when
*     there is a single block).
*
      IF( iorder.EQ.1 .AND. nsplit.GT.1 ) THEN
         DO 150 je = 1, m - 1
            ie = 0
            tmp1 = w( je )
            DO 140 j = je + 1, m
               IF( w( j ).LT.tmp1 ) THEN
                  ie = j
                  tmp1 = w( j )
               END IF
  140       CONTINUE
*
            IF( ie.NE.0 ) THEN
               itmp1 = iblock( ie )
               w( ie ) = w( je )
               iblock( ie ) = iblock( je )
               w( je ) = tmp1
               iblock( je ) = itmp1
            END IF
  150    CONTINUE
      END IF
*
*     Final status: +1 if any bisection did not converge, +2 if too
*     few eigenvalues were found (so 3 means both).
*
      info = 0
      IF( ncnvrg )
     $   info = info + 1
      IF( toofew )
     $   info = info + 2
      RETURN
*
*     End of DSTEBZ
*

◆ dstedc()

subroutine dstedc	(	character	compz,
		integer	n,
		double precision, dimension( * )	d,
		double precision, dimension( * )	e,
		double precision, dimension( ldz, * )	z,
		integer	ldz,
		double precision, dimension( * )	work,
		integer	lwork,
		integer, dimension( * )	iwork,
		integer	liwork,
		integer	info )

DSTEDC

Download DSTEDC + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DSTEDC computes all eigenvalues and, optionally, eigenvectors of a
!> symmetric tridiagonal matrix using the divide and conquer method.
!> The eigenvectors of a full or band real symmetric matrix can also be
!> found if DSYTRD or DSPTRD or DSBTRD has been used to reduce this
!> matrix to tridiagonal form.
!>
!> This code makes very mild assumptions about floating point
!> arithmetic. It will work on machines with a guard digit in
!> add/subtract, or on those binary machines without guard digits
!> which subtract like the Cray X-MP, Cray Y-MP, Cray C-90, or Cray-2.
!> It could conceivably fail on hexadecimal or decimal machines
!> without guard digits, but we know of none.  See DLAED3 for details.
!>

Parameters

[in]	COMPZ	!> COMPZ is CHARACTER*1 !> = 'N': Compute eigenvalues only. !> = 'I': Compute eigenvectors of tridiagonal matrix also. !> = 'V': Compute eigenvectors of original dense symmetric !> matrix also. On entry, Z contains the orthogonal !> matrix used to reduce the original matrix to !> tridiagonal form. !>
[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in,out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> On entry, the diagonal elements of the tridiagonal matrix. !> On exit, if INFO = 0, the eigenvalues in ascending order. !>
[in,out]	E	!> E is DOUBLE PRECISION array, dimension (N-1) !> On entry, the subdiagonal elements of the tridiagonal matrix. !> On exit, E has been destroyed. !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, dimension (LDZ,N) !> On entry, if COMPZ = 'V', then Z contains the orthogonal !> matrix used in the reduction to tridiagonal form. !> On exit, if INFO = 0, then if COMPZ = 'V', Z contains the !> orthonormal eigenvectors of the original symmetric matrix, !> and if COMPZ = 'I', Z contains the orthonormal eigenvectors !> of the symmetric tridiagonal matrix. !> If COMPZ = 'N', then Z is not referenced. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. LDZ >= 1. !> If eigenvectors are desired, then LDZ >= max(1,N). !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If COMPZ = 'N' or N <= 1 then LWORK must be at least 1. !> If COMPZ = 'V' and N > 1 then LWORK must be at least !> ( 1 + 3*N + 2*N*lg N + 4*N**2 ), !> where lg( N ) = smallest integer k such !> that 2**k >= N. !> If COMPZ = 'I' and N > 1 then LWORK must be at least !> ( 1 + 4*N + N**2 ). !> Note that for COMPZ = 'I' or 'V', then if N is less than or !> equal to the minimum divide size, usually 25, then LWORK need !> only be max(1,2*(N-1)). !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (MAX(1,LIWORK)) !> On exit, if INFO = 0, IWORK(1) returns the optimal LIWORK. !>
[in]	LIWORK	!> LIWORK is INTEGER !> The dimension of the array IWORK. !> If COMPZ = 'N' or N <= 1 then LIWORK must be at least 1. !> If COMPZ = 'V' and N > 1 then LIWORK must be at least !> ( 6 + 6N + 5Nlg N ). !> If COMPZ = 'I' and N > 1 then LIWORK must be at least !> ( 3 + 5N ). !> Note that for COMPZ = 'I' or 'V', then if N is less than or !> equal to the minimum divide size, usually 25, then LIWORK !> need only be 1. !> !> If LIWORK = -1, then a workspace query is assumed; the !> routine only calculates the optimal size of the IWORK array, !> returns this value as the first entry of the IWORK array, and !> no error message related to LIWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: The algorithm failed to compute an eigenvalue while !> working on the submatrix lying in rows and columns !> INFO/(N+1) through mod(INFO,N+1). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA
Modified by Francoise Tisseur, University of Tennessee

Definition at line 186 of file dstedc.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DSTEDC.  Flow of the code below:
*       1. decode COMPZ, validate N and LDZ, compute the minimum
*          workspace sizes and answer workspace queries;
*       2. COMPZ='N': hand the whole problem to DSTERF;
*       3. N <= SMLSIZ: hand the whole problem to DSTEQR;
*       4. otherwise split the matrix at negligible off-diagonals and
*          solve each block with DLAED0 (large blocks) or DSTEQR
*          (small blocks), updating Z;
*       5. sort the eigenvalues ascending, swapping columns of Z;
*       6. store LWMIN / LIWMIN in WORK(1) / IWORK(1).
*
*     .. Scalar Arguments ..
      CHARACTER          COMPZ
      INTEGER            INFO, LDZ, LIWORK, LWORK, N
*     ..
*     .. Array Arguments ..
      INTEGER            IWORK( * )
      DOUBLE PRECISION   D( * ), E( * ), WORK( * ), Z( LDZ, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE, TWO
      parameter( zero = 0.0d0, one = 1.0d0, two = 2.0d0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            LQUERY
      INTEGER            FINISH, I, ICOMPZ, II, J, K, LGN, LIWMIN,
     $                   LWMIN, M, SMLSIZ, START, STOREZ, STRTRW
      DOUBLE PRECISION   EPS, ORGNRM, P, TINY
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      DOUBLE PRECISION   DLAMCH, DLANST
      EXTERNAL           lsame, ilaenv, dlamch, dlanst
*     ..
*     .. External Subroutines ..
      EXTERNAL           dgemm, dlacpy, dlaed0, dlascl, dlaset, dlasrt,
     $                   dsteqr, dsterf, dswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, dble, int, log, max, mod, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*     A value of -1 in either LWORK or LIWORK makes this call a
*     workspace query.
*
      info = 0
      lquery = ( lwork.EQ.-1 .OR. liwork.EQ.-1 )
*
*     ICOMPZ: 0 = 'N', 1 = 'V', 2 = 'I', -1 = unrecognised.
*
      IF( lsame( compz, 'N' ) ) THEN
         icompz = 0
      ELSE IF( lsame( compz, 'V' ) ) THEN
         icompz = 1
      ELSE IF( lsame( compz, 'I' ) ) THEN
         icompz = 2
      ELSE
         icompz = -1
      END IF
      IF( icompz.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ( ldz.LT.1 ) .OR.
     $         ( icompz.GT.0 .AND. ldz.LT.max( 1, n ) ) ) THEN
         info = -6
      END IF
*
      IF( info.EQ.0 ) THEN
*
*        Compute the workspace requirements
*        SMLSIZ is the block order at or below which DSTEQR is used
*        instead of divide and conquer (see the tests on SMLSIZ
*        further down).
*
         smlsiz = ilaenv( 9, 'DSTEDC', ' ', 0, 0, 0, 0 )
         IF( n.LE.1 .OR. icompz.EQ.0 ) THEN
            liwmin = 1
            lwmin = 1
         ELSE IF( n.LE.smlsiz ) THEN
            liwmin = 1
            lwmin = 2*( n - 1 )
         ELSE
*
*           LGN is raised until 2**LGN >= N.  The correction is
*           applied twice -- presumably to absorb rounding in the
*           floating-point LOG ratio; confirm.
*
            lgn = int( log( dble( n ) )/log( two ) )
            IF( 2**lgn.LT.n )
     $         lgn = lgn + 1
            IF( 2**lgn.LT.n )
     $         lgn = lgn + 1
            IF( icompz.EQ.1 ) THEN
               lwmin = 1 + 3*n + 2*n*lgn + 4*n**2
               liwmin = 6 + 6*n + 5*n*lgn
            ELSE IF( icompz.EQ.2 ) THEN
               lwmin = 1 + 4*n + n**2
               liwmin = 3 + 5*n
            END IF
         END IF
         work( 1 ) = lwmin
         iwork( 1 ) = liwmin
*
*        Too-small workspaces are errors only when this is not a
*        workspace query.
*
         IF( lwork.LT.lwmin .AND. .NOT. lquery ) THEN
            info = -8
         ELSE IF( liwork.LT.liwmin .AND. .NOT. lquery ) THEN
            info = -10
         END IF
      END IF
*
*     Report an argument error, or return right after a workspace
*     query (WORK(1) and IWORK(1) were set above).
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DSTEDC', -info )
         RETURN
      ELSE IF (lquery) THEN
         RETURN
      END IF
*
*     Quick return if possible
*     For N = 1, D(1) is left untouched and Z(1,1) is set to one
*     whenever eigenvectors are requested.
*
      IF( n.EQ.0 )
     $   RETURN
      IF( n.EQ.1 ) THEN
         IF( icompz.NE.0 )
     $      z( 1, 1 ) = one
         RETURN
      END IF
*
*     If the following conditional clause is removed, then the routine
*     will use the Divide and Conquer routine to compute only the
*     eigenvalues, which requires (3N + 3N**2) real workspace and
*     (2 + 5N + 2N lg(N)) integer workspace.
*     Since on many architectures DSTERF is much faster than any other
*     algorithm for finding eigenvalues only, it is used here
*     as the default. If the conditional clause is removed, then
*     information on the size of workspace needs to be changed.
*
*     If COMPZ = 'N', use DSTERF to compute the eigenvalues.
*
      IF( icompz.EQ.0 ) THEN
         CALL dsterf( n, d, e, info )
         GO TO 50
      END IF
*
*     If N is smaller than the minimum divide size (SMLSIZ+1), then
*     solve the problem with another solver.
*
      IF( n.LE.smlsiz ) THEN
*
         CALL dsteqr( compz, n, d, e, z, ldz, work, info )
*
      ELSE
*
*        If COMPZ = 'V', the Z matrix must be stored elsewhere for later
*        use.
*        STOREZ is the offset into WORK used for that copy: past the
*        first N*N entries for COMPZ='V', otherwise 1.
*
         IF( icompz.EQ.1 ) THEN
            storez = 1 + n*n
         ELSE
            storez = 1
         END IF
*
*        COMPZ = 'I': start from Z = identity.
*
         IF( icompz.EQ.2 ) THEN
            CALL dlaset( 'Full', n, n, zero, one, z, ldz )
         END IF
*
*        Scale.
*        Only the zero test on the norm is performed here; when the
*        norm is zero the routine jumps straight to the exit code.
*
         orgnrm = dlanst( 'M', n, d, e )
         IF( orgnrm.EQ.zero )
     $      GO TO 50
*
         eps = dlamch( 'Epsilon' )
*
         start = 1
*
*        while ( START <= N )
*
   10    CONTINUE
         IF( start.LE.n ) THEN
*
*           Let FINISH be the position of the next subdiagonal entry
*           such that E( FINISH ) <= TINY or FINISH = N if no such
*           subdiagonal exists.  The matrix identified by the elements
*           between START and FINISH constitutes an independent
*           sub-problem.
*           TINY = EPS * sqrt(|D(FINISH)|) * sqrt(|D(FINISH+1)|).
*
            finish = start
   20       CONTINUE
            IF( finish.LT.n ) THEN
               tiny = eps*sqrt( abs( d( finish ) ) )*
     $                    sqrt( abs( d( finish+1 ) ) )
               IF( abs( e( finish ) ).GT.tiny ) THEN
                  finish = finish + 1
                  GO TO 20
               END IF
            END IF
*
*           (Sub) Problem determined.  Compute its size and solve it.
*           A 1-by-1 block is skipped without further work.
*
            m = finish - start + 1
            IF( m.EQ.1 ) THEN
               start = finish + 1
               GO TO 10
            END IF
            IF( m.GT.smlsiz ) THEN
*
*              Scale.
*              D(START:FINISH) and the M-1 off-diagonals are rescaled
*              by DLASCL from ORGNRM to ONE before DLAED0 is called.
*
               orgnrm = dlanst( 'M', m, d( start ), e( start ) )
               CALL dlascl( 'G', 0, 0, orgnrm, one, m, 1, d( start ), m,
     $                      info )
               CALL dlascl( 'G', 0, 0, orgnrm, one, m-1, 1, e( start ),
     $                      m-1, info )
*
*              COMPZ='V' passes all rows of the block's columns of Z
*              (from row 1); COMPZ='I' passes only the diagonal block
*              starting at row START.
*
               IF( icompz.EQ.1 ) THEN
                  strtrw = 1
               ELSE
                  strtrw = start
               END IF
               CALL dlaed0( icompz, n, m, d( start ), e( start ),
     $                      z( strtrw, start ), ldz, work( 1 ), n,
     $                      work( storez ), iwork, info )
*
*              A nonzero INFO from DLAED0 is decoded with modulus M+1,
*              shifted by START-1 and re-encoded with modulus N+1,
*              i.e. in the form row*(N+1) + column used by this
*              routine's INFO.
*
               IF( info.NE.0 ) THEN
                  info = ( info / ( m+1 )+start-1 )*( n+1 ) +
     $                   mod( info, ( m+1 ) ) + start - 1
                  GO TO 50
               END IF
*
*              Scale back.
*              Only D is rescaled; E is not restored.
*
               CALL dlascl( 'G', 0, 0, one, orgnrm, m, 1, d( start ), m,
     $                      info )
*
            ELSE
               IF( icompz.EQ.1 ) THEN
*
*                 Since QR won't update a Z matrix which is larger than
*                 the length of D, we must solve the sub-problem in a
*                 workspace and then multiply back into Z.
*                 WORK(1:M*M) receives the block's eigenvectors (leading
*                 dimension M) and WORK(M*M+1) onward is DSTEQR's
*                 scratch.  The N-by-M panel Z(:,START:FINISH) is
*                 copied to WORK(STOREZ) and then overwritten with
*                 panel * eigenvectors.
*
                  CALL dsteqr( 'I', m, d( start ), e( start ), work, m,
     $                         work( m*m+1 ), info )
                  CALL dlacpy( 'A', n, m, z( 1, start ), ldz,
     $                         work( storez ), n )
                  CALL dgemm( 'N', 'N', n, m, m, one,
     $                        work( storez ), n, work, m, zero,
     $                        z( 1, start ), ldz )
               ELSE IF( icompz.EQ.2 ) THEN
                  CALL dsteqr( 'I', m, d( start ), e( start ),
     $                         z( start, start ), ldz, work, info )
               ELSE
*
*                 ICOMPZ = 0 cannot reach this point while the DSTERF
*                 shortcut above is in place.
*
                  CALL dsterf( m, d( start ), e( start ), info )
               END IF
*
*              Failure inside this block: encode its first and last
*              indices as START*(N+1) + FINISH.
*
               IF( info.NE.0 ) THEN
                  info = start*( n+1 ) + finish
                  GO TO 50
               END IF
            END IF
*
            start = finish + 1
            GO TO 10
         END IF
*
*        endwhile
*
*        The ICOMPZ = 0 branch below is likewise reachable only if
*        the DSTERF shortcut above is removed.
*
         IF( icompz.EQ.0 ) THEN
*
*          Use Quick Sort
*
           CALL dlasrt( 'I', n, d, info )
*
         ELSE
*
*          Use Selection Sort to minimize swaps of eigenvectors
*          For each position I the smallest remaining eigenvalue is
*          located at K; D(I) and D(K) are exchanged together with
*          columns I and K of Z (all N rows).
*
           DO 40 ii = 2, n
              i = ii - 1
              k = i
              p = d( i )
              DO 30 j = ii, n
                 IF( d( j ).LT.p ) THEN
                    k = j
                    p = d( j )
                 END IF
   30         CONTINUE
              IF( k.NE.i ) THEN
                 d( k ) = d( i )
                 d( i ) = p
                 CALL dswap( n, z( 1, i ), 1, z( 1, k ), 1 )
              END IF
   40      CONTINUE
         END IF
      END IF
*
*     Common exit: WORK(1) and IWORK(1) are (re)set to the minimum
*     workspace sizes, since WORK may have been used as scratch.
*
   50 CONTINUE
      work( 1 ) = lwmin
      iwork( 1 ) = liwmin
*
      RETURN
*
*     End of DSTEDC
*

◆ dsteqr()

subroutine dsteqr	(	character	compz,
		integer	n,
		double precision, dimension( * )	d,
		double precision, dimension( * )	e,
		double precision, dimension( ldz, * )	z,
		integer	ldz,
		double precision, dimension( * )	work,
		integer	info )

DSTEQR

Download DSTEQR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DSTEQR computes all eigenvalues and, optionally, eigenvectors of a
!> symmetric tridiagonal matrix using the implicit QL or QR method.
!> The eigenvectors of a full or band symmetric matrix can also be found
!> if DSYTRD or DSPTRD or DSBTRD has been used to reduce this matrix to
!> tridiagonal form.
!>

Parameters

[in]	COMPZ	!> COMPZ is CHARACTER*1 !> = 'N': Compute eigenvalues only. !> = 'V': Compute eigenvalues and eigenvectors of the original !> symmetric matrix. On entry, Z must contain the !> orthogonal matrix used to reduce the original matrix !> to tridiagonal form. !> = 'I': Compute eigenvalues and eigenvectors of the !> tridiagonal matrix. Z is initialized to the identity !> matrix. !>
[in]	N	!> N is INTEGER !> The order of the matrix. N >= 0. !>
[in,out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> On entry, the diagonal elements of the tridiagonal matrix. !> On exit, if INFO = 0, the eigenvalues in ascending order. !>
[in,out]	E	!> E is DOUBLE PRECISION array, dimension (N-1) !> On entry, the (n-1) subdiagonal elements of the tridiagonal !> matrix. !> On exit, E has been destroyed. !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, dimension (LDZ, N) !> On entry, if COMPZ = 'V', then Z contains the orthogonal !> matrix used in the reduction to tridiagonal form. !> On exit, if INFO = 0, then if COMPZ = 'V', Z contains the !> orthonormal eigenvectors of the original symmetric matrix, !> and if COMPZ = 'I', Z contains the orthonormal eigenvectors !> of the symmetric tridiagonal matrix. !> If COMPZ = 'N', then Z is not referenced. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. LDZ >= 1, and if !> eigenvectors are desired, then LDZ >= max(1,N). !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (max(1,2*N-2)) !> If COMPZ = 'N', then WORK is not referenced. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: the algorithm has failed to find all the eigenvalues in !> a total of 30*N iterations; if INFO = i, then i !> elements of E have not converged to zero; on exit, D !> and E contain the elements of a symmetric tridiagonal !> matrix which is orthogonally similar to the original !> matrix. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 130 of file dsteqr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DSTEQR: QL or QR iteration on the symmetric tridiagonal
*     matrix held in D (diagonal) and E (off-diagonal).
*     COMPZ is decoded into ICOMPZ below:
*        'N' -> 0  Z is not touched;
*        'V' -> 1  rotations are applied to the Z passed in;
*        'I' -> 2  Z is first reset to the identity, then updated.
*     WORK stores the saved rotations: cosines in WORK(1:N-1) and
*     sines in WORK(N:2*N-2).  It is only written when ICOMPZ > 0.
*
*     .. Scalar Arguments ..
      CHARACTER          COMPZ
      INTEGER            INFO, LDZ, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   D( * ), E( * ), WORK( * ), Z( LDZ, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE, TWO, THREE
      parameter( zero = 0.0d0, one = 1.0d0, two = 2.0d0,
     $                   three = 3.0d0 )
      INTEGER            MAXIT
      parameter( maxit = 30 )
*     ..
*     .. Local Scalars ..
      INTEGER            I, ICOMPZ, II, ISCALE, J, JTOT, K, L, L1, LEND,
     $                   LENDM1, LENDP1, LENDSV, LM1, LSV, M, MM, MM1,
     $                   NM1, NMAXIT
      DOUBLE PRECISION   ANORM, B, C, EPS, EPS2, F, G, P, R, RT1, RT2,
     $                   S, SAFMAX, SAFMIN, SSFMAX, SSFMIN, TST
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      DOUBLE PRECISION   DLAMCH, DLANST, DLAPY2
      EXTERNAL           lsame, dlamch, dlanst, dlapy2
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlae2, dlaev2, dlartg, dlascl, dlaset, dlasr,
     $                   dlasrt, dswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, sign, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
      IF( lsame( compz, 'N' ) ) THEN
         icompz = 0
      ELSE IF( lsame( compz, 'V' ) ) THEN
         icompz = 1
      ELSE IF( lsame( compz, 'I' ) ) THEN
         icompz = 2
      ELSE
         icompz = -1
      END IF
*
*     INFO is the negated position of the first bad argument:
*     COMPZ is 1, N is 2, LDZ is 6.  LDZ must be at least 1, and at
*     least max(1,N) whenever Z is going to be referenced.
*
      IF( icompz.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ( ldz.LT.1 ) .OR. ( icompz.GT.0 .AND. ldz.LT.max( 1,
     $         n ) ) ) THEN
         info = -6
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DSTEQR', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     N = 1: D(1) is left unchanged; only COMPZ = 'I' writes Z.
*
      IF( n.EQ.1 ) THEN
         IF( icompz.EQ.2 )
     $      z( 1, 1 ) = one
         RETURN
      END IF
*
*     Determine the unit roundoff and over/underflow thresholds.
*
      eps = dlamch( 'E' )
      eps2 = eps**2
      safmin = dlamch( 'S' )
      safmax = one / safmin
      ssfmax = sqrt( safmax ) / three
      ssfmin = sqrt( safmin ) / eps2
*
*     Compute the eigenvalues and eigenvectors of the tridiagonal
*     matrix.
*
      IF( icompz.EQ.2 )
     $   CALL dlaset( 'Full', n, n, zero, one, z, ldz )
*
*     JTOT counts iterations over all blocks together; NMAXIT is the
*     shared budget of N*MAXIT iterations.
*
      nmaxit = n*maxit
      jtot = 0
*
*     Determine where the matrix splits and choose QL or QR iteration
*     for each block, according to whether top or bottom diagonal
*     element is smaller.
*
      l1 = 1
      nm1 = n - 1
*
*     Label 10: start of the next unreduced block, beginning at row L1.
*     Once L1 passes N every block has been handled and control goes
*     to the sorting step at label 160.
*
   10 CONTINUE
      IF( l1.GT.n )
     $   GO TO 160
      IF( l1.GT.1 )
     $   e( l1-1 ) = zero
      IF( l1.LE.nm1 ) THEN
*
*        The block ends at the first M where E(M) is exactly zero or
*        is negligible relative to sqrt(|D(M)|)*sqrt(|D(M+1)|)*EPS;
*        in the latter case E(M) is set to zero.
*
         DO 20 m = l1, nm1
            tst = abs( e( m ) )
            IF( tst.EQ.zero )
     $         GO TO 30
            IF( tst.LE.( sqrt( abs( d( m ) ) )*sqrt( abs( d( m+
     $          1 ) ) ) )*eps ) THEN
               e( m ) = zero
               GO TO 30
            END IF
   20    CONTINUE
      END IF
      m = n
*
*     Label 30: the current block is rows/columns L1..M.  LSV and
*     LENDSV keep its bounds for the unscaling step, because L and
*     LEND are modified during the iteration.  A 1-by-1 block needs
*     no work.
*
   30 CONTINUE
      l = l1
      lsv = l
      lend = m
      lendsv = lend
      l1 = m + 1
      IF( lend.EQ.l )
     $   GO TO 10
*
*     Scale submatrix in rows and columns L to LEND
*
*     ISCALE records which rescaling was applied (0 = none) so that
*     label 140 can undo it.
*
      anorm = dlanst( 'M', lend-l+1, d( l ), e( l ) )
      iscale = 0
      IF( anorm.EQ.zero )
     $   GO TO 10
      IF( anorm.GT.ssfmax ) THEN
         iscale = 1
         CALL dlascl( 'G', 0, 0, anorm, ssfmax, lend-l+1, 1, d( l ), n,
     $                info )
         CALL dlascl( 'G', 0, 0, anorm, ssfmax, lend-l, 1, e( l ), n,
     $                info )
      ELSE IF( anorm.LT.ssfmin ) THEN
         iscale = 2
         CALL dlascl( 'G', 0, 0, anorm, ssfmin, lend-l+1, 1, d( l ), n,
     $                info )
         CALL dlascl( 'G', 0, 0, anorm, ssfmin, lend-l, 1, e( l ), n,
     $                info )
      END IF
*
*     Choose between QL and QR iteration
*
*     Swapping L and LEND makes LEND < L, which selects the QR branch
*     of the IF below.
*
      IF( abs( d( lend ) ).LT.abs( d( l ) ) ) THEN
         lend = lsv
         l = lendsv
      END IF
*
      IF( lend.GT.l ) THEN
*
*        QL Iteration
*
*        Look for small subdiagonal element.
*
   40    CONTINUE
         IF( l.NE.lend ) THEN
            lendm1 = lend - 1
            DO 50 m = l, lendm1
               tst = abs( e( m ) )**2
               IF( tst.LE.( eps2*abs( d( m ) ) )*abs( d( m+1 ) )+
     $             safmin )GO TO 60
   50       CONTINUE
         END IF
*
         m = lend
*
*        Label 60: rows L..M form the sub-block being worked on.
*        M = L means D(L) has converged (label 80).
*
   60    CONTINUE
         IF( m.LT.lend )
     $      e( m ) = zero
         p = d( l )
         IF( m.EQ.l )
     $      GO TO 80
*
*        If remaining matrix is 2-by-2, use DLAE2 or DLAEV2
*        to compute its eigensystem.
*
         IF( m.EQ.l+1 ) THEN
            IF( icompz.GT.0 ) THEN
               CALL dlaev2( d( l ), e( l ), d( l+1 ), rt1, rt2, c, s )
               work( l ) = c
               work( n-1+l ) = s
               CALL dlasr( 'R', 'V', 'B', n, 2, work( l ),
     $                     work( n-1+l ), z( 1, l ), ldz )
            ELSE
               CALL dlae2( d( l ), e( l ), d( l+1 ), rt1, rt2 )
            END IF
            d( l ) = rt1
            d( l+1 ) = rt2
            e( l ) = zero
            l = l + 2
            IF( l.LE.lend )
     $         GO TO 40
            GO TO 140
         END IF
*
*        Give up on this block once the iteration budget is spent.
*
         IF( jtot.EQ.nmaxit )
     $      GO TO 140
         jtot = jtot + 1
*
*        Form shift.
*
         g = ( d( l+1 )-p ) / ( two*e( l ) )
         r = dlapy2( g, one )
         g = d( m ) - p + ( e( l ) / ( g+sign( r, g ) ) )
*
         s = one
         c = one
         p = zero
*
*        Inner loop
*
         mm1 = m - 1
         DO 70 i = mm1, l, -1
            f = s*e( i )
            b = c*e( i )
            CALL dlartg( g, f, c, s, r )
            IF( i.NE.m-1 )
     $         e( i+1 ) = r
            g = d( i+1 ) - p
            r = ( d( i )-g )*s + two*c*b
            p = s*r
            d( i+1 ) = g + p
            g = c*r - b
*
*           If eigenvectors are desired, then save rotations.
*
            IF( icompz.GT.0 ) THEN
               work( i ) = c
               work( n-1+i ) = -s
            END IF
*
   70    CONTINUE
*
*        If eigenvectors are desired, then apply saved rotations.
*
         IF( icompz.GT.0 ) THEN
            mm = m - l + 1
            CALL dlasr( 'R', 'V', 'B', n, mm, work( l ), work( n-1+l ),
     $                  z( 1, l ), ldz )
         END IF
*
         d( l ) = d( l ) - p
         e( l ) = g
         GO TO 40
*
*        Eigenvalue found.
*
   80    CONTINUE
         d( l ) = p
*
         l = l + 1
         IF( l.LE.lend )
     $      GO TO 40
         GO TO 140
*
      ELSE
*
*        QR Iteration
*
*        Look for small superdiagonal element.
*
   90    CONTINUE
         IF( l.NE.lend ) THEN
            lendp1 = lend + 1
            DO 100 m = l, lendp1, -1
               tst = abs( e( m-1 ) )**2
               IF( tst.LE.( eps2*abs( d( m ) ) )*abs( d( m-1 ) )+
     $             safmin )GO TO 110
  100       CONTINUE
         END IF
*
         m = lend
*
*        Label 110: rows M..L form the sub-block being worked on.
*        M = L means D(L) has converged (label 130).
*
  110    CONTINUE
         IF( m.GT.lend )
     $      e( m-1 ) = zero
         p = d( l )
         IF( m.EQ.l )
     $      GO TO 130
*
*        If remaining matrix is 2-by-2, use DLAE2 or DLAEV2
*        to compute its eigensystem.
*
         IF( m.EQ.l-1 ) THEN
            IF( icompz.GT.0 ) THEN
               CALL dlaev2( d( l-1 ), e( l-1 ), d( l ), rt1, rt2, c, s )
               work( m ) = c
               work( n-1+m ) = s
               CALL dlasr( 'R', 'V', 'F', n, 2, work( m ),
     $                     work( n-1+m ), z( 1, l-1 ), ldz )
            ELSE
               CALL dlae2( d( l-1 ), e( l-1 ), d( l ), rt1, rt2 )
            END IF
            d( l-1 ) = rt1
            d( l ) = rt2
            e( l-1 ) = zero
            l = l - 2
            IF( l.GE.lend )
     $         GO TO 90
            GO TO 140
         END IF
*
*        Give up on this block once the iteration budget is spent.
*
         IF( jtot.EQ.nmaxit )
     $      GO TO 140
         jtot = jtot + 1
*
*        Form shift.
*
         g = ( d( l-1 )-p ) / ( two*e( l-1 ) )
         r = dlapy2( g, one )
         g = d( m ) - p + ( e( l-1 ) / ( g+sign( r, g ) ) )
*
         s = one
         c = one
         p = zero
*
*        Inner loop
*
         lm1 = l - 1
         DO 120 i = m, lm1
            f = s*e( i )
            b = c*e( i )
            CALL dlartg( g, f, c, s, r )
            IF( i.NE.m )
     $         e( i-1 ) = r
            g = d( i ) - p
            r = ( d( i+1 )-g )*s + two*c*b
            p = s*r
            d( i ) = g + p
            g = c*r - b
*
*           If eigenvectors are desired, then save rotations.
*
            IF( icompz.GT.0 ) THEN
               work( i ) = c
               work( n-1+i ) = s
            END IF
*
  120    CONTINUE
*
*        If eigenvectors are desired, then apply saved rotations.
*
         IF( icompz.GT.0 ) THEN
            mm = l - m + 1
            CALL dlasr( 'R', 'V', 'F', n, mm, work( m ), work( n-1+m ),
     $                  z( 1, m ), ldz )
         END IF
*
         d( l ) = d( l ) - p
         e( lm1 ) = g
         GO TO 90
*
*        Eigenvalue found.
*
  130    CONTINUE
         d( l ) = p
*
         l = l - 1
         IF( l.GE.lend )
     $      GO TO 90
         GO TO 140
*
      END IF
*
*     Undo scaling if necessary
*
*     The saved bounds LSV..LENDSV are used here because L and LEND
*     were changed by the iteration above.
*
  140 CONTINUE
      IF( iscale.EQ.1 ) THEN
         CALL dlascl( 'G', 0, 0, ssfmax, anorm, lendsv-lsv+1, 1,
     $                d( lsv ), n, info )
         CALL dlascl( 'G', 0, 0, ssfmax, anorm, lendsv-lsv, 1, e( lsv ),
     $                n, info )
      ELSE IF( iscale.EQ.2 ) THEN
         CALL dlascl( 'G', 0, 0, ssfmin, anorm, lendsv-lsv+1, 1,
     $                d( lsv ), n, info )
         CALL dlascl( 'G', 0, 0, ssfmin, anorm, lendsv-lsv, 1, e( lsv ),
     $                n, info )
      END IF
*
*     Check for no convergence to an eigenvalue after a total
*     of N*MAXIT iterations.
*
*     With budget left, move on to the next block.  Otherwise INFO is
*     incremented once per nonzero E(I) and the routine returns
*     through label 190, skipping the sort at label 160.
*
      IF( jtot.LT.nmaxit )
     $   GO TO 10
      DO 150 i = 1, n - 1
         IF( e( i ).NE.zero )
     $      info = info + 1
  150 CONTINUE
      GO TO 190
*
*     Order eigenvalues and eigenvectors.
*
  160 CONTINUE
      IF( icompz.EQ.0 ) THEN
*
*        Use Quick Sort
*
         CALL dlasrt( 'I', n, d, info )
*
      ELSE
*
*        Use Selection Sort to minimize swaps of eigenvectors
*
*        For each position I the smallest remaining D(J) is located
*        at K; D(I) and D(K) are exchanged together with columns I
*        and K of Z.
*
         DO 180 ii = 2, n
            i = ii - 1
            k = i
            p = d( i )
            DO 170 j = ii, n
               IF( d( j ).LT.p ) THEN
                  k = j
                  p = d( j )
               END IF
  170       CONTINUE
            IF( k.NE.i ) THEN
               d( k ) = d( i )
               d( i ) = p
               CALL dswap( n, z( 1, i ), 1, z( 1, k ), 1 )
            END IF
  180    CONTINUE
      END IF
*
  190 CONTINUE
      RETURN
*
*     End of DSTEQR
*

◆ dsterf()

subroutine dsterf	(	integer	n,
		double precision, dimension( * )	d,
		double precision, dimension( * )	e,
		integer	info )

DSTERF

Download DSTERF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DSTERF computes all eigenvalues of a symmetric tridiagonal matrix
!> using the Pal-Walker-Kahan variant of the QL or QR algorithm.
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the matrix. N >= 0. !>
[in,out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> On entry, the n diagonal elements of the tridiagonal matrix. !> On exit, if INFO = 0, the eigenvalues in ascending order. !>
[in,out]	E	!> E is DOUBLE PRECISION array, dimension (N-1) !> On entry, the (n-1) subdiagonal elements of the tridiagonal !> matrix. !> On exit, E has been destroyed. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: the algorithm failed to find all of the eigenvalues in !> a total of 30*N iterations; if INFO = i, then i !> elements of E have not converged to zero. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 85 of file dsterf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DSTERF: eigenvalues only of the symmetric tridiagonal
*     matrix held in D (diagonal) and E (off-diagonal).  The matrix is
*     split into unreduced blocks; each block is optionally rescaled,
*     its off-diagonal entries are squared in place, and a QL or QR
*     sweep is run on it.  On success D is sorted into increasing
*     order; E is overwritten.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   D( * ), E( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE, TWO, THREE
      parameter( zero = 0.0d0, one = 1.0d0, two = 2.0d0,
     $                   three = 3.0d0 )
      INTEGER            MAXIT
      parameter( maxit = 30 )
*     ..
*     .. Local Scalars ..
      INTEGER            I, ISCALE, JTOT, L, L1, LEND, LENDSV, LSV, M,
     $                   NMAXIT
      DOUBLE PRECISION   ALPHA, ANORM, BB, C, EPS, EPS2, GAMMA, OLDC,
     $                   OLDGAM, P, R, RT1, RT2, RTE, S, SAFMAX, SAFMIN,
     $                   SIGMA, SSFMAX, SSFMIN, RMAX
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH, DLANST, DLAPY2
      EXTERNAL           dlamch, dlanst, dlapy2
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlae2, dlascl, dlasrt, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, sign, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
*     Quick return if possible
*
*     N is argument 1, hence INFO = -1 when it is negative.
*     N = 0 and N = 1 return immediately with D unchanged.
*
      IF( n.LT.0 ) THEN
         info = -1
         CALL xerbla( 'DSTERF', -info )
         RETURN
      END IF
      IF( n.LE.1 )
     $   RETURN
*
*     Determine the unit roundoff for this environment.
*
*     NOTE(review): RMAX is assigned here but is not referenced
*     anywhere else in this routine.
*
      eps = dlamch( 'E' )
      eps2 = eps**2
      safmin = dlamch( 'S' )
      safmax = one / safmin
      ssfmax = sqrt( safmax ) / three
      ssfmin = sqrt( safmin ) / eps2
      rmax = dlamch( 'O' )
*
*     Compute the eigenvalues of the tridiagonal matrix.
*
*     JTOT counts iterations over all blocks together; NMAXIT is the
*     shared budget of N*MAXIT iterations.
*
      nmaxit = n*maxit
      sigma = zero
      jtot = 0
*
*     Determine where the matrix splits and choose QL or QR iteration
*     for each block, according to whether top or bottom diagonal
*     element is smaller.
*
      l1 = 1
*
*     Label 10: start of the next unreduced block, beginning at row L1.
*     Once L1 passes N control goes to the sort at label 170.
*
   10 CONTINUE
      IF( l1.GT.n )
     $   GO TO 170
      IF( l1.GT.1 )
     $   e( l1-1 ) = zero
*
*     The block ends at the first M where |E(M)| is negligible
*     relative to sqrt(|D(M)|)*sqrt(|D(M+1)|)*EPS; that E(M) is
*     set to zero.
*
      DO 20 m = l1, n - 1
         IF( abs( e( m ) ).LE.( sqrt( abs( d( m ) ) )*sqrt( abs( d( m+
     $       1 ) ) ) )*eps ) THEN
            e( m ) = zero
            GO TO 30
         END IF
   20 CONTINUE
      m = n
*
*     Label 30: the current block is rows/columns L1..M.  LSV and
*     LENDSV keep its bounds for the unscaling step, because L and
*     LEND are modified during the iteration.  A 1-by-1 block needs
*     no work.
*
   30 CONTINUE
      l = l1
      lsv = l
      lend = m
      lendsv = lend
      l1 = m + 1
      IF( lend.EQ.l )
     $   GO TO 10
*
*     Scale submatrix in rows and columns L to LEND
*
*     ISCALE records which rescaling was applied (0 = none) so that
*     label 150 can undo it.
*
      anorm = dlanst( 'M', lend-l+1, d( l ), e( l ) )
      iscale = 0
      IF( anorm.EQ.zero )
     $   GO TO 10
      IF( (anorm.GT.ssfmax) ) THEN
         iscale = 1
         CALL dlascl( 'G', 0, 0, anorm, ssfmax, lend-l+1, 1, d( l ), n,
     $                info )
         CALL dlascl( 'G', 0, 0, anorm, ssfmax, lend-l, 1, e( l ), n,
     $                info )
      ELSE IF( anorm.LT.ssfmin ) THEN
         iscale = 2
         CALL dlascl( 'G', 0, 0, anorm, ssfmin, lend-l+1, 1, d( l ), n,
     $                info )
         CALL dlascl( 'G', 0, 0, anorm, ssfmin, lend-l, 1, e( l ), n,
     $                info )
      END IF
*
*     From here on E(L:LEND-1) holds the SQUARES of the off-diagonal
*     entries.  That is why the deflation tests below compare against
*     EPS2 and why SQRT is taken whenever the entry itself is needed.
*
      DO 40 i = l, lend - 1
         e( i ) = e( i )**2
   40 CONTINUE
*
*     Choose between QL and QR iteration
*
*     Swapping L and LEND makes LEND < L, which selects the QR branch
*     of the IF below.
*
      IF( abs( d( lend ) ).LT.abs( d( l ) ) ) THEN
         lend = lsv
         l = lendsv
      END IF
*
      IF( lend.GE.l ) THEN
*
*        QL Iteration
*
*        Look for small subdiagonal element.
*
   50    CONTINUE
         IF( l.NE.lend ) THEN
            DO 60 m = l, lend - 1
               IF( abs( e( m ) ).LE.eps2*abs( d( m )*d( m+1 ) ) )
     $            GO TO 70
   60       CONTINUE
         END IF
         m = lend
*
*        Label 70: rows L..M form the sub-block being worked on.
*        M = L means D(L) has converged (label 90).
*
   70    CONTINUE
         IF( m.LT.lend )
     $      e( m ) = zero
         p = d( l )
         IF( m.EQ.l )
     $      GO TO 90
*
*        If remaining matrix is 2 by 2, use DLAE2 to compute its
*        eigenvalues.
*
         IF( m.EQ.l+1 ) THEN
            rte = sqrt( e( l ) )
            CALL dlae2( d( l ), rte, d( l+1 ), rt1, rt2 )
            d( l ) = rt1
            d( l+1 ) = rt2
            e( l ) = zero
            l = l + 2
            IF( l.LE.lend )
     $         GO TO 50
            GO TO 150
         END IF
*
*        Give up on this block once the iteration budget is spent.
*
         IF( jtot.EQ.nmaxit )
     $      GO TO 150
         jtot = jtot + 1
*
*        Form shift.
*
         rte = sqrt( e( l ) )
         sigma = ( d( l+1 )-p ) / ( two*rte )
         r = dlapy2( sigma, one )
         sigma = p - ( rte / ( sigma+sign( r, sigma ) ) )
*
         c = one
         s = zero
         gamma = d( m ) - sigma
         p = gamma*gamma
*
*        Inner loop
*
*        The C = 0 branch avoids dividing by zero when P is updated.
*
         DO 80 i = m - 1, l, -1
            bb = e( i )
            r = p + bb
            IF( i.NE.m-1 )
     $         e( i+1 ) = s*r
            oldc = c
            c = p / r
            s = bb / r
            oldgam = gamma
            alpha = d( i )
            gamma = c*( alpha-sigma ) - s*oldgam
            d( i+1 ) = oldgam + ( alpha-gamma )
            IF( c.NE.zero ) THEN
               p = ( gamma*gamma ) / c
            ELSE
               p = oldc*bb
            END IF
   80    CONTINUE
*
         e( l ) = s*p
         d( l ) = sigma + gamma
         GO TO 50
*
*        Eigenvalue found.
*
   90    CONTINUE
         d( l ) = p
*
         l = l + 1
         IF( l.LE.lend )
     $      GO TO 50
         GO TO 150
*
      ELSE
*
*        QR Iteration
*
*        Look for small superdiagonal element.
*
  100    CONTINUE
         DO 110 m = l, lend + 1, -1
            IF( abs( e( m-1 ) ).LE.eps2*abs( d( m )*d( m-1 ) ) )
     $         GO TO 120
  110    CONTINUE
         m = lend
*
*        Label 120: rows M..L form the sub-block being worked on.
*        M = L means D(L) has converged (label 140).
*
  120    CONTINUE
         IF( m.GT.lend )
     $      e( m-1 ) = zero
         p = d( l )
         IF( m.EQ.l )
     $      GO TO 140
*
*        If remaining matrix is 2 by 2, use DLAE2 to compute its
*        eigenvalues.
*
         IF( m.EQ.l-1 ) THEN
            rte = sqrt( e( l-1 ) )
            CALL dlae2( d( l ), rte, d( l-1 ), rt1, rt2 )
            d( l ) = rt1
            d( l-1 ) = rt2
            e( l-1 ) = zero
            l = l - 2
            IF( l.GE.lend )
     $         GO TO 100
            GO TO 150
         END IF
*
*        Give up on this block once the iteration budget is spent.
*
         IF( jtot.EQ.nmaxit )
     $      GO TO 150
         jtot = jtot + 1
*
*        Form shift.
*
         rte = sqrt( e( l-1 ) )
         sigma = ( d( l-1 )-p ) / ( two*rte )
         r = dlapy2( sigma, one )
         sigma = p - ( rte / ( sigma+sign( r, sigma ) ) )
*
         c = one
         s = zero
         gamma = d( m ) - sigma
         p = gamma*gamma
*
*        Inner loop
*
*        The C = 0 branch avoids dividing by zero when P is updated.
*
         DO 130 i = m, l - 1
            bb = e( i )
            r = p + bb
            IF( i.NE.m )
     $         e( i-1 ) = s*r
            oldc = c
            c = p / r
            s = bb / r
            oldgam = gamma
            alpha = d( i+1 )
            gamma = c*( alpha-sigma ) - s*oldgam
            d( i ) = oldgam + ( alpha-gamma )
            IF( c.NE.zero ) THEN
               p = ( gamma*gamma ) / c
            ELSE
               p = oldc*bb
            END IF
  130    CONTINUE
*
         e( l-1 ) = s*p
         d( l ) = sigma + gamma
         GO TO 100
*
*        Eigenvalue found.
*
  140    CONTINUE
         d( l ) = p
*
         l = l - 1
         IF( l.GE.lend )
     $      GO TO 100
         GO TO 150
*
      END IF
*
*     Undo scaling if necessary
*
*     Only D is rescaled, over the saved bounds LSV..LENDSV; E is not
*     restored.
*
  150 CONTINUE
      IF( iscale.EQ.1 )
     $   CALL dlascl( 'G', 0, 0, ssfmax, anorm, lendsv-lsv+1, 1,
     $                d( lsv ), n, info )
      IF( iscale.EQ.2 )
     $   CALL dlascl( 'G', 0, 0, ssfmin, anorm, lendsv-lsv+1, 1,
     $                d( lsv ), n, info )
*
*     Check for no convergence to an eigenvalue after a total
*     of N*MAXIT iterations.
*
*     With budget left, move on to the next block.  Otherwise INFO is
*     incremented once per nonzero E(I) and the routine returns
*     through label 180, skipping the sort at label 170.
*
      IF( jtot.LT.nmaxit )
     $   GO TO 10
      DO 160 i = 1, n - 1
         IF( e( i ).NE.zero )
     $      info = info + 1
  160 CONTINUE
      GO TO 180
*
*     Sort eigenvalues in increasing order.
*
  170 CONTINUE
      CALL dlasrt( 'I', n, d, info )
*
  180 CONTINUE
      RETURN
*
*     End of DSTERF
*

◆ iladiag()

integer function iladiag ( character diag )

ILADIAG

Download ILADIAG + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> This subroutine translates from a character string specifying if a
!> matrix has unit diagonal or not to the relevant BLAST-specified
!> integer constant.
!>
!> ILADIAG returns an INTEGER.  If ILADIAG < 0, then the input is not a
!> character indicating a unit or non-unit diagonal.  Otherwise ILADIAG
!> returns the constant value corresponding to DIAG.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 57 of file iladiag.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Maps the DIAG character onto an integer code: 'N' gives the
*     non-unit-diagonal constant, 'U' the unit-diagonal constant, and
*     any other character gives -1.  Matching is done by LSAME.
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            BLAS_NON_UNIT_DIAG
      parameter( blas_non_unit_diag = 131 )
      INTEGER            BLAS_UNIT_DIAG
      parameter( blas_unit_diag = 132 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. Executable Statements ..
*
*     Start from the "not recognised" code; overwrite it on a match.
*
      iladiag = -1
      IF( lsame( diag, 'N' ) ) THEN
         iladiag = blas_non_unit_diag
      ELSE IF( lsame( diag, 'U' ) ) THEN
         iladiag = blas_unit_diag
      END IF
      RETURN
*
*     End of ILADIAG
*

◆ ilaprec()

integer function ilaprec ( character prec )

ILAPREC

Download ILAPREC + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> This subroutine translates from a character string specifying an
!> intermediate precision to the relevant BLAST-specified integer
!> constant.
!>
!> ILAPREC returns an INTEGER.  If ILAPREC < 0, then the input is not a
!> character indicating a supported intermediate precision.  Otherwise
!> ILAPREC returns the constant value corresponding to PREC.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 57 of file ilaprec.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Maps the PREC character onto an integer code: 'S' single,
*     'D' double, 'I' indigenous, 'X' or 'E' extra.  Any other
*     character gives -1.  Matching is done by LSAME.
*
*     .. Scalar Arguments ..
      CHARACTER          PREC
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            BLAS_PREC_SINGLE
      parameter( blas_prec_single = 211 )
      INTEGER            BLAS_PREC_DOUBLE
      parameter( blas_prec_double = 212 )
      INTEGER            BLAS_PREC_INDIGENOUS
      parameter( blas_prec_indigenous = 213 )
      INTEGER            BLAS_PREC_EXTRA
      parameter( blas_prec_extra = 214 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. Executable Statements ..
*
*     Start from the "not recognised" code; overwrite it on a match.
*     'X' and 'E' are two spellings of the same extra-precision code.
*
      ilaprec = -1
      IF( lsame( prec, 'S' ) ) THEN
         ilaprec = blas_prec_single
      ELSE IF( lsame( prec, 'D' ) ) THEN
         ilaprec = blas_prec_double
      ELSE IF( lsame( prec, 'I' ) ) THEN
         ilaprec = blas_prec_indigenous
      ELSE IF( lsame( prec, 'X' ) ) THEN
         ilaprec = blas_prec_extra
      ELSE IF( lsame( prec, 'E' ) ) THEN
         ilaprec = blas_prec_extra
      END IF
      RETURN
*
*     End of ILAPREC
*

◆ ilatrans()

integer function ilatrans ( character trans )

ILATRANS

Download ILATRANS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> This subroutine translates from a character string specifying a
!> transposition operation to the relevant BLAST-specified integer
!> constant.
!>
!> ILATRANS returns an INTEGER.  If ILATRANS < 0, then the input is not
!> a character indicating a transposition operator.  Otherwise ILATRANS
!> returns the constant value corresponding to TRANS.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 57 of file ilatrans.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Maps the TRANS character onto an integer code: 'N' no
*     transpose, 'T' transpose, 'C' conjugate transpose.  Any other
*     character gives -1.  Matching is done by LSAME.
*
*     .. Scalar Arguments ..
      CHARACTER          TRANS
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            BLAS_NO_TRANS
      parameter( blas_no_trans = 111 )
      INTEGER            BLAS_TRANS
      parameter( blas_trans = 112 )
      INTEGER            BLAS_CONJ_TRANS
      parameter( blas_conj_trans = 113 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. Executable Statements ..
*
*     Start from the "not recognised" code; overwrite it on a match.
*
      ilatrans = -1
      IF( lsame( trans, 'N' ) ) THEN
         ilatrans = blas_no_trans
      ELSE IF( lsame( trans, 'T' ) ) THEN
         ilatrans = blas_trans
      ELSE IF( lsame( trans, 'C' ) ) THEN
         ilatrans = blas_conj_trans
      END IF
      RETURN
*
*     End of ILATRANS
*

◆ ilauplo()

integer function ilauplo ( character uplo )

ILAUPLO

Download ILAUPLO + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> This subroutine translates from a character string specifying an
!> upper- or lower-triangular matrix to the relevant BLAST-specified
!> integer constant.
!>
!> ILAUPLO returns an INTEGER.  If ILAUPLO < 0, then the input is not
!> a character indicating an upper- or lower-triangular matrix.
!> Otherwise ILAUPLO returns the constant value corresponding to UPLO.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 57 of file ilauplo.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Maps the UPLO character onto an integer code: 'U' gives the
*     upper-triangular constant, 'L' the lower-triangular constant,
*     and any other character gives -1.  Matching is done by LSAME.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            BLAS_UPPER
      parameter( blas_upper = 121 )
      INTEGER            BLAS_LOWER
      parameter( blas_lower = 122 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. Executable Statements ..
*
*     Start from the "not recognised" code; overwrite it on a match.
*
      ilauplo = -1
      IF( lsame( uplo, 'U' ) ) THEN
         ilauplo = blas_upper
      ELSE IF( lsame( uplo, 'L' ) ) THEN
         ilauplo = blas_lower
      END IF
      RETURN
*
*     End of ILAUPLO
*

◆ sbdsdc()

subroutine sbdsdc	(	character	uplo,
		character	compq,
		integer	n,
		real, dimension( * )	d,
		real, dimension( * )	e,
		real, dimension( ldu, * )	u,
		integer	ldu,
		real, dimension( ldvt, * )	vt,
		integer	ldvt,
		real, dimension( * )	q,
		integer, dimension( * )	iq,
		real, dimension( * )	work,
		integer, dimension( * )	iwork,
		integer	info )

SBDSDC

Download SBDSDC + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SBDSDC computes the singular value decomposition (SVD) of a real
!> N-by-N (upper or lower) bidiagonal matrix B:  B = U * S * VT,
!> using a divide and conquer method, where S is a diagonal matrix
!> with non-negative diagonal elements (the singular values of B), and
!> U and VT are orthogonal matrices of left and right singular vectors,
!> respectively. SBDSDC can be used to compute all singular values,
!> and optionally, singular vectors or singular vectors in compact form.
!>
!> This code makes very mild assumptions about floating point
!> arithmetic. It will work on machines with a guard digit in
!> add/subtract, or on those binary machines without guard digits
!> which subtract like the Cray X-MP, Cray Y-MP, Cray C-90, or Cray-2.
!> It could conceivably fail on hexadecimal or decimal machines
!> without guard digits, but we know of none.  See SLASD3 for details.
!>
!> The code currently calls SLASDQ if singular values only are desired.
!> However, it can be slightly modified to compute singular values
!> using the divide and conquer method.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': B is upper bidiagonal. !> = 'L': B is lower bidiagonal. !>
[in]	COMPQ	!> COMPQ is CHARACTER*1 !> Specifies whether singular vectors are to be computed !> as follows: !> = 'N': Compute singular values only; !> = 'P': Compute singular values and compute singular !> vectors in compact form; !> = 'I': Compute singular values and singular vectors. !>
[in]	N	!> N is INTEGER !> The order of the matrix B. N >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the n diagonal elements of the bidiagonal matrix B. !> On exit, if INFO=0, the singular values of B. !>
[in,out]	E	!> E is REAL array, dimension (N-1) !> On entry, the elements of E contain the offdiagonal !> elements of the bidiagonal matrix whose SVD is desired. !> On exit, E has been destroyed. !>
[out]	U	!> U is REAL array, dimension (LDU,N) !> If COMPQ = 'I', then: !> On exit, if INFO = 0, U contains the left singular vectors !> of the bidiagonal matrix. !> For other values of COMPQ, U is not referenced. !>
[in]	LDU	!> LDU is INTEGER !> The leading dimension of the array U. LDU >= 1. !> If singular vectors are desired, then LDU >= max( 1, N ). !>
[out]	VT	!> VT is REAL array, dimension (LDVT,N) !> If COMPQ = 'I', then: !> On exit, if INFO = 0, VT**T contains the right singular !> vectors of the bidiagonal matrix. !> For other values of COMPQ, VT is not referenced. !>
[in]	LDVT	!> LDVT is INTEGER !> The leading dimension of the array VT. LDVT >= 1. !> If singular vectors are desired, then LDVT >= max( 1, N ). !>
[out]	Q	!> Q is REAL array, dimension (LDQ) !> If COMPQ = 'P', then: !> On exit, if INFO = 0, Q and IQ contain the left !> and right singular vectors in a compact form, !> requiring O(N log N) space instead of 2*N**2. !> In particular, Q contains all the REAL data in !> LDQ >= N*(11 + 2*SMLSIZ + 8*INT(LOG_2(N/(SMLSIZ+1)))) !> words of memory, where SMLSIZ is returned by ILAENV and !> is equal to the maximum size of the subproblems at the !> bottom of the computation tree (usually about 25). !> For other values of COMPQ, Q is not referenced. !>
[out]	IQ	!> IQ is INTEGER array, dimension (LDIQ) !> If COMPQ = 'P', then: !> On exit, if INFO = 0, Q and IQ contain the left !> and right singular vectors in a compact form, !> requiring O(N log N) space instead of 2*N**2. !> In particular, IQ contains all INTEGER data in !> LDIQ >= N*(3 + 3*INT(LOG_2(N/(SMLSIZ+1)))) !> words of memory, where SMLSIZ is returned by ILAENV and !> is equal to the maximum size of the subproblems at the !> bottom of the computation tree (usually about 25). !> For other values of COMPQ, IQ is not referenced. !>
[out]	WORK	!> WORK is REAL array, dimension (MAX(1,LWORK)) !> If COMPQ = 'N' then LWORK >= (4 * N). !> If COMPQ = 'P' then LWORK >= (6 * N). !> If COMPQ = 'I' then LWORK >= (3 * N**2 + 4 * N). !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (8*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: The algorithm failed to compute a singular value. !> The update process of divide and conquer failed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Ming Gu and Huan Ren, Computer Science Division, University of California at Berkeley, USA

Definition at line 203 of file sbdsdc.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          COMPQ, UPLO
      INTEGER            INFO, LDU, LDVT, N
*     ..
*     .. Array Arguments ..
      INTEGER            IQ( * ), IWORK( * )
      REAL               D( * ), E( * ), Q( * ), U( LDU, * ),
     $                   VT( LDVT, * ), WORK( * )
*     ..
*
*  =====================================================================
*  Changed dimension statement in comment describing E from (N) to
*  (N-1).  Sven, 17 Feb 05.
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE, TWO
      parameter( zero = 0.0e+0, one = 1.0e+0, two = 2.0e+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            DIFL, DIFR, GIVCOL, GIVNUM, GIVPTR, I, IC,
     $                   ICOMPQ, IERR, II, IS, IU, IUPLO, IVT, J, K, KK,
     $                   MLVL, NM1, NSIZE, PERM, POLES, QSTART, SMLSIZ,
     $                   SMLSZP, SQRE, START, WSTART, Z
      REAL               CS, EPS, ORGNRM, P, R, SN
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      REAL               SLAMCH, SLANST
      EXTERNAL           slamch, slanst, ilaenv, lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           scopy, slartg, slascl, slasd0, slasda, slasdq,
     $                   slaset, slasr, sswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          real, abs, int, log, sign
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
      iuplo = 0
      IF( lsame( uplo, 'U' ) )
     $   iuplo = 1
      IF( lsame( uplo, 'L' ) )
     $   iuplo = 2
      IF( lsame( compq, 'N' ) ) THEN
         icompq = 0
      ELSE IF( lsame( compq, 'P' ) ) THEN
         icompq = 1
      ELSE IF( lsame( compq, 'I' ) ) THEN
         icompq = 2
      ELSE
         icompq = -1
      END IF
      IF( iuplo.EQ.0 ) THEN
         info = -1
      ELSE IF( icompq.LT.0 ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( ( ldu.LT.1 ) .OR. ( ( icompq.EQ.2 ) .AND. ( ldu.LT.
     $         n ) ) ) THEN
         info = -7
      ELSE IF( ( ldvt.LT.1 ) .OR. ( ( icompq.EQ.2 ) .AND. ( ldvt.LT.
     $         n ) ) ) THEN
         info = -9
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SBDSDC', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
      smlsiz = ilaenv( 9, 'SBDSDC', ' ', 0, 0, 0, 0 )
      IF( n.EQ.1 ) THEN
         IF( icompq.EQ.1 ) THEN
            q( 1 ) = sign( one, d( 1 ) )
            q( 1+smlsiz*n ) = one
         ELSE IF( icompq.EQ.2 ) THEN
            u( 1, 1 ) = sign( one, d( 1 ) )
            vt( 1, 1 ) = one
         END IF
         d( 1 ) = abs( d( 1 ) )
         RETURN
      END IF
      nm1 = n - 1
*
*     If matrix lower bidiagonal, rotate to be upper bidiagonal
*     by applying Givens rotations on the left
*
      wstart = 1
      qstart = 3
      IF( icompq.EQ.1 ) THEN
         CALL scopy( n, d, 1, q( 1 ), 1 )
         CALL scopy( n-1, e, 1, q( n+1 ), 1 )
      END IF
      IF( iuplo.EQ.2 ) THEN
         qstart = 5
         IF( icompq .EQ. 2 ) wstart = 2*n - 1
         DO 10 i = 1, n - 1
            CALL slartg( d( i ), e( i ), cs, sn, r )
            d( i ) = r
            e( i ) = sn*d( i+1 )
            d( i+1 ) = cs*d( i+1 )
            IF( icompq.EQ.1 ) THEN
               q( i+2*n ) = cs
               q( i+3*n ) = sn
            ELSE IF( icompq.EQ.2 ) THEN
               work( i ) = cs
               work( nm1+i ) = -sn
            END IF
   10    CONTINUE
      END IF
*
*     If ICOMPQ = 0, use SLASDQ to compute the singular values.
*
      IF( icompq.EQ.0 ) THEN
*        Ignore WSTART, instead using WORK( 1 ), since the two vectors
*        for CS and -SN above are added only if ICOMPQ == 2,
*        and adding them exceeds documented WORK size of 4*n.
         CALL slasdq( 'U', 0, n, 0, 0, 0, d, e, vt, ldvt, u, ldu, u,
     $                ldu, work( 1 ), info )
         GO TO 40
      END IF
*
*     If N is smaller than the minimum divide size SMLSIZ, then solve
*     the problem with another solver.
*
      IF( n.LE.smlsiz ) THEN
         IF( icompq.EQ.2 ) THEN
            CALL slaset( 'A', n, n, zero, one, u, ldu )
            CALL slaset( 'A', n, n, zero, one, vt, ldvt )
            CALL slasdq( 'U', 0, n, n, n, 0, d, e, vt, ldvt, u, ldu, u,
     $                   ldu, work( wstart ), info )
         ELSE IF( icompq.EQ.1 ) THEN
            iu = 1
            ivt = iu + n
            CALL slaset( 'A', n, n, zero, one, q( iu+( qstart-1 )*n ),
     $                   n )
            CALL slaset( 'A', n, n, zero, one, q( ivt+( qstart-1 )*n ),
     $                   n )
            CALL slasdq( 'U', 0, n, n, n, 0, d, e,
     $                   q( ivt+( qstart-1 )*n ), n,
     $                   q( iu+( qstart-1 )*n ), n,
     $                   q( iu+( qstart-1 )*n ), n, work( wstart ),
     $                   info )
         END IF
         GO TO 40
      END IF
*
      IF( icompq.EQ.2 ) THEN
         CALL slaset( 'A', n, n, zero, one, u, ldu )
         CALL slaset( 'A', n, n, zero, one, vt, ldvt )
      END IF
*
*     Scale.
*
      orgnrm = slanst( 'M', n, d, e )
      IF( orgnrm.EQ.zero )
     $   RETURN
      CALL slascl( 'G', 0, 0, orgnrm, one, n, 1, d, n, ierr )
      CALL slascl( 'G', 0, 0, orgnrm, one, nm1, 1, e, nm1, ierr )
*
      eps = slamch( 'Epsilon' )
*
      mlvl = int( log( real( n ) / real( smlsiz+1 ) ) / log( two ) ) + 1
      smlszp = smlsiz + 1
*
      IF( icompq.EQ.1 ) THEN
         iu = 1
         ivt = 1 + smlsiz
         difl = ivt + smlszp
         difr = difl + mlvl
         z = difr + mlvl*2
         ic = z + mlvl
         is = ic + 1
         poles = is + 1
         givnum = poles + 2*mlvl
*
         k = 1
         givptr = 2
         perm = 3
         givcol = perm + mlvl
      END IF
*
      DO 20 i = 1, n
         IF( abs( d( i ) ).LT.eps ) THEN
            d( i ) = sign( eps, d( i ) )
         END IF
   20 CONTINUE
*
      start = 1
      sqre = 0
*
      DO 30 i = 1, nm1
         IF( ( abs( e( i ) ).LT.eps ) .OR. ( i.EQ.nm1 ) ) THEN
*
*        Subproblem found. First determine its size and then
*        apply divide and conquer on it.
*
            IF( i.LT.nm1 ) THEN
*
*        A subproblem with E(I) small for I < NM1.
*
               nsize = i - start + 1
            ELSE IF( abs( e( i ) ).GE.eps ) THEN
*
*        A subproblem with E(NM1) not too small but I = NM1.
*
               nsize = n - start + 1
            ELSE
*
*        A subproblem with E(NM1) small. This implies an
*        1-by-1 subproblem at D(N). Solve this 1-by-1 problem
*        first.
*
               nsize = i - start + 1
               IF( icompq.EQ.2 ) THEN
                  u( n, n ) = sign( one, d( n ) )
                  vt( n, n ) = one
               ELSE IF( icompq.EQ.1 ) THEN
                  q( n+( qstart-1 )*n ) = sign( one, d( n ) )
                  q( n+( smlsiz+qstart-1 )*n ) = one
               END IF
               d( n ) = abs( d( n ) )
            END IF
            IF( icompq.EQ.2 ) THEN
               CALL slasd0( nsize, sqre, d( start ), e( start ),
     $                      u( start, start ), ldu, vt( start, start ),
     $                      ldvt, smlsiz, iwork, work( wstart ), info )
            ELSE
               CALL slasda( icompq, smlsiz, nsize, sqre, d( start ),
     $                      e( start ), q( start+( iu+qstart-2 )*n ), n,
     $                      q( start+( ivt+qstart-2 )*n ),
     $                      iq( start+k*n ), q( start+( difl+qstart-2 )*
     $                      n ), q( start+( difr+qstart-2 )*n ),
     $                      q( start+( z+qstart-2 )*n ),
     $                      q( start+( poles+qstart-2 )*n ),
     $                      iq( start+givptr*n ), iq( start+givcol*n ),
     $                      n, iq( start+perm*n ),
     $                      q( start+( givnum+qstart-2 )*n ),
     $                      q( start+( ic+qstart-2 )*n ),
     $                      q( start+( is+qstart-2 )*n ),
     $                      work( wstart ), iwork, info )
            END IF
            IF( info.NE.0 ) THEN
               RETURN
            END IF
            start = i + 1
         END IF
   30 CONTINUE
*
*     Unscale
*
      CALL slascl( 'G', 0, 0, one, orgnrm, n, 1, d, n, ierr )
   40 CONTINUE
*
*     Use Selection Sort to minimize swaps of singular vectors
*
      DO 60 ii = 2, n
         i = ii - 1
         kk = i
         p = d( i )
         DO 50 j = ii, n
            IF( d( j ).GT.p ) THEN
               kk = j
               p = d( j )
            END IF
   50    CONTINUE
         IF( kk.NE.i ) THEN
            d( kk ) = d( i )
            d( i ) = p
            IF( icompq.EQ.1 ) THEN
               iq( i ) = kk
            ELSE IF( icompq.EQ.2 ) THEN
               CALL sswap( n, u( 1, i ), 1, u( 1, kk ), 1 )
               CALL sswap( n, vt( i, 1 ), ldvt, vt( kk, 1 ), ldvt )
            END IF
         ELSE IF( icompq.EQ.1 ) THEN
            iq( i ) = i
         END IF
   60 CONTINUE
*
*     If ICOMPQ = 1, use IQ(N,1) as the indicator for UPLO
*
      IF( icompq.EQ.1 ) THEN
         IF( iuplo.EQ.1 ) THEN
            iq( n ) = 1
         ELSE
            iq( n ) = 0
         END IF
      END IF
*
*     If B is lower bidiagonal, update U by those Givens rotations
*     which rotated B to be upper bidiagonal
*
      IF( ( iuplo.EQ.2 ) .AND. ( icompq.EQ.2 ) )
     $   CALL slasr( 'L', 'V', 'B', n, n, work( 1 ), work( n ), u, ldu )
*
      RETURN
*
*     End of SBDSDC
*

◆ sbdsqr()

subroutine sbdsqr	(	character	uplo,
		integer	n,
		integer	ncvt,
		integer	nru,
		integer	ncc,
		real, dimension( * )	d,
		real, dimension( * )	e,
		real, dimension( ldvt, * )	vt,
		integer	ldvt,
		real, dimension( ldu, * )	u,
		integer	ldu,
		real, dimension( ldc, * )	c,
		integer	ldc,
		real, dimension( * )	work,
		integer	info )

SBDSQR

Download SBDSQR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SBDSQR computes the singular values and, optionally, the right and/or
!> left singular vectors from the singular value decomposition (SVD) of
!> a real N-by-N (upper or lower) bidiagonal matrix B using the implicit
!> zero-shift QR algorithm.  The SVD of B has the form
!>
!>    B = Q * S * P**T
!>
!> where S is the diagonal matrix of singular values, Q is an orthogonal
!> matrix of left singular vectors, and P is an orthogonal matrix of
!> right singular vectors.  If left singular vectors are requested, this
!> subroutine actually returns U*Q instead of Q, and, if right singular
!> vectors are requested, this subroutine returns P**T*VT instead of
!> P**T, for given real input matrices U and VT.  When U and VT are the
!> orthogonal matrices that reduce a general matrix A to bidiagonal
!> form:  A = U*B*VT, as computed by SGEBRD, then
!>
!>    A = (U*Q) * S * (P**T*VT)
!>
!> is the SVD of A.  Optionally, the subroutine may also compute Q**T*C
!> for a given real input matrix C.
!>
!> See "Computing Small Singular Values of Bidiagonal Matrices With
!> Guaranteed High Relative Accuracy," by J. Demmel and W. Kahan,
!> LAPACK Working Note #3 (or SIAM J. Sci. Statist. Comput. vol. 11,
!> no. 5, pp. 873-912, Sept 1990) and
!> "Accurate singular values and differential qd algorithms," by
!> B. Parlett and V. Fernando, Technical Report CPAM-554, Mathematics
!> Department, University of California at Berkeley, July 1992
!> for a detailed description of the algorithm.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': B is upper bidiagonal; !> = 'L': B is lower bidiagonal. !>
[in]	N	!> N is INTEGER !> The order of the matrix B. N >= 0. !>
[in]	NCVT	!> NCVT is INTEGER !> The number of columns of the matrix VT. NCVT >= 0. !>
[in]	NRU	!> NRU is INTEGER !> The number of rows of the matrix U. NRU >= 0. !>
[in]	NCC	!> NCC is INTEGER !> The number of columns of the matrix C. NCC >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the n diagonal elements of the bidiagonal matrix B. !> On exit, if INFO=0, the singular values of B in decreasing !> order. !>
[in,out]	E	!> E is REAL array, dimension (N-1) !> On entry, the N-1 offdiagonal elements of the bidiagonal !> matrix B. !> On exit, if INFO = 0, E is destroyed; if INFO > 0, D and E !> will contain the diagonal and superdiagonal elements of a !> bidiagonal matrix orthogonally equivalent to the one given !> as input. !>
[in,out]	VT	!> VT is REAL array, dimension (LDVT, NCVT) !> On entry, an N-by-NCVT matrix VT. !> On exit, VT is overwritten by P**T * VT. !> Not referenced if NCVT = 0. !>
[in]	LDVT	!> LDVT is INTEGER !> The leading dimension of the array VT. !> LDVT >= max(1,N) if NCVT > 0; LDVT >= 1 if NCVT = 0. !>
[in,out]	U	!> U is REAL array, dimension (LDU, N) !> On entry, an NRU-by-N matrix U. !> On exit, U is overwritten by U * Q. !> Not referenced if NRU = 0. !>
[in]	LDU	!> LDU is INTEGER !> The leading dimension of the array U. LDU >= max(1,NRU). !>
[in,out]	C	!> C is REAL array, dimension (LDC, NCC) !> On entry, an N-by-NCC matrix C. !> On exit, C is overwritten by Q**T * C. !> Not referenced if NCC = 0. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. !> LDC >= max(1,N) if NCC > 0; LDC >=1 if NCC = 0. !>
[out]	WORK	!> WORK is REAL array, dimension (4*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: If INFO = -i, the i-th argument had an illegal value !> > 0: !> if NCVT = NRU = NCC = 0, !> = 1, a split was marked by a positive value in E !> = 2, current block of Z not diagonalized after 30*N !> iterations (in inner while loop) !> = 3, termination criterion of outer while loop not met !> (program created more than N unreduced blocks) !> else (at least one of NCVT, NRU, NCC is nonzero), !> the algorithm did not converge; D and E contain the !> elements of a bidiagonal matrix which is orthogonally !> similar to the input matrix B; if INFO = i, i !> elements of E have not converged to zero. !>

Internal Parameters:

!>  TOLMUL  REAL, default = max(10,min(100,EPS**(-1/8)))
!>          TOLMUL controls the convergence criterion of the QR loop.
!>          If it is positive, TOLMUL*EPS is the desired relative
!>             precision in the computed singular values.
!>          If it is negative, abs(TOLMUL*EPS*sigma_max) is the
!>             desired absolute accuracy in the computed singular
!>             values (corresponds to relative accuracy
!>             abs(TOLMUL*EPS) in the largest singular value).
!>          abs(TOLMUL) should be between 1 and 1/EPS, and preferably
!>             between 10 (for fast convergence) and .1/EPS
!>             (for there to be some accuracy in the results).
!>          Default is to lose at either one eighth or 2 of the
!>             available decimal digits in each computed singular value
!>             (whichever is smaller).
!>
!>  MAXITR  INTEGER, default = 6
!>          MAXITR controls the maximum number of passes of the
!>          algorithm through its inner loop. The algorithm stops
!>          (and so fails to converge) if the number of passes
!>          through the inner loop exceeds MAXITR*N**2.
!>

Note:

!>  Bug report from Cezary Dendek.
!>  On March 23rd 2017, the INTEGER variable MAXIT = MAXITR*N**2 was
!>  removed since it can overflow pretty easily (for N greater than or
!>  equal to 18,919). We instead use MAXITDIVN = MAXITR*N.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 238 of file sbdsqr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of SBDSQR.  D (diagonal) and E (off-diagonal) describe an
*     N-by-N bidiagonal matrix.  The code below reduces E to zero by
*     QR sweeps, applies the accumulated plane rotations to VT, U
*     and C whenever NCVT, NRU or NCC is positive, makes the
*     entries of D non-negative and finally sorts them into
*     decreasing order.  INFO > 0 on return signals nonconvergence.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDC, LDU, LDVT, N, NCC, NCVT, NRU
*     ..
*     .. Array Arguments ..
      REAL               C( LDC, * ), D( * ), E( * ), U( LDU, * ),
     $                   VT( LDVT, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO
      parameter( zero = 0.0e0 )
      REAL               ONE
      parameter( one = 1.0e0 )
      REAL               NEGONE
      parameter( negone = -1.0e0 )
      REAL               HNDRTH
      parameter( hndrth = 0.01e0 )
      REAL               TEN
      parameter( ten = 10.0e0 )
      REAL               HNDRD
      parameter( hndrd = 100.0e0 )
      REAL               MEIGTH
      parameter( meigth = -0.125e0 )
      INTEGER            MAXITR
      parameter( maxitr = 6 )
*     ..
*     .. Local Scalars ..
      LOGICAL            LOWER, ROTATE
      INTEGER            I, IDIR, ISUB, ITER, ITERDIVN, J, LL, LLL, M,
     $                   MAXITDIVN, NM1, NM12, NM13, OLDLL, OLDM
      REAL               ABSE, ABSS, COSL, COSR, CS, EPS, F, G, H, MU,
     $                   OLDCS, OLDSN, R, SHIFT, SIGMN, SIGMX, SINL,
     $                   SINR, SLL, SMAX, SMIN, SMINL,  SMINOA,
     $                   SN, THRESH, TOL, TOLMUL, UNFL
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SLAMCH
      EXTERNAL           lsame, slamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           slartg, slas2, slasq1, slasr, slasv2, srot,
     $                   sscal, sswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, real, sign, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      lower = lsame( uplo, 'L' )
      IF( .NOT.lsame( uplo, 'U' ) .AND. .NOT.lower ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ncvt.LT.0 ) THEN
         info = -3
      ELSE IF( nru.LT.0 ) THEN
         info = -4
      ELSE IF( ncc.LT.0 ) THEN
         info = -5
      ELSE IF( ( ncvt.EQ.0 .AND. ldvt.LT.1 ) .OR.
     $         ( ncvt.GT.0 .AND. ldvt.LT.max( 1, n ) ) ) THEN
         info = -9
      ELSE IF( ldu.LT.max( 1, nru ) ) THEN
         info = -11
      ELSE IF( ( ncc.EQ.0 .AND. ldc.LT.1 ) .OR.
     $         ( ncc.GT.0 .AND. ldc.LT.max( 1, n ) ) ) THEN
         info = -13
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SBDSQR', -info )
         RETURN
      END IF
      IF( n.EQ.0 )
     $   RETURN
*
*     A 1-by-1 matrix needs no iteration: only the sign fix-up
*     at label 160 is required.
*
      IF( n.EQ.1 )
     $   GO TO 160
*
*     ROTATE is true if any singular vectors desired, false otherwise
*
      rotate = ( ncvt.GT.0 ) .OR. ( nru.GT.0 ) .OR. ( ncc.GT.0 )
*
*     If no singular vectors desired, use qd algorithm
*
      IF( .NOT.rotate ) THEN
         CALL slasq1( n, d, e, work, info )
*
*     If INFO equals 2, dqds didn't finish, try to finish
*
         IF( info .NE. 2 ) RETURN
         info = 0
      END IF
*
*     NM1, NM12 and NM13 are the offsets of the second, third and
*     fourth length-(N-1) segments of WORK used to store rotations.
*
      nm1 = n - 1
      nm12 = nm1 + nm1
      nm13 = nm12 + nm1
      idir = 0
*
*     Get machine constants
*
      eps = slamch( 'Epsilon' )
      unfl = slamch( 'Safe minimum' )
*
*     If matrix lower bidiagonal, rotate to be upper bidiagonal
*     by applying Givens rotations on the left
*
      IF( lower ) THEN
         DO 10 i = 1, n - 1
            CALL slartg( d( i ), e( i ), cs, sn, r )
            d( i ) = r
            e( i ) = sn*d( i+1 )
            d( i+1 ) = cs*d( i+1 )
            work( i ) = cs
            work( nm1+i ) = sn
   10    CONTINUE
*
*        Update singular vectors if desired
*
         IF( nru.GT.0 )
     $      CALL slasr( 'R', 'V', 'F', nru, n, work( 1 ), work( n ), u,
     $                  ldu )
         IF( ncc.GT.0 )
     $      CALL slasr( 'L', 'V', 'F', n, ncc, work( 1 ), work( n ), c,
     $                  ldc )
      END IF
*
*     Compute singular values to relative accuracy TOL
*     (By setting TOL to be negative, algorithm will compute
*     singular values to absolute accuracy ABS(TOL)*norm(input matrix))
*
      tolmul = max( ten, min( hndrd, eps**meigth ) )
      tol = tolmul*eps
*
*     Compute approximate maximum, minimum singular values
*
      smax = zero
      DO 20 i = 1, n
         smax = max( smax, abs( d( i ) ) )
   20 CONTINUE
      DO 30 i = 1, n - 1
         smax = max( smax, abs( e( i ) ) )
   30 CONTINUE
      sminl = zero
      IF( tol.GE.zero ) THEN
*
*        Relative accuracy desired
*
         sminoa = abs( d( 1 ) )
         IF( sminoa.EQ.zero )
     $      GO TO 50
         mu = sminoa
         DO 40 i = 2, n
            mu = abs( d( i ) )*( mu / ( mu+abs( e( i-1 ) ) ) )
            sminoa = min( sminoa, mu )
            IF( sminoa.EQ.zero )
     $         GO TO 50
   40    CONTINUE
   50    CONTINUE
         sminoa = sminoa / sqrt( real( n ) )
         thresh = max( tol*sminoa, maxitr*(n*(n*unfl)) )
      ELSE
*
*        Absolute accuracy desired
*
         thresh = max( abs( tol )*smax, maxitr*(n*(n*unfl)) )
      END IF
*
*     Prepare for main iteration loop for the singular values
*     (MAXITDIVN*N is the maximum number of passes through the
*     inner loop permitted before nonconvergence signalled.  The
*     count is kept as the pair ITERDIVN, ITER so that the product
*     MAXITR*N**2 is never formed in INTEGER arithmetic.)
*
      maxitdivn = maxitr*n
      iterdivn = 0
      iter = -1
      oldll = -1
      oldm = -1
*
*     M points to last element of unconverged part of matrix
*
      m = n
*
*     Begin main iteration loop
*
   60 CONTINUE
*
*     Check for convergence or exceeding iteration count
*
      IF( m.LE.1 )
     $   GO TO 160
*
*     Every N inner passes are folded into one unit of ITERDIVN.
*
      IF( iter.GE.n ) THEN
         iter = iter - n
         iterdivn = iterdivn + 1
         IF( iterdivn.GE.maxitdivn )
     $      GO TO 200
      END IF
*
*     Find diagonal block of matrix to work on
*     (only SMAX of the block is needed below; the smallest
*     singular value estimate SMINL is formed by the convergence
*     tests further down)
*
      IF( tol.LT.zero .AND. abs( d( m ) ).LE.thresh )
     $   d( m ) = zero
      smax = abs( d( m ) )
      DO 70 lll = 1, m - 1
         ll = m - lll
         abss = abs( d( ll ) )
         abse = abs( e( ll ) )
         IF( tol.LT.zero .AND. abss.LE.thresh )
     $      d( ll ) = zero
         IF( abse.LE.thresh )
     $      GO TO 80
         smax = max( smax, abss, abse )
   70 CONTINUE
      ll = 0
      GO TO 90
   80 CONTINUE
      e( ll ) = zero
*
*     Matrix splits since E(LL) = 0
*
      IF( ll.EQ.m-1 ) THEN
*
*        Convergence of bottom singular value, return to top of loop
*
         m = m - 1
         GO TO 60
      END IF
   90 CONTINUE
      ll = ll + 1
*
*     E(LL) through E(M-1) are nonzero, E(LL-1) is zero
*
      IF( ll.EQ.m-1 ) THEN
*
*        2 by 2 block, handle separately
*
         CALL slasv2( d( m-1 ), e( m-1 ), d( m ), sigmn, sigmx, sinr,
     $                cosr, sinl, cosl )
         d( m-1 ) = sigmx
         e( m-1 ) = zero
         d( m ) = sigmn
*
*        Compute singular vectors, if desired
*
         IF( ncvt.GT.0 )
     $      CALL srot( ncvt, vt( m-1, 1 ), ldvt, vt( m, 1 ), ldvt, cosr,
     $                 sinr )
         IF( nru.GT.0 )
     $      CALL srot( nru, u( 1, m-1 ), 1, u( 1, m ), 1, cosl, sinl )
         IF( ncc.GT.0 )
     $      CALL srot( ncc, c( m-1, 1 ), ldc, c( m, 1 ), ldc, cosl,
     $                 sinl )
         m = m - 2
         GO TO 60
      END IF
*
*     If working on new submatrix, choose shift direction
*     (from larger end diagonal element towards smaller)
*
      IF( ll.GT.oldm .OR. m.LT.oldll ) THEN
         IF( abs( d( ll ) ).GE.abs( d( m ) ) ) THEN
*
*           Chase bulge from top (big end) to bottom (small end)
*
            idir = 1
         ELSE
*
*           Chase bulge from bottom (big end) to top (small end)
*
            idir = 2
         END IF
      END IF
*
*     Apply convergence tests
*
      IF( idir.EQ.1 ) THEN
*
*        Run convergence test in forward direction
*        First apply standard test to bottom of matrix
*
         IF( abs( e( m-1 ) ).LE.abs( tol )*abs( d( m ) ) .OR.
     $       ( tol.LT.zero .AND. abs( e( m-1 ) ).LE.thresh ) ) THEN
            e( m-1 ) = zero
            GO TO 60
         END IF
*
         IF( tol.GE.zero ) THEN
*
*           If relative accuracy desired,
*           apply convergence criterion forward
*
            mu = abs( d( ll ) )
            sminl = mu
            DO 100 lll = ll, m - 1
               IF( abs( e( lll ) ).LE.tol*mu ) THEN
                  e( lll ) = zero
                  GO TO 60
               END IF
               mu = abs( d( lll+1 ) )*( mu / ( mu+abs( e( lll ) ) ) )
               sminl = min( sminl, mu )
  100       CONTINUE
         END IF
*
      ELSE
*
*        Run convergence test in backward direction
*        First apply standard test to top of matrix
*
         IF( abs( e( ll ) ).LE.abs( tol )*abs( d( ll ) ) .OR.
     $       ( tol.LT.zero .AND. abs( e( ll ) ).LE.thresh ) ) THEN
            e( ll ) = zero
            GO TO 60
         END IF
*
         IF( tol.GE.zero ) THEN
*
*           If relative accuracy desired,
*           apply convergence criterion backward
*
            mu = abs( d( m ) )
            sminl = mu
            DO 110 lll = m - 1, ll, -1
               IF( abs( e( lll ) ).LE.tol*mu ) THEN
                  e( lll ) = zero
                  GO TO 60
               END IF
               mu = abs( d( lll ) )*( mu / ( mu+abs( e( lll ) ) ) )
               sminl = min( sminl, mu )
  110       CONTINUE
         END IF
      END IF
      oldll = ll
      oldm = m
*
*     Compute shift.  First, test if shifting would ruin relative
*     accuracy, and if so set the shift to zero.
*
      IF( tol.GE.zero .AND. n*tol*( sminl / smax ).LE.
     $    max( eps, hndrth*tol ) ) THEN
*
*        Use a zero shift to avoid loss of relative accuracy
*
         shift = zero
      ELSE
*
*        Compute the shift from 2-by-2 block at end of matrix
*
         IF( idir.EQ.1 ) THEN
            sll = abs( d( ll ) )
            CALL slas2( d( m-1 ), e( m-1 ), d( m ), shift, r )
         ELSE
            sll = abs( d( m ) )
            CALL slas2( d( ll ), e( ll ), d( ll+1 ), shift, r )
         END IF
*
*        Test if shift negligible, and if so set to zero
*
         IF( sll.GT.zero ) THEN
            IF( ( shift / sll )**2.LT.eps )
     $         shift = zero
         END IF
      END IF
*
*     Increment iteration count
*
      iter = iter + m - ll
*
*     If SHIFT = 0, do simplified QR iteration
*
      IF( shift.EQ.zero ) THEN
         IF( idir.EQ.1 ) THEN
*
*           Chase bulge from top to bottom
*           Save cosines and sines for later singular vector updates
*           (CS/SN go to the first two segments of WORK, OLDCS/OLDSN
*           to the third and fourth)
*
            cs = one
            oldcs = one
            DO 120 i = ll, m - 1
               CALL slartg( d( i )*cs, e( i ), cs, sn, r )
               IF( i.GT.ll )
     $            e( i-1 ) = oldsn*r
               CALL slartg( oldcs*r, d( i+1 )*sn, oldcs, oldsn, d( i ) )
               work( i-ll+1 ) = cs
               work( i-ll+1+nm1 ) = sn
               work( i-ll+1+nm12 ) = oldcs
               work( i-ll+1+nm13 ) = oldsn
  120       CONTINUE
            h = d( m )*cs
            d( m ) = h*oldcs
            e( m-1 ) = h*oldsn
*
*           Update singular vectors
*
            IF( ncvt.GT.0 )
     $         CALL slasr( 'L', 'V', 'F', m-ll+1, ncvt, work( 1 ),
     $                     work( n ), vt( ll, 1 ), ldvt )
            IF( nru.GT.0 )
     $         CALL slasr( 'R', 'V', 'F', nru, m-ll+1, work( nm12+1 ),
     $                     work( nm13+1 ), u( 1, ll ), ldu )
            IF( ncc.GT.0 )
     $         CALL slasr( 'L', 'V', 'F', m-ll+1, ncc, work( nm12+1 ),
     $                     work( nm13+1 ), c( ll, 1 ), ldc )
*
*           Test convergence
*
            IF( abs( e( m-1 ) ).LE.thresh )
     $         e( m-1 ) = zero
*
         ELSE
*
*           Chase bulge from bottom to top
*           Save cosines and sines for later singular vector updates
*
            cs = one
            oldcs = one
            DO 130 i = m, ll + 1, -1
               CALL slartg( d( i )*cs, e( i-1 ), cs, sn, r )
               IF( i.LT.m )
     $            e( i ) = oldsn*r
               CALL slartg( oldcs*r, d( i-1 )*sn, oldcs, oldsn, d( i ) )
               work( i-ll ) = cs
               work( i-ll+nm1 ) = -sn
               work( i-ll+nm12 ) = oldcs
               work( i-ll+nm13 ) = -oldsn
  130       CONTINUE
            h = d( ll )*cs
            d( ll ) = h*oldcs
            e( ll ) = h*oldsn
*
*           Update singular vectors
*
            IF( ncvt.GT.0 )
     $         CALL slasr( 'L', 'V', 'B', m-ll+1, ncvt, work( nm12+1 ),
     $                     work( nm13+1 ), vt( ll, 1 ), ldvt )
            IF( nru.GT.0 )
     $         CALL slasr( 'R', 'V', 'B', nru, m-ll+1, work( 1 ),
     $                     work( n ), u( 1, ll ), ldu )
            IF( ncc.GT.0 )
     $         CALL slasr( 'L', 'V', 'B', m-ll+1, ncc, work( 1 ),
     $                     work( n ), c( ll, 1 ), ldc )
*
*           Test convergence
*
            IF( abs( e( ll ) ).LE.thresh )
     $         e( ll ) = zero
         END IF
      ELSE
*
*        Use nonzero shift
*
         IF( idir.EQ.1 ) THEN
*
*           Chase bulge from top to bottom
*           Save cosines and sines for later singular vector updates
*
            f = ( abs( d( ll ) )-shift )*
     $          ( sign( one, d( ll ) )+shift / d( ll ) )
            g = e( ll )
            DO 140 i = ll, m - 1
               CALL slartg( f, g, cosr, sinr, r )
               IF( i.GT.ll )
     $            e( i-1 ) = r
               f = cosr*d( i ) + sinr*e( i )
               e( i ) = cosr*e( i ) - sinr*d( i )
               g = sinr*d( i+1 )
               d( i+1 ) = cosr*d( i+1 )
               CALL slartg( f, g, cosl, sinl, r )
               d( i ) = r
               f = cosl*e( i ) + sinl*d( i+1 )
               d( i+1 ) = cosl*d( i+1 ) - sinl*e( i )
               IF( i.LT.m-1 ) THEN
                  g = sinl*e( i+1 )
                  e( i+1 ) = cosl*e( i+1 )
               END IF
               work( i-ll+1 ) = cosr
               work( i-ll+1+nm1 ) = sinr
               work( i-ll+1+nm12 ) = cosl
               work( i-ll+1+nm13 ) = sinl
  140       CONTINUE
            e( m-1 ) = f
*
*           Update singular vectors
*
            IF( ncvt.GT.0 )
     $         CALL slasr( 'L', 'V', 'F', m-ll+1, ncvt, work( 1 ),
     $                     work( n ), vt( ll, 1 ), ldvt )
            IF( nru.GT.0 )
     $         CALL slasr( 'R', 'V', 'F', nru, m-ll+1, work( nm12+1 ),
     $                     work( nm13+1 ), u( 1, ll ), ldu )
            IF( ncc.GT.0 )
     $         CALL slasr( 'L', 'V', 'F', m-ll+1, ncc, work( nm12+1 ),
     $                     work( nm13+1 ), c( ll, 1 ), ldc )
*
*           Test convergence
*
            IF( abs( e( m-1 ) ).LE.thresh )
     $         e( m-1 ) = zero
*
         ELSE
*
*           Chase bulge from bottom to top
*           Save cosines and sines for later singular vector updates
*
            f = ( abs( d( m ) )-shift )*( sign( one, d( m ) )+shift /
     $          d( m ) )
            g = e( m-1 )
            DO 150 i = m, ll + 1, -1
               CALL slartg( f, g, cosr, sinr, r )
               IF( i.LT.m )
     $            e( i ) = r
               f = cosr*d( i ) + sinr*e( i-1 )
               e( i-1 ) = cosr*e( i-1 ) - sinr*d( i )
               g = sinr*d( i-1 )
               d( i-1 ) = cosr*d( i-1 )
               CALL slartg( f, g, cosl, sinl, r )
               d( i ) = r
               f = cosl*e( i-1 ) + sinl*d( i-1 )
               d( i-1 ) = cosl*d( i-1 ) - sinl*e( i-1 )
               IF( i.GT.ll+1 ) THEN
                  g = sinl*e( i-2 )
                  e( i-2 ) = cosl*e( i-2 )
               END IF
               work( i-ll ) = cosr
               work( i-ll+nm1 ) = -sinr
               work( i-ll+nm12 ) = cosl
               work( i-ll+nm13 ) = -sinl
  150       CONTINUE
            e( ll ) = f
*
*           Test convergence
*
            IF( abs( e( ll ) ).LE.thresh )
     $         e( ll ) = zero
*
*           Update singular vectors if desired
*
            IF( ncvt.GT.0 )
     $         CALL slasr( 'L', 'V', 'B', m-ll+1, ncvt, work( nm12+1 ),
     $                     work( nm13+1 ), vt( ll, 1 ), ldvt )
            IF( nru.GT.0 )
     $         CALL slasr( 'R', 'V', 'B', nru, m-ll+1, work( 1 ),
     $                     work( n ), u( 1, ll ), ldu )
            IF( ncc.GT.0 )
     $         CALL slasr( 'L', 'V', 'B', m-ll+1, ncc, work( 1 ),
     $                     work( n ), c( ll, 1 ), ldc )
         END IF
      END IF
*
*     QR iteration finished, go back and check convergence
*
      GO TO 60
*
*     All singular values converged, so make them positive
*
  160 CONTINUE
      DO 170 i = 1, n
         IF( d( i ).EQ.zero ) THEN
*
*           Avoid -ZERO: a negative zero compares equal to ZERO and
*           would otherwise be returned with its sign bit set.
*
            d( i ) = zero
         END IF
*
         IF( d( i ).LT.zero ) THEN
            d( i ) = -d( i )
*
*           Change sign of singular vectors, if desired
*
            IF( ncvt.GT.0 )
     $         CALL sscal( ncvt, negone, vt( i, 1 ), ldvt )
         END IF
  170 CONTINUE
*
*     Sort the singular values into decreasing order (selection sort
*     on singular values, but only one transposition per singular
*     vector)
*
      DO 190 i = 1, n - 1
*
*        Scan for smallest D(I)
*
         isub = 1
         smin = d( 1 )
         DO 180 j = 2, n + 1 - i
            IF( d( j ).LE.smin ) THEN
               isub = j
               smin = d( j )
            END IF
  180    CONTINUE
         IF( isub.NE.n+1-i ) THEN
*
*           Swap singular values and vectors
*
            d( isub ) = d( n+1-i )
            d( n+1-i ) = smin
            IF( ncvt.GT.0 )
     $         CALL sswap( ncvt, vt( isub, 1 ), ldvt, vt( n+1-i, 1 ),
     $                     ldvt )
            IF( nru.GT.0 )
     $         CALL sswap( nru, u( 1, isub ), 1, u( 1, n+1-i ), 1 )
            IF( ncc.GT.0 )
     $         CALL sswap( ncc, c( isub, 1 ), ldc, c( n+1-i, 1 ), ldc )
         END IF
  190 CONTINUE
      GO TO 220
*
*     Maximum number of iterations exceeded, failure to converge
*     (INFO is set to the number of nonzero entries left in E)
*
  200 CONTINUE
      info = 0
      DO 210 i = 1, n - 1
         IF( e( i ).NE.zero )
     $      info = info + 1
  210 CONTINUE
  220 CONTINUE
      RETURN
*
*     End of SBDSQR
*

◆ sdisna()

subroutine sdisna	(	character	job,
		integer	m,
		integer	n,
		real, dimension( * )	d,
		real, dimension( * )	sep,
		integer	info )

SDISNA

Download SDISNA + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SDISNA computes the reciprocal condition numbers for the eigenvectors
!> of a real symmetric or complex Hermitian matrix or for the left or
!> right singular vectors of a general m-by-n matrix. The reciprocal
!> condition number is the 'gap' between the corresponding eigenvalue or
!> singular value and the nearest other one.
!>
!> The bound on the error, measured by angle in radians, in the I-th
!> computed vector is given by
!>
!>        SLAMCH( 'E' ) * ( ANORM / SEP( I ) )
!>
!> where ANORM = 2-norm(A) = max( abs( D(j) ) ).  SEP(I) is not allowed
!> to be smaller than SLAMCH( 'E' )*ANORM in order to limit the size of
!> the error bound.
!>
!> SDISNA may also be used to compute error bounds for eigenvectors of
!> the generalized symmetric definite eigenproblem.
!>

Parameters

[in]	JOB	!> JOB is CHARACTER*1 !> Specifies for which problem the reciprocal condition numbers !> should be computed: !> = 'E': the eigenvectors of a symmetric/Hermitian matrix; !> = 'L': the left singular vectors of a general matrix; !> = 'R': the right singular vectors of a general matrix. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix. M >= 0. !>
[in]	N	!> N is INTEGER !> If JOB = 'L' or 'R', the number of columns of the matrix, !> in which case N >= 0. Ignored if JOB = 'E'. !>
[in]	D	!> D is REAL array, dimension (M) if JOB = 'E' !> dimension (min(M,N)) if JOB = 'L' or 'R' !> The eigenvalues (if JOB = 'E') or singular values (if JOB = !> 'L' or 'R') of the matrix, in either increasing or decreasing !> order. If singular values, they must be non-negative. !>
[out]	SEP	!> SEP is REAL array, dimension (M) if JOB = 'E' !> dimension (min(M,N)) if JOB = 'L' or 'R' !> The reciprocal condition numbers of the vectors. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 116 of file sdisna.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          JOB
      INTEGER            INFO, M, N
*     ..
*     .. Array Arguments ..
      REAL               D( * ), SEP( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO
      parameter( zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            ASCEND, DESCND, WANTE, WANTL, WANTR, WANTSV
      INTEGER            IDX, NVAL
      REAL               DNORM, GAPNXT, GAPPRV, SEPMIN, SFMIN, ULP
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SLAMCH
      EXTERNAL           lsame, slamch
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Executable Statements ..
*
*     Decode JOB and work out how many values D and SEP hold:
*     M for the eigenvector problem, min(M,N) for singular vectors.
*
      info = 0
      wante = lsame( job, 'E' )
      wantl = lsame( job, 'L' )
      wantr = lsame( job, 'R' )
      wantsv = wantl .OR. wantr
      IF( wante ) THEN
         nval = m
      ELSE IF( wantsv ) THEN
         nval = min( m, n )
      END IF
*
*     Validate the arguments.  D must be monotone (either direction),
*     and singular values must in addition be non-negative, which is
*     checked on the smallest entry of the sorted sequence.
*
      IF( .NOT.( wante .OR. wantsv ) ) THEN
         info = -1
      ELSE IF( m.LT.0 ) THEN
         info = -2
      ELSE IF( nval.LT.0 ) THEN
         info = -3
      ELSE
         ascend = .true.
         descnd = .true.
         DO idx = 1, nval - 1
            IF( ascend ) ascend = d( idx ).LE.d( idx+1 )
            IF( descnd ) descnd = d( idx ).GE.d( idx+1 )
         END DO
         IF( wantsv .AND. nval.GT.0 ) THEN
            IF( ascend ) ascend = d( 1 ).GE.zero
            IF( descnd ) descnd = d( nval ).GE.zero
         END IF
         IF( .NOT.ascend .AND. .NOT.descnd ) info = -4
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SDISNA', -info )
         RETURN
      END IF
*
*     Nothing to compute for an empty problem
*
      IF( nval.EQ.0 ) RETURN
*
*     SEP(I) is the distance from D(I) to its nearest neighbour.
*     A single value has no neighbour, so its gap is the overflow
*     threshold.
*
      IF( nval.EQ.1 ) THEN
         sep( 1 ) = slamch( 'O' )
      ELSE
         gapprv = abs( d( 2 )-d( 1 ) )
         sep( 1 ) = gapprv
         DO idx = 2, nval - 1
            gapnxt = abs( d( idx+1 )-d( idx ) )
            sep( idx ) = min( gapprv, gapnxt )
            gapprv = gapnxt
         END DO
         sep( nval ) = gapprv
      END IF
*
*     For left vectors with M > N, or right vectors with M < N, the
*     gap of the smallest singular value is additionally limited by
*     that value itself.  WANTL or WANTR can only be set in the
*     singular-vector case, so no separate test of WANTSV is needed.
*
      IF( ( wantl .AND. m.GT.n ) .OR. ( wantr .AND. m.LT.n ) ) THEN
         IF( ascend ) sep( 1 ) = min( sep( 1 ), d( 1 ) )
         IF( descnd ) sep( nval ) = min( sep( nval ), d( nval ) )
      END IF
*
*     Clamp every reciprocal condition number from below so that the
*     resulting error bound stays finite.  D is sorted, so its norm
*     is attained at one of the two end points.
*
      ulp = slamch( 'E' )
      sfmin = slamch( 'S' )
      dnorm = max( abs( d( 1 ) ), abs( d( nval ) ) )
      IF( dnorm.NE.zero ) THEN
         sepmin = max( ulp*dnorm, sfmin )
      ELSE
         sepmin = ulp
      END IF
      DO idx = 1, nval
         sep( idx ) = max( sep( idx ), sepmin )
      END DO
*
      RETURN
*
*     End of SDISNA
*

◆ slaed0()

subroutine slaed0	(	integer	icompq,
		integer	qsiz,
		integer	n,
		real, dimension( * )	d,
		real, dimension( * )	e,
		real, dimension( ldq, * )	q,
		integer	ldq,
		real, dimension( ldqs, * )	qstore,
		integer	ldqs,
		real, dimension( * )	work,
		integer, dimension( * )	iwork,
		integer	info )

SLAED0 used by SSTEDC. Computes all eigenvalues and corresponding eigenvectors of an unreduced symmetric tridiagonal matrix using the divide and conquer method.

Download SLAED0 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLAED0 computes all eigenvalues and corresponding eigenvectors of a
!> symmetric tridiagonal matrix using the divide and conquer method.
!>

Parameters

[in]	ICOMPQ	!> ICOMPQ is INTEGER !> = 0: Compute eigenvalues only. !> = 1: Compute eigenvectors of original dense symmetric matrix !> also. On entry, Q contains the orthogonal matrix used !> to reduce the original matrix to tridiagonal form. !> = 2: Compute eigenvalues and eigenvectors of tridiagonal !> matrix. !>
[in]	QSIZ	!> QSIZ is INTEGER !> The dimension of the orthogonal matrix used to reduce !> the full matrix to tridiagonal form. QSIZ >= N if ICOMPQ = 1. !>
[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the main diagonal of the tridiagonal matrix. !> On exit, its eigenvalues. !>
[in]	E	!> E is REAL array, dimension (N-1) !> The off-diagonal elements of the tridiagonal matrix. !> On exit, E has been destroyed. !>
[in,out]	Q	!> Q is REAL array, dimension (LDQ, N) !> On entry, Q must contain an N-by-N orthogonal matrix. !> If ICOMPQ = 0 Q is not referenced. !> If ICOMPQ = 1 On entry, Q is a subset of the columns of the !> orthogonal matrix used to reduce the full !> matrix to tridiagonal form corresponding to !> the subset of the full matrix which is being !> decomposed at this time. !> If ICOMPQ = 2 On entry, Q will be the identity matrix. !> On exit, Q contains the eigenvectors of the !> tridiagonal matrix. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. If eigenvectors are !> desired, then LDQ >= max(1,N). In any case, LDQ >= 1. !>
[out]	QSTORE	!> QSTORE is REAL array, dimension (LDQS, N) !> Referenced only when ICOMPQ = 1. Used to store parts of !> the eigenvector matrix when the updating matrix multiplies !> take place. !>
[in]	LDQS	!> LDQS is INTEGER !> The leading dimension of the array QSTORE. If ICOMPQ = 1, !> then LDQS >= max(1,N). In any case, LDQS >= 1. !>
[out]	WORK	!> WORK is REAL array, !> If ICOMPQ = 0 or 1, the dimension of WORK must be at least !> 1 + 3*N + 2*N*lg N + 3*N**2 !> ( lg( N ) = smallest integer k !> such that 2^k >= N ) !> If ICOMPQ = 2, the dimension of WORK must be at least !> 4*N + N**2. !>
[out]	IWORK	!> IWORK is INTEGER array, !> If ICOMPQ = 0 or 1, the dimension of IWORK must be at least !> 6 + 6*N + 5*N*lg N. !> ( lg( N ) = smallest integer k !> such that 2^k >= N ) !> If ICOMPQ = 2, the dimension of IWORK must be at least !> 3 + 5*N. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: The algorithm failed to compute an eigenvalue while !> working on the submatrix lying in rows and columns !> INFO/(N+1) through mod(INFO,N+1). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA

Definition at line 170 of file slaed0.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            ICOMPQ, INFO, LDQ, LDQS, N, QSIZ
*     ..
*     .. Array Arguments ..
      INTEGER            IWORK( * )
      REAL               D( * ), E( * ), Q( LDQ, * ), QSTORE( LDQS, * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE, TWO
      parameter( zero = 0.e0, one = 1.e0, two = 2.e0 )
*     ..
*     .. Local Scalars ..
      INTEGER            CURLVL, CURPRB, CURR, I, IGIVCL, IGIVNM,
     $                   IGIVPT, INDXQ, IPERM, IPRMPT, IQ, IQPTR, IWREM,
     $                   J, K, LGN, MATSIZ, MSD2, SMLSIZ, SMM1, SPM1,
     $                   SPM2, SUBMAT, SUBPBS, TLVLS
      REAL               TEMP
*     ..
*     .. External Subroutines ..
      EXTERNAL           scopy, sgemm, slacpy, slaed1, slaed7, ssteqr,
     $                   xerbla
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, int, log, max, real
*     ..
*     .. Executable Statements ..
*
*     Overview of the body below:
*       1. validate the arguments;
*       2. repeatedly halve the problem until the last piece is no
*          larger than SMLSIZ, recording the piece boundaries in the
*          leading entries of IWORK;
*       3. apply the rank-one corrections to D at every cut;
*       4. solve each leaf subproblem with SSTEQR;
*       5. merge adjacent subproblems pairwise, level by level, with
*          SLAED1 (ICOMPQ = 2) or SLAED7 (ICOMPQ = 0 or 1);
*       6. apply the final sorting permutation to D (and to the
*          eigenvectors when they are requested).
*
*     Test the input parameters.
*
      info = 0
*
      IF( icompq.LT.0 .OR. icompq.GT.2 ) THEN
         info = -1
      ELSE IF( ( icompq.EQ.1 ) .AND. ( qsiz.LT.max( 0, n ) ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -7
      ELSE IF( ldqs.LT.max( 1, n ) ) THEN
         info = -9
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SLAED0', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     SMLSIZ is the size threshold used below to decide when to stop
*     splitting; it is obtained from ILAENV (ISPEC = 9).
*
      smlsiz = ilaenv( 9, 'SLAED0', ' ', 0, 0, 0, 0 )
*
*     Determine the size and placement of the submatrices, and save in
*     the leading elements of IWORK.
*
*     Each pass of the loop at label 10 replaces every size IWORK(J)
*     by its two halves, IWORK(J)/2 in slot 2*J-1 and (IWORK(J)+1)/2
*     in slot 2*J.  J runs downwards so that no slot is overwritten
*     before it has been read.  Only the last size, IWORK(SUBPBS), is
*     tested against SMLSIZ.  TLVLS counts the passes and SUBPBS the
*     resulting number of pieces.
*
      iwork( 1 ) = n
      subpbs = 1
      tlvls = 0
   10 CONTINUE
      IF( iwork( subpbs ).GT.smlsiz ) THEN
         DO 20 j = subpbs, 1, -1
            iwork( 2*j ) = ( iwork( j )+1 ) / 2
            iwork( 2*j-1 ) = iwork( j ) / 2
   20    CONTINUE
         tlvls = tlvls + 1
         subpbs = 2*subpbs
         GO TO 10
      END IF
*
*     Turn the sizes into running totals: afterwards IWORK(J) is the
*     index of the last row/column of the J-th piece.
*
      DO 30 j = 2, subpbs
         iwork( j ) = iwork( j ) + iwork( j-1 )
   30 CONTINUE
*
*     Divide the matrix into SUBPBS submatrices of size at most SMLSIZ+1
*     using rank-1 modifications (cuts).
*
*     At each cut, between rows SMM1 and SUBMAT, abs(E(SMM1)) is
*     subtracted from both neighbouring diagonal entries.
*
      spm1 = subpbs - 1
      DO 40 i = 1, spm1
         submat = iwork( i ) + 1
         smm1 = submat - 1
         d( smm1 ) = d( smm1 ) - abs( e( smm1 ) )
         d( submat ) = d( submat ) - abs( e( smm1 ) )
   40 CONTINUE
*
*     INDXQ is the offset into IWORK of the sorting permutation:
*     entry J of the permutation lives in IWORK(INDXQ+J).
*
      indxq = 4*n + 3
      IF( icompq.NE.2 ) THEN
*
*        Set up workspaces for eigenvalues only/accumulate new vectors
*        routine
*
*        LGN is meant to be the smallest integer with 2**LGN >= N.
*        It starts from the truncated floating-point log2(N) and is
*        bumped by one, at most twice, while 2**LGN is still below N
*        (presumably to absorb rounding in the logarithm).
*
         temp = log( real( n ) ) / log( two )
         lgn = int( temp )
         IF( 2**lgn.LT.n )
     $      lgn = lgn + 1
         IF( 2**lgn.LT.n )
     $      lgn = lgn + 1
*
*        Offsets into IWORK of the integer arrays handed to SLAED7
*
         iprmpt = indxq + n + 1
         iperm = iprmpt + n*lgn
         iqptr = iperm + n*lgn
         igivpt = iqptr + n + 2
         igivcl = igivpt + n*lgn
*
*        Offsets into WORK of the real arrays handed to SLAED7.
*        The region starting at IQ also receives the eigenvector
*        blocks of the leaf subproblems computed by SSTEQR below.
*
         igivnm = 1
         iq = igivnm + 2*n*lgn
         iwrem = iq + n**2 + 1
*
*        Initialize pointers
*
         DO 50 i = 0, subpbs
            iwork( iprmpt+i ) = 1
            iwork( igivpt+i ) = 1
   50    CONTINUE
         iwork( iqptr ) = 1
      END IF
*
*     Solve each submatrix eigenproblem at the bottom of the divide and
*     conquer tree.
*
*     For piece I (numbered from 0), SUBMAT is its first row/column
*     and MATSIZ its order.  CURR counts the eigenvector blocks
*     already stored in WORK; IWORK(IQPTR+CURR) is the 1-based
*     position of the next block relative to WORK(IQ), and each block
*     occupies MATSIZ**2 entries.
*
      curr = 0
      DO 70 i = 0, spm1
         IF( i.EQ.0 ) THEN
            submat = 1
            matsiz = iwork( 1 )
         ELSE
            submat = iwork( i ) + 1
            matsiz = iwork( i+1 ) - iwork( i )
         END IF
         IF( icompq.EQ.2 ) THEN
*
*           Eigenvectors of the tridiagonal piece go straight into
*           the matching diagonal block of Q.
*
            CALL ssteqr( 'I', matsiz, d( submat ), e( submat ),
     $                   q( submat, submat ), ldq, work, info )
            IF( info.NE.0 )
     $         GO TO 130
         ELSE
*
*           Eigenvectors of the piece are kept in WORK; for
*           ICOMPQ = 1 they are also multiplied into the matching
*           columns of Q and the product is stored in QSTORE.
*
            CALL ssteqr( 'I', matsiz, d( submat ), e( submat ),
     $                   work( iq-1+iwork( iqptr+curr ) ), matsiz, work,
     $                   info )
            IF( info.NE.0 )
     $         GO TO 130
            IF( icompq.EQ.1 ) THEN
               CALL sgemm( 'N', 'N', qsiz, matsiz, matsiz, one,
     $                     q( 1, submat ), ldq, work( iq-1+iwork( iqptr+
     $                     curr ) ), matsiz, zero, qstore( 1, submat ),
     $                     ldqs )
            END IF
            iwork( iqptr+curr+1 ) = iwork( iqptr+curr ) + matsiz**2
            curr = curr + 1
         END IF
*
*        Start this piece's part of the permutation as 1, 2, ...
*        (indices local to the piece).
*
         k = 1
         DO 60 j = submat, iwork( i+1 )
            iwork( indxq+j ) = k
            k = k + 1
   60    CONTINUE
   70 CONTINUE
*
*     Successively merge eigensystems of adjacent submatrices
*     into eigensystem for the corresponding larger matrix.
*
*     while ( SUBPBS > 1 )
*
      curlvl = 1
   80 CONTINUE
      IF( subpbs.GT.1 ) THEN
         spm2 = subpbs - 2
*
*        Pieces I+1 and I+2 are merged in each iteration.  MATSIZ is
*        the order of the merged problem and MSD2 the order of its
*        leading piece (passed on as the cut point).  CURPRB numbers
*        the merges within the current level, starting from 0.
*
         DO 90 i = 0, spm2, 2
            IF( i.EQ.0 ) THEN
               submat = 1
               matsiz = iwork( 2 )
               msd2 = iwork( 1 )
               curprb = 0
            ELSE
               submat = iwork( i ) + 1
               matsiz = iwork( i+2 ) - iwork( i )
               msd2 = matsiz / 2
               curprb = curprb + 1
            END IF
*
*     Merge lower order eigensystems (of size MSD2 and MATSIZ - MSD2)
*     into an eigensystem of size MATSIZ.
*     SLAED1 is used only for the full eigensystem of a tridiagonal
*     matrix.
*     SLAED7 handles the cases in which eigenvalues only or eigenvalues
*     and eigenvectors of a full symmetric matrix (which was reduced to
*     tridiagonal form) are desired.
*
*     In both calls E(SUBMAT+MSD2-1), the off-diagonal entry at the
*     cut, is passed as RHO, and IWORK(SUBPBS+1) onwards serves as
*     integer scratch space.
*
            IF( icompq.EQ.2 ) THEN
               CALL slaed1( matsiz, d( submat ), q( submat, submat ),
     $                      ldq, iwork( indxq+submat ),
     $                      e( submat+msd2-1 ), msd2, work,
     $                      iwork( subpbs+1 ), info )
            ELSE
               CALL slaed7( icompq, matsiz, qsiz, tlvls, curlvl, curprb,
     $                      d( submat ), qstore( 1, submat ), ldqs,
     $                      iwork( indxq+submat ), e( submat+msd2-1 ),
     $                      msd2, work( iq ), iwork( iqptr ),
     $                      iwork( iprmpt ), iwork( iperm ),
     $                      iwork( igivpt ), iwork( igivcl ),
     $                      work( igivnm ), work( iwrem ),
     $                      iwork( subpbs+1 ), info )
            END IF
            IF( info.NE.0 )
     $         GO TO 130
*
*           The merged piece becomes piece I/2+1 of the next level;
*           record its last row/column index.
*
            iwork( i / 2+1 ) = iwork( i+2 )
   90    CONTINUE
         subpbs = subpbs / 2
         curlvl = curlvl + 1
         GO TO 80
      END IF
*
*     end while
*
*     Re-merge the eigenvalues/vectors which were deflated at the final
*     merge step.
*
*     In every branch the permutation IWORK(INDXQ+1:INDXQ+N) is
*     applied to D via WORK(1:N).  The eigenvector columns are
*     permuted the same way: from QSTORE into Q for ICOMPQ = 1, and
*     from Q into Q, staged through WORK(N+1:N+N*N), for ICOMPQ = 2.
*
      IF( icompq.EQ.1 ) THEN
         DO 100 i = 1, n
            j = iwork( indxq+i )
            work( i ) = d( j )
            CALL scopy( qsiz, qstore( 1, j ), 1, q( 1, i ), 1 )
  100    CONTINUE
         CALL scopy( n, work, 1, d, 1 )
      ELSE IF( icompq.EQ.2 ) THEN
         DO 110 i = 1, n
            j = iwork( indxq+i )
            work( i ) = d( j )
            CALL scopy( n, q( 1, j ), 1, work( n*i+1 ), 1 )
  110    CONTINUE
         CALL scopy( n, work, 1, d, 1 )
         CALL slacpy( 'A', n, n, work( n+1 ), n, q, ldq )
      ELSE
         DO 120 i = 1, n
            j = iwork( indxq+i )
            work( i ) = d( j )
  120    CONTINUE
         CALL scopy( n, work, 1, d, 1 )
      END IF
      GO TO 140
*
*     Failure exit: encode the first and last row/column of the
*     offending submatrix as INFO = first*(N+1) + last, so that they
*     can be recovered as INFO/(N+1) and mod(INFO,N+1).
*
  130 CONTINUE
      info = submat*( n+1 ) + submat + matsiz - 1
*
  140 CONTINUE
      RETURN
*
*     End of SLAED0
*

◆ slaed1()

subroutine slaed1	(	integer	n,
		real, dimension( * )	d,
		real, dimension( ldq, * )	q,
		integer	ldq,
		integer, dimension( * )	indxq,
		real	rho,
		integer	cutpnt,
		real, dimension( * )	work,
		integer, dimension( * )	iwork,
		integer	info )

SLAED1 used by SSTEDC. Computes the updated eigensystem of a diagonal matrix after modification by a rank-one symmetric matrix. Used when the original matrix is tridiagonal.

Download SLAED1 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLAED1 computes the updated eigensystem of a diagonal
!> matrix after modification by a rank-one symmetric matrix.  This
!> routine is used only for the eigenproblem which requires all
!> eigenvalues and eigenvectors of a tridiagonal matrix.  SLAED7 handles
!> the case in which eigenvalues only or eigenvalues and eigenvectors
!> of a full symmetric matrix (which was reduced to tridiagonal form)
!> are desired.
!>
!>   T = Q(in) ( D(in) + RHO * Z*Z**T ) Q**T(in) = Q(out) * D(out) * Q**T(out)
!>
!>    where Z = Q**T*u, u is a vector of length N with ones in the
!>    CUTPNT and CUTPNT + 1 th elements and zeros elsewhere.
!>
!>    The eigenvectors of the original matrix are stored in Q, and the
!>    eigenvalues are in D.  The algorithm consists of three stages:
!>
!>       The first stage consists of deflating the size of the problem
!>       when there are multiple eigenvalues or if there is a zero in
!>       the Z vector.  For each such occurrence the dimension of the
!>       secular equation problem is reduced by one.  This stage is
!>       performed by the routine SLAED2.
!>
!>       The second stage consists of calculating the updated
!>       eigenvalues. This is done by finding the roots of the secular
!>       equation via the routine SLAED4 (as called by SLAED3).
!>       This routine also calculates the eigenvectors of the current
!>       problem.
!>
!>       The final stage consists of computing the updated eigenvectors
!>       directly using the updated eigenvalues.  The eigenvectors for
!>       the current problem are multiplied with the eigenvectors from
!>       the overall problem.
!>

Parameters

[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the eigenvalues of the rank-1-perturbed matrix. !> On exit, the eigenvalues of the repaired matrix. !>
[in,out]	Q	!> Q is REAL array, dimension (LDQ,N) !> On entry, the eigenvectors of the rank-1-perturbed matrix. !> On exit, the eigenvectors of the repaired tridiagonal matrix. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N). !>
[in,out]	INDXQ	!> INDXQ is INTEGER array, dimension (N) !> On entry, the permutation which separately sorts the two !> subproblems in D into ascending order. !> On exit, the permutation which will reintegrate the !> subproblems back into sorted order, !> i.e. D( INDXQ( I = 1, N ) ) will be in ascending order. !>
[in]	RHO	!> RHO is REAL !> The subdiagonal entry used to create the rank-1 modification. !>
[in]	CUTPNT	!> CUTPNT is INTEGER !> The location of the last eigenvalue in the leading sub-matrix. !> min(1,N) <= CUTPNT <= N/2. !>
[out]	WORK	!> WORK is REAL array, dimension (4*N + N**2) !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (4*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: if INFO = 1, an eigenvalue did not converge !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA
Modified by Francoise Tisseur, University of Tennessee

Definition at line 161 of file slaed1.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            CUTPNT, INFO, LDQ, N
      REAL               RHO
*     ..
*     .. Array Arguments ..
      INTEGER            INDXQ( * ), IWORK( * )
      REAL               D( * ), Q( LDQ, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            HALF, J, JCTYP, JDLAM, JPERM, JPERMC, JPERMP,
     $                   JQ2, JS, JW, JZ, NDEFL, NLOW, NSEC
*     ..
*     .. External Subroutines ..
      EXTERNAL           scopy, slaed2, slaed3, slamrg, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  CUTPNT must lie between min(1,N/2)
*     and N/2.
*
      info = 0
      half = n / 2
*
      IF( n.LT.0 ) THEN
         info = -1
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -4
      ELSE IF( cutpnt.LT.min( 1, half ) .OR. cutpnt.GT.half ) THEN
         info = -7
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SLAED1', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty problem
*
      IF( n.EQ.0 ) RETURN
*
*     Carve WORK into four consecutive pieces for SLAED2 and SLAED3:
*     three vectors of length N (z, dlamda, w) followed by Q2.
*
      jz = 1
      jdlam = n + 1
      jw = 2*n + 1
      jq2 = 3*n + 1
*
*     Carve IWORK into four consecutive integer vectors of length N.
*
      jperm = 1
      jpermc = n + 1
      jctyp = 2*n + 1
      jpermp = 3*n + 1
*
*     Build the z-vector: row CUTPNT of the leading block of Q
*     followed by row CUTPNT+1 of the trailing block.
*
      nlow = n - cutpnt
      CALL scopy( cutpnt, q( cutpnt, 1 ), ldq, work( jz ), 1 )
      CALL scopy( nlow, q( cutpnt+1, cutpnt+1 ), ldq,
     $            work( jz+cutpnt ), 1 )
*
*     Deflation.  NSEC returns the order of the secular equation
*     that is left to solve.
*
      CALL slaed2( nsec, n, cutpnt, d, q, ldq, indxq, rho, work( jz ),
     $             work( jdlam ), work( jw ), work( jq2 ),
     $             iwork( jperm ), iwork( jpermc ), iwork( jpermp ),
     $             iwork( jctyp ), info )
      IF( info.NE.0 ) RETURN
*
*     Everything deflated: the sorting permutation is the identity.
*
      IF( nsec.EQ.0 ) THEN
         DO j = 1, n
            indxq( j ) = j
         END DO
         RETURN
      END IF
*
*     Solve the secular equation.  The scratch area for SLAED3
*     starts right behind the part of Q2 sized by the column-type
*     counts that SLAED2 left in IWORK(JCTYP), IWORK(JCTYP+1) and
*     IWORK(JCTYP+2).
*
      js = jq2 + ( iwork( jctyp )+iwork( jctyp+1 ) )*cutpnt +
     $     ( iwork( jctyp+1 )+iwork( jctyp+2 ) )*nlow
      CALL slaed3( nsec, n, cutpnt, d, q, ldq, rho, work( jdlam ),
     $             work( jq2 ), iwork( jpermc ), iwork( jctyp ),
     $             work( jw ), work( js ), info )
      IF( info.NE.0 ) RETURN
*
*     Build the INDXQ sorting permutation by merging the first NSEC
*     entries of D with the remaining N-NSEC entries.
*
      ndefl = n - nsec
      CALL slamrg( nsec, ndefl, d, 1, -1, indxq )
      RETURN
*
*     End of SLAED1
*

◆ slaed2()

subroutine slaed2	(	integer	k,
		integer	n,
		integer	n1,
		real, dimension( * )	d,
		real, dimension( ldq, * )	q,
		integer	ldq,
		integer, dimension( * )	indxq,
		real	rho,
		real, dimension( * )	z,
		real, dimension( * )	dlamda,
		real, dimension( * )	w,
		real, dimension( * )	q2,
		integer, dimension( * )	indx,
		integer, dimension( * )	indxc,
		integer, dimension( * )	indxp,
		integer, dimension( * )	coltyp,
		integer	info )

SLAED2 used by SSTEDC. Merges eigenvalues and deflates secular equation. Used when the original matrix is tridiagonal.

Download SLAED2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLAED2 merges the two sets of eigenvalues together into a single
!> sorted set.  Then it tries to deflate the size of the problem.
!> There are two ways in which deflation can occur:  when two or more
!> eigenvalues are close together or if there is a tiny entry in the
!> Z vector.  For each such occurrence the order of the related secular
!> equation problem is reduced by one.
!>

Parameters

[out]	K	!> K is INTEGER !> The number of non-deflated eigenvalues, and the order of the !> related secular equation. 0 <= K <=N. !>
[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in]	N1	!> N1 is INTEGER !> The location of the last eigenvalue in the leading sub-matrix. !> min(1,N) <= N1 <= N/2. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, D contains the eigenvalues of the two submatrices to !> be combined. !> On exit, D contains the trailing (N-K) updated eigenvalues !> (those which were deflated) sorted into increasing order. !>
[in,out]	Q	!> Q is REAL array, dimension (LDQ, N) !> On entry, Q contains the eigenvectors of two submatrices in !> the two square blocks with corners at (1,1), (N1,N1) !> and (N1+1, N1+1), (N,N). !> On exit, Q contains the trailing (N-K) updated eigenvectors !> (those which were deflated) in its last N-K columns. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N). !>
[in,out]	INDXQ	!> INDXQ is INTEGER array, dimension (N) !> The permutation which separately sorts the two sub-problems !> in D into ascending order. Note that elements in the second !> half of this permutation must first have N1 added to their !> values. Destroyed on exit. !>
[in,out]	RHO	!> RHO is REAL !> On entry, the off-diagonal element associated with the rank-1 !> cut which originally split the two submatrices which are now !> being recombined. !> On exit, RHO has been modified to the value required by !> SLAED3. !>
[in]	Z	!> Z is REAL array, dimension (N) !> On entry, Z contains the updating vector (the last !> row of the first sub-eigenvector matrix and the first row of !> the second sub-eigenvector matrix). !> On exit, the contents of Z have been destroyed by the updating !> process. !>
[out]	DLAMDA	!> DLAMDA is REAL array, dimension (N) !> A copy of the first K eigenvalues which will be used by !> SLAED3 to form the secular equation. !>
[out]	W	!> W is REAL array, dimension (N) !> The first k values of the final deflation-altered z-vector !> which will be passed to SLAED3. !>
[out]	Q2	!> Q2 is REAL array, dimension (N1**2+(N-N1)**2) !> A copy of the first K eigenvectors which will be used by !> SLAED3 in a matrix multiply (SGEMM) to solve for the new !> eigenvectors. !>
[out]	INDX	!> INDX is INTEGER array, dimension (N) !> The permutation used to sort the contents of DLAMDA into !> ascending order. !>
[out]	INDXC	!> INDXC is INTEGER array, dimension (N) !> The permutation used to arrange the columns of the deflated !> Q matrix into three groups: the first group contains non-zero !> elements only at and above N1, the second contains !> non-zero elements only below N1, and the third is dense. !>
[out]	INDXP	!> INDXP is INTEGER array, dimension (N) !> The permutation used to place deflated values of D at the end !> of the array. INDXP(1:K) points to the nondeflated D-values !> and INDXP(K+1:N) points to the deflated eigenvalues. !>
[out]	COLTYP	!> COLTYP is INTEGER array, dimension (N) !> During execution, a label which will indicate which of the !> following types a column in the Q2 matrix is: !> 1 : non-zero in the upper half only; !> 2 : dense; !> 3 : non-zero in the lower half only; !> 4 : deflated. !> On exit, COLTYP(i) is the number of columns of type i, !> for i=1 to 4 only. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA
Modified by Francoise Tisseur, University of Tennessee

Definition at line 210 of file slaed2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, LDQ, N, N1
      REAL               RHO
*     ..
*     .. Array Arguments ..
      INTEGER            COLTYP( * ), INDX( * ), INDXC( * ), INDXP( * ),
     $                   INDXQ( * )
      REAL               D( * ), DLAMDA( * ), Q( LDQ, * ), Q2( * ),
     $                   W( * ), Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               MONE, ZERO, ONE, TWO, EIGHT
      parameter( mone = -1.0e0, zero = 0.0e0, one = 1.0e0,
     $                   two = 2.0e0, eight = 8.0e0 )
*     ..
*     .. Local Arrays ..
      INTEGER            CTOT( 4 ), PSM( 4 )
*     ..
*     .. Local Scalars ..
      INTEGER            CT, I, IMAX, IQ1, IQ2, J, JMAX, JS, K2, N1P1,
     $                   N2, NJ, PJ
      REAL               C, EPS, S, T, TAU, TOL
*     ..
*     .. External Functions ..
      INTEGER            ISAMAX
      REAL               SLAMCH, SLAPY2
      EXTERNAL           isamax, slamch, slapy2
*     ..
*     .. External Subroutines ..
      EXTERNAL           scopy, slacpy, slamrg, srot, sscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
      IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -6
      ELSE IF( min( 1, ( n / 2 ) ).GT.n1 .OR. ( n / 2 ).LT.n1 ) THEN
         info = -3
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SLAED2', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
      n2 = n - n1
      n1p1 = n1 + 1
*
      IF( rho.LT.zero ) THEN
         CALL sscal( n2, mone, z( n1p1 ), 1 )
      END IF
*
*     Normalize z so that norm(z) = 1.  Since z is the concatenation of
*     two normalized vectors, norm2(z) = sqrt(2).
*
      t = one / sqrt( two )
      CALL sscal( n, t, z, 1 )
*
*     RHO = ABS( norm(z)**2 * RHO )
*
      rho = abs( two*rho )
*
*     Sort the eigenvalues into increasing order
*
      DO 10 i = n1p1, n
         indxq( i ) = indxq( i ) + n1
   10 CONTINUE
*
*     re-integrate the deflated parts from the last pass
*
      DO 20 i = 1, n
         dlamda( i ) = d( indxq( i ) )
   20 CONTINUE
      CALL slamrg( n1, n2, dlamda, 1, 1, indxc )
      DO 30 i = 1, n
         indx( i ) = indxq( indxc( i ) )
   30 CONTINUE
*
*     Calculate the allowable deflation tolerance
*
      imax = isamax( n, z, 1 )
      jmax = isamax( n, d, 1 )
      eps = slamch( 'Epsilon' )
      tol = eight*eps*max( abs( d( jmax ) ), abs( z( imax ) ) )
*
*     If the rank-1 modifier is small enough, no more needs to be done
*     except to reorganize Q so that its columns correspond with the
*     elements in D.
*
      IF( rho*abs( z( imax ) ).LE.tol ) THEN
         k = 0
         iq2 = 1
         DO 40 j = 1, n
            i = indx( j )
            CALL scopy( n, q( 1, i ), 1, q2( iq2 ), 1 )
            dlamda( j ) = d( i )
            iq2 = iq2 + n
   40    CONTINUE
         CALL slacpy( 'A', n, n, q2, n, q, ldq )
         CALL scopy( n, dlamda, 1, d, 1 )
         GO TO 190
      END IF
*
*     If there are multiple eigenvalues then the problem deflates.  Here
*     the number of equal eigenvalues is found.  As each equal
*     eigenvalue is found, a plane rotation is computed to rotate
*     the corresponding eigensubspace so that the corresponding
*     components of Z are zero in this new basis.
*
      DO 50 i = 1, n1
         coltyp( i ) = 1
   50 CONTINUE
      DO 60 i = n1p1, n
         coltyp( i ) = 3
   60 CONTINUE
*
*
      k = 0
      k2 = n + 1
      DO 70 j = 1, n
         nj = indx( j )
         IF( rho*abs( z( nj ) ).LE.tol ) THEN
*
*           Deflate due to small z component.
*
            k2 = k2 - 1
            coltyp( nj ) = 4
            indxp( k2 ) = nj
            IF( j.EQ.n )
     $         GO TO 100
         ELSE
            pj = nj
            GO TO 80
         END IF
   70 CONTINUE
   80 CONTINUE
      j = j + 1
      nj = indx( j )
      IF( j.GT.n )
     $   GO TO 100
      IF( rho*abs( z( nj ) ).LE.tol ) THEN
*
*        Deflate due to small z component.
*
         k2 = k2 - 1
         coltyp( nj ) = 4
         indxp( k2 ) = nj
      ELSE
*
*        Check if eigenvalues are close enough to allow deflation.
*
         s = z( pj )
         c = z( nj )
*
*        Find sqrt(a**2+b**2) without overflow or
*        destructive underflow.
*
         tau = slapy2( c, s )
         t = d( nj ) - d( pj )
         c = c / tau
         s = -s / tau
         IF( abs( t*c*s ).LE.tol ) THEN
*
*           Deflation is possible.
*
            z( nj ) = tau
            z( pj ) = zero
            IF( coltyp( nj ).NE.coltyp( pj ) )
     $         coltyp( nj ) = 2
            coltyp( pj ) = 4
            CALL srot( n, q( 1, pj ), 1, q( 1, nj ), 1, c, s )
            t = d( pj )*c**2 + d( nj )*s**2
            d( nj ) = d( pj )*s**2 + d( nj )*c**2
            d( pj ) = t
            k2 = k2 - 1
            i = 1
   90       CONTINUE
            IF( k2+i.LE.n ) THEN
               IF( d( pj ).LT.d( indxp( k2+i ) ) ) THEN
                  indxp( k2+i-1 ) = indxp( k2+i )
                  indxp( k2+i ) = pj
                  i = i + 1
                  GO TO 90
               ELSE
                  indxp( k2+i-1 ) = pj
               END IF
            ELSE
               indxp( k2+i-1 ) = pj
            END IF
            pj = nj
         ELSE
            k = k + 1
            dlamda( k ) = d( pj )
            w( k ) = z( pj )
            indxp( k ) = pj
            pj = nj
         END IF
      END IF
      GO TO 80
  100 CONTINUE
*
*     Record the last eigenvalue.
*
      k = k + 1
      dlamda( k ) = d( pj )
      w( k ) = z( pj )
      indxp( k ) = pj
*
*     Count up the total number of the various types of columns, then
*     form a permutation which positions the four column types into
*     four uniform groups (although one or more of these groups may be
*     empty).
*
      DO 110 j = 1, 4
         ctot( j ) = 0
  110 CONTINUE
      DO 120 j = 1, n
         ct = coltyp( j )
         ctot( ct ) = ctot( ct ) + 1
  120 CONTINUE
*
*     PSM(*) = Position in SubMatrix (of types 1 through 4)
*
      psm( 1 ) = 1
      psm( 2 ) = 1 + ctot( 1 )
      psm( 3 ) = psm( 2 ) + ctot( 2 )
      psm( 4 ) = psm( 3 ) + ctot( 3 )
      k = n - ctot( 4 )
*
*     Fill out the INDXC array so that the permutation which it induces
*     will place all type-1 columns first, all type-2 columns next,
*     then all type-3's, and finally all type-4's.
*
      DO 130 j = 1, n
         js = indxp( j )
         ct = coltyp( js )
         indx( psm( ct ) ) = js
         indxc( psm( ct ) ) = j
         psm( ct ) = psm( ct ) + 1
  130 CONTINUE
*
*     Sort the eigenvalues and corresponding eigenvectors into DLAMDA
*     and Q2 respectively.  The eigenvalues/vectors which were not
*     deflated go into the first K slots of DLAMDA and Q2 respectively,
*     while those which were deflated go into the last N - K slots.
*
      i = 1
      iq1 = 1
      iq2 = 1 + ( ctot( 1 )+ctot( 2 ) )*n1
      DO 140 j = 1, ctot( 1 )
         js = indx( i )
         CALL scopy( n1, q( 1, js ), 1, q2( iq1 ), 1 )
         z( i ) = d( js )
         i = i + 1
         iq1 = iq1 + n1
  140 CONTINUE
*
      DO 150 j = 1, ctot( 2 )
         js = indx( i )
         CALL scopy( n1, q( 1, js ), 1, q2( iq1 ), 1 )
         CALL scopy( n2, q( n1+1, js ), 1, q2( iq2 ), 1 )
         z( i ) = d( js )
         i = i + 1
         iq1 = iq1 + n1
         iq2 = iq2 + n2
  150 CONTINUE
*
      DO 160 j = 1, ctot( 3 )
         js = indx( i )
         CALL scopy( n2, q( n1+1, js ), 1, q2( iq2 ), 1 )
         z( i ) = d( js )
         i = i + 1
         iq2 = iq2 + n2
  160 CONTINUE
*
      iq1 = iq2
      DO 170 j = 1, ctot( 4 )
         js = indx( i )
         CALL scopy( n, q( 1, js ), 1, q2( iq2 ), 1 )
         iq2 = iq2 + n
         z( i ) = d( js )
         i = i + 1
  170 CONTINUE
*
*     The deflated eigenvalues and their corresponding vectors go back
*     into the last N - K slots of D and Q respectively.
*
      IF( k.LT.n ) THEN
         CALL slacpy( 'A', n, ctot( 4 ), q2( iq1 ), n,
     $                q( 1, k+1 ), ldq )
         CALL scopy( n-k, z( k+1 ), 1, d( k+1 ), 1 )
      END IF
*
*     Copy CTOT into COLTYP for referencing in SLAED3.
*
      DO 180 j = 1, 4
         coltyp( j ) = ctot( j )
  180 CONTINUE
*
  190 CONTINUE
      RETURN
*
*     End of SLAED2
*

◆ slaed3()

subroutine slaed3	(	integer	k,
		integer	n,
		integer	n1,
		real, dimension( * )	d,
		real, dimension( ldq, * )	q,
		integer	ldq,
		real	rho,
		real, dimension( * )	dlamda,
		real, dimension( * )	q2,
		integer, dimension( * )	indx,
		integer, dimension( * )	ctot,
		real, dimension( * )	w,
		real, dimension( * )	s,
		integer	info )

SLAED3 used by SSTEDC. Finds the roots of the secular equation and updates the eigenvectors. Used when the original matrix is tridiagonal.

Download SLAED3 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLAED3 finds the K roots of the secular equation defined by RHO
!> and the first K values in DLAMDA and W.  It makes the
!> appropriate calls to SLAED4 and then updates the eigenvectors by
!> multiplying the matrix of eigenvectors of the pair of eigensystems
!> being combined by the matrix of eigenvectors of the K-by-K system
!> which is solved here.
!>
!> This code makes very mild assumptions about floating point
!> arithmetic. It will work on machines with a guard digit in
!> add/subtract, or on those binary machines without guard digits
!> which subtract like the Cray X-MP, Cray Y-MP, Cray C-90, or Cray-2.
!> It could conceivably fail on hexadecimal or decimal machines
!> without guard digits, but we know of none.
!>

Parameters

[in]	K	!> K is INTEGER !> The number of terms in the rational function to be solved by !> SLAED4. K >= 0. !>
[in]	N	!> N is INTEGER !> The number of rows and columns in the Q matrix. !> N >= K (deflation may result in N>K). !>
[in]	N1	!> N1 is INTEGER !> The location of the last eigenvalue in the leading submatrix. !> min(1,N) <= N1 <= N/2. !>
[out]	D	!> D is REAL array, dimension (N) !> D(I) contains the updated eigenvalues for !> 1 <= I <= K. !>
[out]	Q	!> Q is REAL array, dimension (LDQ,N) !> Initially the first K columns are used as workspace. !> On output the columns 1 to K contain !> the updated eigenvectors. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N). !>
[in]	RHO	!> RHO is REAL !> The value of the parameter in the rank one update equation. !> RHO >= 0 required. !>
[in,out]	DLAMDA	!> DLAMDA is REAL array, dimension (K) !> The first K elements of this array contain the old roots !> of the deflated updating problem. These are the poles !> of the secular equation. May be changed on output by !> having lowest order bit set to zero on Cray X-MP, Cray Y-MP, !> Cray-2, or Cray C-90, as described above. !>
[in]	Q2	!> Q2 is REAL array, dimension (LDQ2*N) !> The first K columns of this matrix contain the non-deflated !> eigenvectors for the split problem. !>
[in]	INDX	!> INDX is INTEGER array, dimension (N) !> The permutation used to arrange the columns of the deflated !> Q matrix into three groups (see SLAED2). !> The rows of the eigenvectors found by SLAED4 must be likewise !> permuted before the matrix multiply can take place. !>
[in]	CTOT	!> CTOT is INTEGER array, dimension (4) !> A count of the total number of the various types of columns !> in Q, as described in INDX. The fourth column type is any !> column which has been deflated. !>
[in,out]	W	!> W is REAL array, dimension (K) !> The first K elements of this array contain the components !> of the deflation-adjusted updating vector. Destroyed on !> output. !>
[out]	S	!> S is REAL array, dimension (N1 + 1)*K !> Will contain the eigenvectors of the repaired matrix which !> will be multiplied by the previously accumulated eigenvectors !> to update the system. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: if INFO = 1, an eigenvalue did not converge !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA
Modified by Francoise Tisseur, University of Tennessee

Definition at line 183 of file slaed3.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Outline of the body below:
*       1. validate K, N and LDQ;
*       2. call SLAED4 once per root, storing root J in D(J) and the
*          DELTA vector it returns in column J of Q;
*       3. rebuild W from those columns and turn every column into a
*          normalized vector whose rows are permuted through INDX;
*       4. multiply the two blocks stored in Q2 by the matching rows
*          of that K-column matrix (SGEMM), writing the result to Q.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, LDQ, N, N1
      REAL               RHO
*     ..
*     .. Array Arguments ..
      INTEGER            CTOT( * ), INDX( * )
      REAL               D( * ), DLAMDA( * ), Q( LDQ, * ), Q2( * ),
     $                   S( * ), W( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      PARAMETER          ( ONE = 1.0E0, ZERO = 0.0E0 )
*     ..
*     .. Local Scalars ..
*     IROW, JCOL : row / column loop counters
*     NR2        : N - N1, number of rows in the trailing block
*     NC12, NC23 : CTOT(1)+CTOT(2) and CTOT(2)+CTOT(3)
*     IOFF2      : position in Q2 where the second stored block starts
*     VNORM      : 2-norm of the vector currently being normalized
      INTEGER            IOFF2, IROW, JCOL, NC12, NC23, NR2
      REAL               VNORM
*     ..
*     .. External Functions ..
      REAL               SLAMC3, SNRM2
      EXTERNAL           SLAMC3, SNRM2
*     ..
*     .. External Subroutines ..
      EXTERNAL           SCOPY, SGEMM, SLACPY, SLAED4, SLASET, XERBLA
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX, SIGN, SQRT
*     ..
*     .. Executable Statements ..
*
*     Argument checks.  Only the first violated condition is recorded.
*
      IF( k.LT.0 ) THEN
         info = -1
      ELSE IF( k.GT.n ) THEN
         info = -2
      ELSE IF( max( 1, n ).GT.ldq ) THEN
         info = -6
      ELSE
         info = 0
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SLAED3', -info )
         RETURN
      END IF
*
*     Nothing to solve when there are no terms.
*
      IF( k.EQ.0 ) RETURN
*
*     Replace every DLAMDA(I) by (DLAMDA(I)+DLAMDA(I)) - DLAMDA(I).
*     On binary machines with a guard digit this leaves the value
*     untouched; on machines lacking a guard digit in add/subtract
*     (Cray X-MP, Y-MP, C-90, Cray-2) it clears the lowest bit so that
*     the later differences DLAMDA(I)-DLAMDA(J) are computed to high
*     relative accuracy.  The sum goes through SLAMC3 so that an
*     optimizing compiler cannot simplify the expression away.
*
      DO irow = 1, k
         dlamda( irow ) = slamc3( dlamda( irow ), dlamda( irow ) ) -
     $                    dlamda( irow )
      END DO
*
*     One SLAED4 call per root.  Column JCOL of Q serves as the DELTA
*     output of SLAED4 and D(JCOL) receives the root.  A nonzero INFO
*     from the root finder ends the computation at once and is handed
*     back to the caller unchanged.
*
      DO jcol = 1, k
         CALL slaed4( k, jcol, dlamda, w, q( 1, jcol ), rho,
     $                d( jcol ), info )
         IF( info.NE.0 ) RETURN
      END DO
*
*     K = 1 needs no further preparation.  K = 2 only permutes the two
*     rows of each column through INDX (W is used as scratch).  Larger
*     K rebuilds W and forms normalized columns.
*
      IF( k.EQ.2 ) THEN
         DO jcol = 1, k
            w( 1 ) = q( 1, jcol )
            w( 2 ) = q( 2, jcol )
            q( 1, jcol ) = w( indx( 1 ) )
            q( 2, jcol ) = w( indx( 2 ) )
         END DO
      ELSE IF( k.GT.2 ) THEN
*
*        Keep the incoming W in S; only its signs are needed later.
*
         CALL scopy( k, w, 1, s, 1 )
*
*        Start from the diagonal, W(I) = Q(I,I), then multiply in
*        Q(I,J) / ( DLAMDA(I)-DLAMDA(J) ) for every J different from I.
*
         CALL scopy( k, q, ldq+1, w, 1 )
         DO jcol = 1, k
            DO irow = 1, jcol - 1
               w( irow ) = w( irow )*( q( irow, jcol ) /
     $                     ( dlamda( irow )-dlamda( jcol ) ) )
            END DO
            DO irow = jcol + 1, k
               w( irow ) = w( irow )*( q( irow, jcol ) /
     $                     ( dlamda( irow )-dlamda( jcol ) ) )
            END DO
         END DO
*
*        New magnitude SQRT(-W(I)), sign taken from the saved value.
*
         DO irow = 1, k
            w( irow ) = sign( sqrt( -w( irow ) ), s( irow ) )
         END DO
*
*        Eigenvectors of the modified rank-1 modification: divide W
*        elementwise by column JCOL, scale to unit 2-norm and store
*        the rows back in the order given by INDX.
*
         DO jcol = 1, k
            DO irow = 1, k
               s( irow ) = w( irow ) / q( irow, jcol )
            END DO
            vnorm = snrm2( k, s, 1 )
            DO irow = 1, k
               q( irow, jcol ) = s( indx( irow ) ) / vnorm
            END DO
         END DO
      END IF
*
*     Compute the updated eigenvectors.
*
*     Q2 is read as an N1-by-NC12 block followed, from position IOFF2,
*     by an NR2-by-NC23 block.  The trailing NR2 rows of Q are formed
*     first because they consume rows CTOT(1)+1 onward of Q, which are
*     copied into S before the leading N1 rows of Q are overwritten.
*
      nr2 = n - n1
      nc12 = ctot( 1 ) + ctot( 2 )
      nc23 = ctot( 2 ) + ctot( 3 )
      ioff2 = n1*nc12 + 1
*
      CALL slacpy( 'A', nc23, k, q( ctot( 1 )+1, 1 ), ldq, s, nc23 )
      IF( nc23.EQ.0 ) THEN
         CALL slaset( 'A', nr2, k, zero, zero, q( n1+1, 1 ), ldq )
      ELSE
         CALL sgemm( 'N', 'N', nr2, k, nc23, one, q2( ioff2 ), nr2,
     $               s, nc23, zero, q( n1+1, 1 ), ldq )
      END IF
*
      CALL slacpy( 'A', nc12, k, q, ldq, s, nc12 )
      IF( nc12.EQ.0 ) THEN
         CALL slaset( 'A', n1, k, zero, zero, q( 1, 1 ), ldq )
      ELSE
         CALL sgemm( 'N', 'N', n1, k, nc12, one, q2, n1, s, nc12,
     $               zero, q, ldq )
      END IF
*
      RETURN
*
*     End of SLAED3
*

◆ slaed4()

subroutine slaed4	(	integer	n,
		integer	i,
		real, dimension( * )	d,
		real, dimension( * )	z,
		real, dimension( * )	delta,
		real	rho,
		real	dlam,
		integer	info )

SLAED4 used by SSTEDC. Finds a single root of the secular equation.

Download SLAED4 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> This subroutine computes the I-th updated eigenvalue of a symmetric
!> rank-one modification to a diagonal matrix whose elements are
!> given in the array D.  It is assumed that
!>
!>            D(i) < D(j)  for  i < j
!>
!> and that RHO > 0.  This is arranged by the calling routine, and is
!> no loss in generality.  The rank-one modified system is thus
!>
!>            diag( D )  +  RHO * Z * Z_transpose.
!>
!> where we assume the Euclidean norm of Z is 1.
!>
!> The method consists of approximating the rational functions in the
!> secular equation by simpler interpolating rational functions.
!>

Parameters

[in]	N	!> N is INTEGER !> The length of all arrays. !>
[in]	I	!> I is INTEGER !> The index of the eigenvalue to be computed. 1 <= I <= N. !>
[in]	D	!> D is REAL array, dimension (N) !> The original eigenvalues. It is assumed that they are in !> order, D(I) < D(J) for I < J. !>
[in]	Z	!> Z is REAL array, dimension (N) !> The components of the updating vector. !>
[out]	DELTA	!> DELTA is REAL array, dimension (N) !> If N > 2, DELTA contains (D(j) - lambda_I) in its j-th !> component. If N = 1, then DELTA(1) = 1. If N = 2, see SLAED5 !> for detail. The vector DELTA contains the information necessary !> to construct the eigenvectors by SLAED3 and SLAED9. !>
[in]	RHO	!> RHO is REAL !> The scalar in the symmetric updating formula. !>
[out]	DLAM	!> DLAM is REAL !> The computed lambda_I, the I-th updated eigenvalue. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> > 0: if INFO = 1, the updating process failed. !>

Internal Parameters:

!>  Logical variable ORGATI (origin-at-i?) is used for distinguishing
!>  whether D(i) or D(i+1) is treated as the origin.
!>
!>            ORGATI = .true.    origin at i
!>            ORGATI = .false.   origin at i+1
!>
!>   Logical variable SWTCH3 (switch-for-3-poles?) is for noting
!>   if we are working with THREE poles!
!>
!>   MAXIT is the maximum number of iterations allowed for each
!>   eigenvalue.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Ren-Cang Li, Computer Science Division, University of California at Berkeley, USA

Definition at line 144 of file slaed4.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            I, INFO, N
      REAL               DLAM, RHO
*     ..
*     .. Array Arguments ..
      REAL               D( * ), DELTA( * ), Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            MAXIT
      parameter( maxit = 30 )
      REAL               ZERO, ONE, TWO, THREE, FOUR, EIGHT, TEN
      parameter( zero = 0.0e0, one = 1.0e0, two = 2.0e0,
     $                   three = 3.0e0, four = 4.0e0, eight = 8.0e0,
     $                   ten = 10.0e0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            ORGATI, SWTCH, SWTCH3
      INTEGER            II, IIM1, IIP1, IP1, ITER, J, NITER
      REAL               A, B, C, DEL, DLTLB, DLTUB, DPHI, DPSI, DW,
     $                   EPS, ERRETM, ETA, MIDPT, PHI, PREW, PSI,
     $                   RHOINV, TAU, TEMP, TEMP1, W
*     ..
*     .. Local Arrays ..
      REAL               ZZ( 3 )
*     ..
*     .. External Functions ..
      REAL               SLAMCH
      EXTERNAL           slamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           slaed5, slaed6
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     Since this routine is called in an inner loop, we do no argument
*     checking.
*
*     Quick return for N=1 and 2.
*
      info = 0
      IF( n.EQ.1 ) THEN
*
*         Presumably, I=1 upon entry
*
         dlam = d( 1 ) + rho*z( 1 )*z( 1 )
         delta( 1 ) = one
         RETURN
      END IF
      IF( n.EQ.2 ) THEN
         CALL slaed5( i, d, z, delta, rho, dlam )
         RETURN
      END IF
*
*     Compute machine epsilon
*
      eps = slamch( 'Epsilon' )
      rhoinv = one / rho
*
*     The case I = N
*
      IF( i.EQ.n ) THEN
*
*        Initialize some basic variables
*
         ii = n - 1
         niter = 1
*
*        Calculate initial guess
*
         midpt = rho / two
*
*        If ||Z||_2 is not one, then MIDPT should be set to
*        RHO * ||Z||_2^2 / TWO
*
         DO 10 j = 1, n
            delta( j ) = ( d( j )-d( i ) ) - midpt
   10    CONTINUE
*
         psi = zero
         DO 20 j = 1, n - 2
            psi = psi + z( j )*z( j ) / delta( j )
   20    CONTINUE
*
         c = rhoinv + psi
         w = c + z( ii )*z( ii ) / delta( ii ) +
     $       z( n )*z( n ) / delta( n )
*
         IF( w.LE.zero ) THEN
            temp = z( n-1 )*z( n-1 ) / ( d( n )-d( n-1 )+rho ) +
     $             z( n )*z( n ) / rho
            IF( c.LE.temp ) THEN
               tau = rho
            ELSE
               del = d( n ) - d( n-1 )
               a = -c*del + z( n-1 )*z( n-1 ) + z( n )*z( n )
               b = z( n )*z( n )*del
               IF( a.LT.zero ) THEN
                  tau = two*b / ( sqrt( a*a+four*b*c )-a )
               ELSE
                  tau = ( a+sqrt( a*a+four*b*c ) ) / ( two*c )
               END IF
            END IF
*
*           It can be proved that
*               D(N)+RHO/2 <= LAMBDA(N) < D(N)+TAU <= D(N)+RHO
*
            dltlb = midpt
            dltub = rho
         ELSE
            del = d( n ) - d( n-1 )
            a = -c*del + z( n-1 )*z( n-1 ) + z( n )*z( n )
            b = z( n )*z( n )*del
            IF( a.LT.zero ) THEN
               tau = two*b / ( sqrt( a*a+four*b*c )-a )
            ELSE
               tau = ( a+sqrt( a*a+four*b*c ) ) / ( two*c )
            END IF
*
*           It can be proved that
*               D(N) < D(N)+TAU < LAMBDA(N) < D(N)+RHO/2
*
            dltlb = zero
            dltub = midpt
         END IF
*
         DO 30 j = 1, n
            delta( j ) = ( d( j )-d( i ) ) - tau
   30    CONTINUE
*
*        Evaluate PSI and the derivative DPSI
*
         dpsi = zero
         psi = zero
         erretm = zero
         DO 40 j = 1, ii
            temp = z( j ) / delta( j )
            psi = psi + z( j )*temp
            dpsi = dpsi + temp*temp
            erretm = erretm + psi
   40    CONTINUE
         erretm = abs( erretm )
*
*        Evaluate PHI and the derivative DPHI
*
         temp = z( n ) / delta( n )
         phi = z( n )*temp
         dphi = temp*temp
         erretm = eight*( -phi-psi ) + erretm - phi + rhoinv +
     $            abs( tau )*( dpsi+dphi )
*
         w = rhoinv + phi + psi
*
*        Test for convergence
*
         IF( abs( w ).LE.eps*erretm ) THEN
            dlam = d( i ) + tau
            GO TO 250
         END IF
*
         IF( w.LE.zero ) THEN
            dltlb = max( dltlb, tau )
         ELSE
            dltub = min( dltub, tau )
         END IF
*
*        Calculate the new step
*
         niter = niter + 1
         c = w - delta( n-1 )*dpsi - delta( n )*dphi
         a = ( delta( n-1 )+delta( n ) )*w -
     $       delta( n-1 )*delta( n )*( dpsi+dphi )
         b = delta( n-1 )*delta( n )*w
         IF( c.LT.zero )
     $      c = abs( c )
         IF( c.EQ.zero ) THEN
*          ETA = B/A
*           ETA = RHO - TAU
            eta = dltub - tau
         ELSE IF( a.GE.zero ) THEN
            eta = ( a+sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
         ELSE
            eta = two*b / ( a-sqrt( abs( a*a-four*b*c ) ) )
         END IF
*
*        Note, eta should be positive if w is negative, and
*        eta should be negative otherwise. However,
*        if for some reason caused by roundoff, eta*w > 0,
*        we simply use one Newton step instead. This way
*        will guarantee eta*w < 0.
*
         IF( w*eta.GT.zero )
     $      eta = -w / ( dpsi+dphi )
         temp = tau + eta
         IF( temp.GT.dltub .OR. temp.LT.dltlb ) THEN
            IF( w.LT.zero ) THEN
               eta = ( dltub-tau ) / two
            ELSE
               eta = ( dltlb-tau ) / two
            END IF
         END IF
         DO 50 j = 1, n
            delta( j ) = delta( j ) - eta
   50    CONTINUE
*
         tau = tau + eta
*
*        Evaluate PSI and the derivative DPSI
*
         dpsi = zero
         psi = zero
         erretm = zero
         DO 60 j = 1, ii
            temp = z( j ) / delta( j )
            psi = psi + z( j )*temp
            dpsi = dpsi + temp*temp
            erretm = erretm + psi
   60    CONTINUE
         erretm = abs( erretm )
*
*        Evaluate PHI and the derivative DPHI
*
         temp = z( n ) / delta( n )
         phi = z( n )*temp
         dphi = temp*temp
         erretm = eight*( -phi-psi ) + erretm - phi + rhoinv +
     $            abs( tau )*( dpsi+dphi )
*
         w = rhoinv + phi + psi
*
*        Main loop to update the values of the array   DELTA
*
         iter = niter + 1
*
         DO 90 niter = iter, maxit
*
*           Test for convergence
*
            IF( abs( w ).LE.eps*erretm ) THEN
               dlam = d( i ) + tau
               GO TO 250
            END IF
*
            IF( w.LE.zero ) THEN
               dltlb = max( dltlb, tau )
            ELSE
               dltub = min( dltub, tau )
            END IF
*
*           Calculate the new step
*
            c = w - delta( n-1 )*dpsi - delta( n )*dphi
            a = ( delta( n-1 )+delta( n ) )*w -
     $          delta( n-1 )*delta( n )*( dpsi+dphi )
            b = delta( n-1 )*delta( n )*w
            IF( a.GE.zero ) THEN
               eta = ( a+sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
            ELSE
               eta = two*b / ( a-sqrt( abs( a*a-four*b*c ) ) )
            END IF
*
*           Note, eta should be positive if w is negative, and
*           eta should be negative otherwise. However,
*           if for some reason caused by roundoff, eta*w > 0,
*           we simply use one Newton step instead. This way
*           will guarantee eta*w < 0.
*
            IF( w*eta.GT.zero )
     $         eta = -w / ( dpsi+dphi )
            temp = tau + eta
            IF( temp.GT.dltub .OR. temp.LT.dltlb ) THEN
               IF( w.LT.zero ) THEN
                  eta = ( dltub-tau ) / two
               ELSE
                  eta = ( dltlb-tau ) / two
               END IF
            END IF
            DO 70 j = 1, n
               delta( j ) = delta( j ) - eta
   70       CONTINUE
*
            tau = tau + eta
*
*           Evaluate PSI and the derivative DPSI
*
            dpsi = zero
            psi = zero
            erretm = zero
            DO 80 j = 1, ii
               temp = z( j ) / delta( j )
               psi = psi + z( j )*temp
               dpsi = dpsi + temp*temp
               erretm = erretm + psi
   80       CONTINUE
            erretm = abs( erretm )
*
*           Evaluate PHI and the derivative DPHI
*
            temp = z( n ) / delta( n )
            phi = z( n )*temp
            dphi = temp*temp
            erretm = eight*( -phi-psi ) + erretm - phi + rhoinv +
     $               abs( tau )*( dpsi+dphi )
*
            w = rhoinv + phi + psi
   90    CONTINUE
*
*        Return with INFO = 1, NITER = MAXIT and not converged
*
         info = 1
         dlam = d( i ) + tau
         GO TO 250
*
*        End for the case I = N
*
      ELSE
*
*        The case for I < N
*
         niter = 1
         ip1 = i + 1
*
*        Calculate initial guess
*
         del = d( ip1 ) - d( i )
         midpt = del / two
         DO 100 j = 1, n
            delta( j ) = ( d( j )-d( i ) ) - midpt
  100    CONTINUE
*
         psi = zero
         DO 110 j = 1, i - 1
            psi = psi + z( j )*z( j ) / delta( j )
  110    CONTINUE
*
         phi = zero
         DO 120 j = n, i + 2, -1
            phi = phi + z( j )*z( j ) / delta( j )
  120    CONTINUE
         c = rhoinv + psi + phi
         w = c + z( i )*z( i ) / delta( i ) +
     $       z( ip1 )*z( ip1 ) / delta( ip1 )
*
         IF( w.GT.zero ) THEN
*
*           d(i)< the ith eigenvalue < (d(i)+d(i+1))/2
*
*           We choose d(i) as origin.
*
            orgati = .true.
            a = c*del + z( i )*z( i ) + z( ip1 )*z( ip1 )
            b = z( i )*z( i )*del
            IF( a.GT.zero ) THEN
               tau = two*b / ( a+sqrt( abs( a*a-four*b*c ) ) )
            ELSE
               tau = ( a-sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
            END IF
            dltlb = zero
            dltub = midpt
         ELSE
*
*           (d(i)+d(i+1))/2 <= the ith eigenvalue < d(i+1)
*
*           We choose d(i+1) as origin.
*
            orgati = .false.
            a = c*del - z( i )*z( i ) - z( ip1 )*z( ip1 )
            b = z( ip1 )*z( ip1 )*del
            IF( a.LT.zero ) THEN
               tau = two*b / ( a-sqrt( abs( a*a+four*b*c ) ) )
            ELSE
               tau = -( a+sqrt( abs( a*a+four*b*c ) ) ) / ( two*c )
            END IF
            dltlb = -midpt
            dltub = zero
         END IF
*
         IF( orgati ) THEN
            DO 130 j = 1, n
               delta( j ) = ( d( j )-d( i ) ) - tau
  130       CONTINUE
         ELSE
            DO 140 j = 1, n
               delta( j ) = ( d( j )-d( ip1 ) ) - tau
  140       CONTINUE
         END IF
         IF( orgati ) THEN
            ii = i
         ELSE
            ii = i + 1
         END IF
         iim1 = ii - 1
         iip1 = ii + 1
*
*        Evaluate PSI and the derivative DPSI
*
         dpsi = zero
         psi = zero
         erretm = zero
         DO 150 j = 1, iim1
            temp = z( j ) / delta( j )
            psi = psi + z( j )*temp
            dpsi = dpsi + temp*temp
            erretm = erretm + psi
  150    CONTINUE
         erretm = abs( erretm )
*
*        Evaluate PHI and the derivative DPHI
*
         dphi = zero
         phi = zero
         DO 160 j = n, iip1, -1
            temp = z( j ) / delta( j )
            phi = phi + z( j )*temp
            dphi = dphi + temp*temp
            erretm = erretm + phi
  160    CONTINUE
*
         w = rhoinv + phi + psi
*
*        W is the value of the secular function with
*        its ii-th element removed.
*
         swtch3 = .false.
         IF( orgati ) THEN
            IF( w.LT.zero )
     $         swtch3 = .true.
         ELSE
            IF( w.GT.zero )
     $         swtch3 = .true.
         END IF
         IF( ii.EQ.1 .OR. ii.EQ.n )
     $      swtch3 = .false.
*
         temp = z( ii ) / delta( ii )
         dw = dpsi + dphi + temp*temp
         temp = z( ii )*temp
         w = w + temp
         erretm = eight*( phi-psi ) + erretm + two*rhoinv +
     $            three*abs( temp ) + abs( tau )*dw
*
*        Test for convergence
*
         IF( abs( w ).LE.eps*erretm ) THEN
            IF( orgati ) THEN
               dlam = d( i ) + tau
            ELSE
               dlam = d( ip1 ) + tau
            END IF
            GO TO 250
         END IF
*
         IF( w.LE.zero ) THEN
            dltlb = max( dltlb, tau )
         ELSE
            dltub = min( dltub, tau )
         END IF
*
*        Calculate the new step
*
         niter = niter + 1
         IF( .NOT.swtch3 ) THEN
            IF( orgati ) THEN
               c = w - delta( ip1 )*dw - ( d( i )-d( ip1 ) )*
     $             ( z( i ) / delta( i ) )**2
            ELSE
               c = w - delta( i )*dw - ( d( ip1 )-d( i ) )*
     $             ( z( ip1 ) / delta( ip1 ) )**2
            END IF
            a = ( delta( i )+delta( ip1 ) )*w -
     $          delta( i )*delta( ip1 )*dw
            b = delta( i )*delta( ip1 )*w
            IF( c.EQ.zero ) THEN
               IF( a.EQ.zero ) THEN
                  IF( orgati ) THEN
                     a = z( i )*z( i ) + delta( ip1 )*delta( ip1 )*
     $                   ( dpsi+dphi )
                  ELSE
                     a = z( ip1 )*z( ip1 ) + delta( i )*delta( i )*
     $                   ( dpsi+dphi )
                  END IF
               END IF
               eta = b / a
            ELSE IF( a.LE.zero ) THEN
               eta = ( a-sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
            ELSE
               eta = two*b / ( a+sqrt( abs( a*a-four*b*c ) ) )
            END IF
         ELSE
*
*           Interpolation using THREE most relevant poles
*
            temp = rhoinv + psi + phi
            IF( orgati ) THEN
               temp1 = z( iim1 ) / delta( iim1 )
               temp1 = temp1*temp1
               c = temp - delta( iip1 )*( dpsi+dphi ) -
     $             ( d( iim1 )-d( iip1 ) )*temp1
               zz( 1 ) = z( iim1 )*z( iim1 )
               zz( 3 ) = delta( iip1 )*delta( iip1 )*
     $                   ( ( dpsi-temp1 )+dphi )
            ELSE
               temp1 = z( iip1 ) / delta( iip1 )
               temp1 = temp1*temp1
               c = temp - delta( iim1 )*( dpsi+dphi ) -
     $             ( d( iip1 )-d( iim1 ) )*temp1
               zz( 1 ) = delta( iim1 )*delta( iim1 )*
     $                   ( dpsi+( dphi-temp1 ) )
               zz( 3 ) = z( iip1 )*z( iip1 )
            END IF
            zz( 2 ) = z( ii )*z( ii )
            CALL slaed6( niter, orgati, c, delta( iim1 ), zz, w, eta,
     $                   info )
            IF( info.NE.0 )
     $         GO TO 250
         END IF
*
*        Note, eta should be positive if w is negative, and
*        eta should be negative otherwise. However,
*        if for some reason caused by roundoff, eta*w > 0,
*        we simply use one Newton step instead. This way
*        will guarantee eta*w < 0.
*
         IF( w*eta.GE.zero )
     $      eta = -w / dw
         temp = tau + eta
         IF( temp.GT.dltub .OR. temp.LT.dltlb ) THEN
            IF( w.LT.zero ) THEN
               eta = ( dltub-tau ) / two
            ELSE
               eta = ( dltlb-tau ) / two
            END IF
         END IF
*
         prew = w
*
         DO 180 j = 1, n
            delta( j ) = delta( j ) - eta
  180    CONTINUE
*
*        Evaluate PSI and the derivative DPSI
*
         dpsi = zero
         psi = zero
         erretm = zero
         DO 190 j = 1, iim1
            temp = z( j ) / delta( j )
            psi = psi + z( j )*temp
            dpsi = dpsi + temp*temp
            erretm = erretm + psi
  190    CONTINUE
         erretm = abs( erretm )
*
*        Evaluate PHI and the derivative DPHI
*
         dphi = zero
         phi = zero
         DO 200 j = n, iip1, -1
            temp = z( j ) / delta( j )
            phi = phi + z( j )*temp
            dphi = dphi + temp*temp
            erretm = erretm + phi
  200    CONTINUE
*
         temp = z( ii ) / delta( ii )
         dw = dpsi + dphi + temp*temp
         temp = z( ii )*temp
         w = rhoinv + phi + psi + temp
         erretm = eight*( phi-psi ) + erretm + two*rhoinv +
     $            three*abs( temp ) + abs( tau+eta )*dw
*
         swtch = .false.
         IF( orgati ) THEN
            IF( -w.GT.abs( prew ) / ten )
     $         swtch = .true.
         ELSE
            IF( w.GT.abs( prew ) / ten )
     $         swtch = .true.
         END IF
*
         tau = tau + eta
*
*        Main loop to update the values of the array   DELTA
*
         iter = niter + 1
*
         DO 240 niter = iter, maxit
*
*           Test for convergence
*
            IF( abs( w ).LE.eps*erretm ) THEN
               IF( orgati ) THEN
                  dlam = d( i ) + tau
               ELSE
                  dlam = d( ip1 ) + tau
               END IF
               GO TO 250
            END IF
*
            IF( w.LE.zero ) THEN
               dltlb = max( dltlb, tau )
            ELSE
               dltub = min( dltub, tau )
            END IF
*
*           Calculate the new step
*
            IF( .NOT.swtch3 ) THEN
               IF( .NOT.swtch ) THEN
                  IF( orgati ) THEN
                     c = w - delta( ip1 )*dw -
     $                   ( d( i )-d( ip1 ) )*( z( i ) / delta( i ) )**2
                  ELSE
                     c = w - delta( i )*dw - ( d( ip1 )-d( i ) )*
     $                   ( z( ip1 ) / delta( ip1 ) )**2
                  END IF
               ELSE
                  temp = z( ii ) / delta( ii )
                  IF( orgati ) THEN
                     dpsi = dpsi + temp*temp
                  ELSE
                     dphi = dphi + temp*temp
                  END IF
                  c = w - delta( i )*dpsi - delta( ip1 )*dphi
               END IF
               a = ( delta( i )+delta( ip1 ) )*w -
     $             delta( i )*delta( ip1 )*dw
               b = delta( i )*delta( ip1 )*w
               IF( c.EQ.zero ) THEN
                  IF( a.EQ.zero ) THEN
                     IF( .NOT.swtch ) THEN
                        IF( orgati ) THEN
                           a = z( i )*z( i ) + delta( ip1 )*
     $                         delta( ip1 )*( dpsi+dphi )
                        ELSE
                           a = z( ip1 )*z( ip1 ) +
     $                         delta( i )*delta( i )*( dpsi+dphi )
                        END IF
                     ELSE
                        a = delta( i )*delta( i )*dpsi +
     $                      delta( ip1 )*delta( ip1 )*dphi
                     END IF
                  END IF
                  eta = b / a
               ELSE IF( a.LE.zero ) THEN
                  eta = ( a-sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
               ELSE
                  eta = two*b / ( a+sqrt( abs( a*a-four*b*c ) ) )
               END IF
            ELSE
*
*              Interpolation using THREE most relevant poles
*
               temp = rhoinv + psi + phi
               IF( swtch ) THEN
                  c = temp - delta( iim1 )*dpsi - delta( iip1 )*dphi
                  zz( 1 ) = delta( iim1 )*delta( iim1 )*dpsi
                  zz( 3 ) = delta( iip1 )*delta( iip1 )*dphi
               ELSE
                  IF( orgati ) THEN
                     temp1 = z( iim1 ) / delta( iim1 )
                     temp1 = temp1*temp1
                     c = temp - delta( iip1 )*( dpsi+dphi ) -
     $                   ( d( iim1 )-d( iip1 ) )*temp1
                     zz( 1 ) = z( iim1 )*z( iim1 )
                     zz( 3 ) = delta( iip1 )*delta( iip1 )*
     $                         ( ( dpsi-temp1 )+dphi )
                  ELSE
                     temp1 = z( iip1 ) / delta( iip1 )
                     temp1 = temp1*temp1
                     c = temp - delta( iim1 )*( dpsi+dphi ) -
     $                   ( d( iip1 )-d( iim1 ) )*temp1
                     zz( 1 ) = delta( iim1 )*delta( iim1 )*
     $                         ( dpsi+( dphi-temp1 ) )
                     zz( 3 ) = z( iip1 )*z( iip1 )
                  END IF
               END IF
               CALL slaed6( niter, orgati, c, delta( iim1 ), zz, w, eta,
     $                      info )
               IF( info.NE.0 )
     $            GO TO 250
            END IF
*
*           Note, eta should be positive if w is negative, and
*           eta should be negative otherwise. However,
*           if for some reason caused by roundoff, eta*w > 0,
*           we simply use one Newton step instead. This way
*           will guarantee eta*w < 0.
*
            IF( w*eta.GE.zero )
     $         eta = -w / dw
            temp = tau + eta
            IF( temp.GT.dltub .OR. temp.LT.dltlb ) THEN
               IF( w.LT.zero ) THEN
                  eta = ( dltub-tau ) / two
               ELSE
                  eta = ( dltlb-tau ) / two
               END IF
            END IF
*
            DO 210 j = 1, n
               delta( j ) = delta( j ) - eta
  210       CONTINUE
*
            tau = tau + eta
            prew = w
*
*           Evaluate PSI and the derivative DPSI
*
            dpsi = zero
            psi = zero
            erretm = zero
            DO 220 j = 1, iim1
               temp = z( j ) / delta( j )
               psi = psi + z( j )*temp
               dpsi = dpsi + temp*temp
               erretm = erretm + psi
  220       CONTINUE
            erretm = abs( erretm )
*
*           Evaluate PHI and the derivative DPHI
*
            dphi = zero
            phi = zero
            DO 230 j = n, iip1, -1
               temp = z( j ) / delta( j )
               phi = phi + z( j )*temp
               dphi = dphi + temp*temp
               erretm = erretm + phi
  230       CONTINUE
*
            temp = z( ii ) / delta( ii )
            dw = dpsi + dphi + temp*temp
            temp = z( ii )*temp
            w = rhoinv + phi + psi + temp
            erretm = eight*( phi-psi ) + erretm + two*rhoinv +
     $               three*abs( temp ) + abs( tau )*dw
            IF( w*prew.GT.zero .AND. abs( w ).GT.abs( prew ) / ten )
     $         swtch = .NOT.swtch
*
  240    CONTINUE
*
*        Return with INFO = 1, NITER = MAXIT and not converged
*
         info = 1
         IF( orgati ) THEN
            dlam = d( i ) + tau
         ELSE
            dlam = d( ip1 ) + tau
         END IF
*
      END IF
*
  250 CONTINUE
*
      RETURN
*
*     End of SLAED4
*

◆ slaed5()

subroutine slaed5	(	integer	i,
		real, dimension( 2 )	d,
		real, dimension( 2 )	z,
		real, dimension( 2 )	delta,
		real	rho,
		real	dlam )

SLAED5 used by SSTEDC. Solves the 2-by-2 secular equation.

Download SLAED5 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> This subroutine computes the I-th eigenvalue of a symmetric rank-one
!> modification of a 2-by-2 diagonal matrix
!>
!>            diag( D )  +  RHO * Z * transpose(Z) .
!>
!> The diagonal elements in the array D are assumed to satisfy
!>
!>            D(i) < D(j)  for  i < j .
!>
!> We also assume RHO > 0 and that the Euclidean norm of the vector
!> Z is one.
!>

Parameters

[in]	I	!> I is INTEGER !> The index of the eigenvalue to be computed. I = 1 or I = 2. !>
[in]	D	!> D is REAL array, dimension (2) !> The original eigenvalues. We assume D(1) < D(2). !>
[in]	Z	!> Z is REAL array, dimension (2) !> The components of the updating vector. !>
[out]	DELTA	!> DELTA is REAL array, dimension (2) !> The vector DELTA contains the information necessary !> to construct the eigenvectors. !>
[in]	RHO	!> RHO is REAL !> The scalar in the symmetric updating formula. !>
[out]	DLAM	!> DLAM is REAL !> The computed lambda_I, the I-th updated eigenvalue. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Ren-Cang Li, Computer Science Division, University of California at Berkeley, USA

Definition at line 107 of file slaed5.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Direct solution of the 2-by-2 secular equation.  DLAM receives
*     D(1) or D(2) plus a computed shift, and DELTA receives a
*     two-vector that is scaled to unit Euclidean norm before return.
*
*     .. Scalar Arguments ..
      INTEGER            I
      REAL               DLAM, RHO
*     ..
*     .. Array Arguments ..
      REAL               D( 2 ), DELTA( 2 ), Z( 2 )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE, TWO, FOUR
      parameter( zero = 0.0e0, one = 1.0e0, two = 2.0e0,
     $                   four = 4.0e0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            LOWER
      REAL               B, C, GAP, ROOT, SHIFT, VNORM, W
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, sqrt
*     ..
*     .. Executable Statements ..
*
      gap = d( 2 ) - d( 1 )
*
*     LOWER is .TRUE. only for I = 1 with W > 0; the shift is then
*     measured from D(1).  In every other case (I = 1 with W <= 0, or
*     I different from 1) the shift is measured from D(2).
*
      lower = .false.
      IF( i.EQ.1 ) THEN
         w = one + two*rho*( z( 2 )*z( 2 )-z( 1 )*z( 1 ) ) / gap
         lower = w.GT.zero
      END IF
*
      IF( lower ) THEN
*
*        B > ZERO, always
*
         b = gap + rho*( z( 1 )*z( 1 )+z( 2 )*z( 2 ) )
         c = rho*z( 1 )*z( 1 )*gap
         shift = two*c / ( b+sqrt( abs( b*b-four*c ) ) )
         dlam = d( 1 ) + shift
         delta( 1 ) = -z( 1 ) / shift
         delta( 2 ) = z( 2 ) / ( gap-shift )
      ELSE
*
*        Both remaining cases share B, C and the square root; they
*        differ only in which root of the quadratic is taken.  The
*        form of each root is chosen from the sign of B.
*
         b = -gap + rho*( z( 1 )*z( 1 )+z( 2 )*z( 2 ) )
         c = rho*z( 2 )*z( 2 )*gap
         root = sqrt( b*b+four*c )
         IF( i.EQ.1 ) THEN
            IF( b.GT.zero ) THEN
               shift = -two*c / ( b+root )
            ELSE
               shift = ( b-root ) / two
            END IF
         ELSE
            IF( b.GT.zero ) THEN
               shift = ( b+root ) / two
            ELSE
               shift = two*c / ( -b+root )
            END IF
         END IF
         dlam = d( 2 ) + shift
         delta( 1 ) = -z( 1 ) / ( gap+shift )
         delta( 2 ) = -z( 2 ) / shift
      END IF
*
*     Scale DELTA to unit Euclidean norm.
*
      vnorm = sqrt( delta( 1 )*delta( 1 )+delta( 2 )*delta( 2 ) )
      delta( 1 ) = delta( 1 ) / vnorm
      delta( 2 ) = delta( 2 ) / vnorm
      RETURN
*
*     End of SLAED5
*

◆ slaed6()

subroutine slaed6	(	integer	kniter,
		logical	orgati,
		real	rho,
		real, dimension( 3 )	d,
		real, dimension( 3 )	z,
		real	finit,
		real	tau,
		integer	info )

SLAED6 used by SSTEDC. Computes one Newton step in solution of the secular equation.

Download SLAED6 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLAED6 computes the positive or negative root (closest to the origin)
!> of
!>                  z(1)        z(2)        z(3)
!> f(x) =   rho + --------- + ---------- + ---------
!>                 d(1)-x      d(2)-x      d(3)-x
!>
!> It is assumed that
!>
!>       if ORGATI = .true. the root is between d(2) and d(3);
!>       otherwise it is between d(1) and d(2)
!>
!> This routine will be called by SLAED4 when necessary. In most cases,
!> the root sought is the smallest in magnitude, though it might not be
!> in some extremely rare situations.
!>

Parameters

[in]	KNITER	!> KNITER is INTEGER !> Refer to SLAED4 for its significance. !>
[in]	ORGATI	!> ORGATI is LOGICAL !> If ORGATI is true, the needed root is between d(2) and !> d(3); otherwise it is between d(1) and d(2). See !> SLAED4 for further details. !>
[in]	RHO	!> RHO is REAL !> Refer to the equation f(x) above. !>
[in]	D	!> D is REAL array, dimension (3) !> D satisfies d(1) < d(2) < d(3). !>
[in]	Z	!> Z is REAL array, dimension (3) !> Each of the elements in z must be positive. !>
[in]	FINIT	!> FINIT is REAL !> The value of f at 0. It is more accurate than the one !> evaluated inside this routine (if someone wants to do !> so). !>
[out]	TAU	!> TAU is REAL !> The root of the equation f(x). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> > 0: if INFO = 1, failure to converge !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  10/02/03: This version has a few statements commented out for thread
!>  safety (machine parameters are computed on each entry). SJH.
!>
!>  05/10/06: Modified from a new version of Ren-Cang Li, use
!>     Gragg-Thornton-Warner cubic convergent scheme for better stability.
!>

Contributors: Ren-Cang Li, Computer Science Division, University of California at Berkeley, USA

Definition at line 139 of file slaed6.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Finds a root TAU of
*
*        f(x) = RHO + Z(1)/(D(1)-x) + Z(2)/(D(2)-x) + Z(3)/(D(3)-x)
*
*     by an iteration that is kept inside a bracket [LBD, UBD].
*     ORGATI selects the pole interval that bounds the bracket:
*     D(2)..D(3) when .TRUE., D(1)..D(2) otherwise.  FINIT is the
*     caller-supplied value of f(0).  INFO is 0 on every exit except
*     when the main loop runs through MAXIT without leaving early,
*     in which case INFO = 1.
*
*     .. Scalar Arguments ..
      LOGICAL            ORGATI
      INTEGER            INFO, KNITER
      REAL               FINIT, RHO, TAU
*     ..
*     .. Array Arguments ..
      REAL               D( 3 ), Z( 3 )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            MAXIT
      parameter( maxit = 40 )
      REAL               ZERO, ONE, TWO, THREE, FOUR, EIGHT
      parameter( zero = 0.0e0, one = 1.0e0, two = 2.0e0,
     $                   three = 3.0e0, four = 4.0e0, eight = 8.0e0 )
*     ..
*     .. External Functions ..
      REAL               SLAMCH
      EXTERNAL           slamch
*     ..
*     .. Local Arrays ..
      REAL               DSCALE( 3 ), ZSCALE( 3 )
*     ..
*     .. Local Scalars ..
      LOGICAL            SCALE
      INTEGER            I, ITER, NITER
      REAL               A, B, BASE, C, DDF, DF, EPS, ERRETM, ETA, F,
     $                   FC, SCLFAC, SCLINV, SMALL1, SMALL2, SMINV1,
     $                   SMINV2, TEMP, TEMP1, TEMP2, TEMP3, TEMP4,
     $                   LBD, UBD
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, int, log, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
      info = 0
*
*     Initial bracket: the pole interval selected by ORGATI, with one
*     end replaced by zero according to the sign of FINIT = f(0).
*
      IF( orgati ) THEN
         lbd = d(2)
         ubd = d(3)
      ELSE
         lbd = d(1)
         ubd = d(2)
      END IF
      IF( finit .LT. zero )THEN
         lbd = zero
      ELSE
         ubd = zero
      END IF
*
*     The default starting point is TAU = 0.  Only for KNITER = 2 is
*     a starting guess computed, from a quadratic with coefficients
*     A, B, C.  C is RHO plus the term of the pole outside the
*     selected interval, evaluated at the midpoint of that interval.
*
      niter = 1
      tau = zero
      IF( kniter.EQ.2 ) THEN
         IF( orgati ) THEN
            temp = ( d( 3 )-d( 2 ) ) / two
            c = rho + z( 1 ) / ( ( d( 1 )-d( 2 ) )-temp )
            a = c*( d( 2 )+d( 3 ) ) + z( 2 ) + z( 3 )
            b = c*d( 2 )*d( 3 ) + z( 2 )*d( 3 ) + z( 3 )*d( 2 )
         ELSE
            temp = ( d( 1 )-d( 2 ) ) / two
            c = rho + z( 3 ) / ( ( d( 3 )-d( 2 ) )-temp )
            a = c*( d( 1 )+d( 2 ) ) + z( 1 ) + z( 2 )
            b = c*d( 1 )*d( 2 ) + z( 1 )*d( 2 ) + z( 2 )*d( 1 )
         END IF
*
*        Divide the coefficients by the largest magnitude among them
*        before solving the quadratic.
*
         temp = max( abs( a ), abs( b ), abs( c ) )
         a = a / temp
         b = b / temp
         c = c / temp
         IF( c.EQ.zero ) THEN
            tau = b / a
         ELSE IF( a.LE.zero ) THEN
            tau = ( a-sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
         ELSE
            tau = two*b / ( a+sqrt( abs( a*a-four*b*c ) ) )
         END IF
*
*        A guess outside the bracket is replaced by its midpoint.
*
         IF( tau .LT. lbd .OR. tau .GT. ubd )
     $      tau = ( lbd+ubd )/two
*
*        A guess that coincides with a pole is discarded.  Otherwise
*        f is evaluated at the guess (TEMP), the bracket is tightened
*        with that value, and the guess is kept only if it gives a
*        smaller |f| than the starting point zero does.
*
         IF( d(1).EQ.tau .OR. d(2).EQ.tau .OR. d(3).EQ.tau ) THEN
            tau = zero
         ELSE
            temp = finit + tau*z(1)/( d(1)*( d( 1 )-tau ) ) +
     $                     tau*z(2)/( d(2)*( d( 2 )-tau ) ) +
     $                     tau*z(3)/( d(3)*( d( 3 )-tau ) )
            IF( temp .LE. zero )THEN
               lbd = tau
            ELSE
               ubd = tau
            END IF
            IF( abs( finit ).LE.abs( temp ) )
     $         tau = zero
         END IF
      END IF
*
*     get machine parameters for possible scaling to avoid overflow
*
*     modified by Sven: parameters SMALL1, SMINV1, SMALL2,
*     SMINV2, EPS are not SAVEd anymore between one call to the
*     others but recomputed at each call
*
      eps = slamch( 'Epsilon' )
      base = slamch( 'Base' )
      small1 = base**( int( log( slamch( 'SafMin' ) ) / log( base ) /
     $         three ) )
      sminv1 = one / small1
      small2 = small1*small1
      sminv2 = sminv1*sminv1
*
*     Determine if scaling of inputs necessary to avoid overflow
*     when computing 1/TEMP**3
*
      IF( orgati ) THEN
         temp = min( abs( d( 2 )-tau ), abs( d( 3 )-tau ) )
      ELSE
         temp = min( abs( d( 1 )-tau ), abs( d( 2 )-tau ) )
      END IF
      scale = .false.
      IF( temp.LE.small1 ) THEN
         scale = .true.
         IF( temp.LE.small2 ) THEN
*
*        Scale up by power of radix nearest 1/SAFMIN**(2/3)
*
            sclfac = sminv2
            sclinv = small2
         ELSE
*
*        Scale up by power of radix nearest 1/SAFMIN**(1/3)
*
            sclfac = sminv1
            sclinv = small1
         END IF
*
*        Scaling up safe because D, Z, TAU scaled elsewhere to be O(1)
*
*        TAU and the bracket ends are scaled by the same factor as
*        D and Z.  SCLINV is only defined on this path and is only
*        read at the end when SCALE is .TRUE..
*
         DO 10 i = 1, 3
            dscale( i ) = d( i )*sclfac
            zscale( i ) = z( i )*sclfac
   10    CONTINUE
         tau = tau*sclfac
         lbd = lbd*sclfac
         ubd = ubd*sclfac
      ELSE
*
*        Copy D and Z to DSCALE and ZSCALE
*
         DO 20 i = 1, 3
            dscale( i ) = d( i )
            zscale( i ) = z( i )
   20    CONTINUE
      END IF
*
*     Accumulate, over the three poles and at the current TAU,
*        FC  = sum of ZSCALE(i) / ( DSCALE(i)*( DSCALE(i)-TAU ) )
*        DF  = sum of ZSCALE(i) / ( DSCALE(i)-TAU )**2
*        DDF = sum of ZSCALE(i) / ( DSCALE(i)-TAU )**3
*     and form F = FINIT + TAU*FC.
*
      fc = zero
      df = zero
      ddf = zero
      DO 30 i = 1, 3
         temp = one / ( dscale( i )-tau )
         temp1 = zscale( i )*temp
         temp2 = temp1*temp
         temp3 = temp2*temp
         fc = fc + temp1 / dscale( i )
         df = df + temp2
         ddf = ddf + temp3
   30 CONTINUE
      f = finit + tau*fc
*
*     Leave at once if F is exactly zero; otherwise use the sign of F
*     to move one end of the bracket to TAU.
*
      IF( abs( f ).LE.zero )
     $   GO TO 60
      IF( f .LE. zero )THEN
         lbd = tau
      ELSE
         ubd = tau
      END IF
*
*        Iteration begins -- Use Gragg-Thornton-Warner cubic convergent
*                            scheme
*
*     It is not hard to see that
*
*           1) Iterations will go up monotonically
*              if FINIT < 0;
*
*           2) Iterations will go down monotonically
*              if FINIT > 0.
*
*     NITER was set to 1 above, so the loop counts from 2 to MAXIT.
*
      iter = niter + 1
*
      DO 50 niter = iter, maxit
*
*        TEMP1 and TEMP2 are the distances from TAU to the two poles
*        of the interval selected by ORGATI.
*
         IF( orgati ) THEN
            temp1 = dscale( 2 ) - tau
            temp2 = dscale( 3 ) - tau
         ELSE
            temp1 = dscale( 1 ) - tau
            temp2 = dscale( 2 ) - tau
         END IF
*
*        Quadratic coefficients for the step ETA, built from F, DF
*        and DDF and divided by their largest magnitude.
*
         a = ( temp1+temp2 )*f - temp1*temp2*df
         b = temp1*temp2*f
         c = f - ( temp1+temp2 )*df + temp1*temp2*ddf
         temp = max( abs( a ), abs( b ), abs( c ) )
         a = a / temp
         b = b / temp
         c = c / temp
         IF( c.EQ.zero ) THEN
            eta = b / a
         ELSE IF( a.LE.zero ) THEN
            eta = ( a-sqrt( abs( a*a-four*b*c ) ) ) / ( two*c )
         ELSE
            eta = two*b / ( a+sqrt( abs( a*a-four*b*c ) ) )
         END IF
*
*        When ETA has the same sign as F (or their product is zero),
*        replace it by the Newton step -F/DF.
*
         IF( f*eta.GE.zero ) THEN
            eta = -f / df
         END IF
*
*        Take the step; if it leaves the bracket, use the midpoint of
*        the bracket instead.
*
         tau = tau + eta
         IF( tau .LT. lbd .OR. tau .GT. ubd )
     $      tau = ( lbd + ubd )/two
*
*        Re-evaluate FC, DF and DDF at the new TAU, and accumulate in
*        ERRETM the sum of the absolute values of the FC terms.  If
*        TAU coincides exactly with a pole the routine exits through
*        label 60 with INFO still 0.
*
         fc = zero
         erretm = zero
         df = zero
         ddf = zero
         DO 40 i = 1, 3
            IF ( ( dscale( i )-tau ).NE.zero ) THEN
               temp = one / ( dscale( i )-tau )
               temp1 = zscale( i )*temp
               temp2 = temp1*temp
               temp3 = temp2*temp
               temp4 = temp1 / dscale( i )
               fc = fc + temp4
               erretm = erretm + abs( temp4 )
               df = df + temp2
               ddf = ddf + temp3
            ELSE
               GO TO 60
            END IF
   40    CONTINUE
         f = finit + tau*fc
         erretm = eight*( abs( finit )+abs( tau )*erretm ) +
     $            abs( tau )*df
*
*        Stop when |F| is within 4*EPS*ERRETM, or when the bracket
*        width is within 4*EPS*|TAU|.
*
         IF( ( abs( f ).LE.four*eps*erretm ) .OR.
     $      ( (ubd-lbd).LE.four*eps*abs(tau) )  )
     $      GO TO 60
         IF( f .LE. zero )THEN
            lbd = tau
         ELSE
            ubd = tau
         END IF
   50 CONTINUE
*
*     Reached only when the loop ends without a jump to label 60.
*
      info = 1
   60 CONTINUE
*
*     Undo scaling
*
      IF( scale )
     $   tau = tau*sclinv
      RETURN
*
*     End of SLAED6
*

◆ slaed7()

subroutine slaed7	(	integer	icompq,
		integer	n,
		integer	qsiz,
		integer	tlvls,
		integer	curlvl,
		integer	curpbm,
		real, dimension( * )	d,
		real, dimension( ldq, * )	q,
		integer	ldq,
		integer, dimension( * )	indxq,
		real	rho,
		integer	cutpnt,
		real, dimension( * )	qstore,
		integer, dimension( * )	qptr,
		integer, dimension( * )	prmptr,
		integer, dimension( * )	perm,
		integer, dimension( * )	givptr,
		integer, dimension( 2, * )	givcol,
		real, dimension( 2, * )	givnum,
		real, dimension( * )	work,
		integer, dimension( * )	iwork,
		integer	info )

SLAED7 used by SSTEDC. Computes the updated eigensystem of a diagonal matrix after modification by a rank-one symmetric matrix. Used when the original matrix is dense.

Download SLAED7 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLAED7 computes the updated eigensystem of a diagonal
!> matrix after modification by a rank-one symmetric matrix. This
!> routine is used only for the eigenproblem which requires all
!> eigenvalues and optionally eigenvectors of a dense symmetric matrix
!> that has been reduced to tridiagonal form.  SLAED1 handles
!> the case in which all eigenvalues and eigenvectors of a symmetric
!> tridiagonal matrix are desired.
!>
!>   T = Q(in) ( D(in) + RHO * Z*Z**T ) Q**T(in) = Q(out) * D(out) * Q**T(out)
!>
!>    where Z = Q**T * u, u is a vector of length N with ones in the
!>    CUTPNT and CUTPNT + 1 th elements and zeros elsewhere.
!>
!>    The eigenvectors of the original matrix are stored in Q, and the
!>    eigenvalues are in D.  The algorithm consists of three stages:
!>
!>       The first stage consists of deflating the size of the problem
!>       when there are multiple eigenvalues or if there is a zero in
!>       the Z vector.  For each such occurrence the dimension of the
!>       secular equation problem is reduced by one.  This stage is
!>       performed by the routine SLAED8.
!>
!>       The second stage consists of calculating the updated
!>       eigenvalues. This is done by finding the roots of the secular
!>       equation via the routine SLAED4 (as called by SLAED9).
!>       This routine also calculates the eigenvectors of the current
!>       problem.
!>
!>       The final stage consists of computing the updated eigenvectors
!>       directly using the updated eigenvalues.  The eigenvectors for
!>       the current problem are multiplied with the eigenvectors from
!>       the overall problem.
!>

Parameters

[in]	ICOMPQ	!> ICOMPQ is INTEGER !> = 0: Compute eigenvalues only. !> = 1: Compute eigenvectors of original dense symmetric matrix !> also. On entry, Q contains the orthogonal matrix used !> to reduce the original matrix to tridiagonal form. !>
[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in]	QSIZ	!> QSIZ is INTEGER !> The dimension of the orthogonal matrix used to reduce !> the full matrix to tridiagonal form. QSIZ >= N if ICOMPQ = 1. !>
[in]	TLVLS	!> TLVLS is INTEGER !> The total number of merging levels in the overall divide and !> conquer tree. !>
[in]	CURLVL	!> CURLVL is INTEGER !> The current level in the overall merge routine, !> 0 <= CURLVL <= TLVLS. !>
[in]	CURPBM	!> CURPBM is INTEGER !> The current problem in the current level in the overall !> merge routine (counting from upper left to lower right). !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the eigenvalues of the rank-1-perturbed matrix. !> On exit, the eigenvalues of the repaired matrix. !>
[in,out]	Q	!> Q is REAL array, dimension (LDQ, N) !> On entry, the eigenvectors of the rank-1-perturbed matrix. !> On exit, the eigenvectors of the repaired tridiagonal matrix. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N). !>
[out]	INDXQ	!> INDXQ is INTEGER array, dimension (N) !> The permutation which will reintegrate the subproblem just !> solved back into sorted order, i.e., D( INDXQ( I = 1, N ) ) !> will be in ascending order. !>
[in]	RHO	!> RHO is REAL !> The subdiagonal element used to create the rank-1 !> modification. !>
[in]	CUTPNT	!> CUTPNT is INTEGER !> Contains the location of the last eigenvalue in the leading !> sub-matrix. min(1,N) <= CUTPNT <= N. !>
[in,out]	QSTORE	!> QSTORE is REAL array, dimension (N**2+1) !> Stores eigenvectors of submatrices encountered during !> divide and conquer, packed together. QPTR points to !> beginning of the submatrices. !>
[in,out]	QPTR	!> QPTR is INTEGER array, dimension (N+2) !> List of indices pointing to beginning of submatrices stored !> in QSTORE. The submatrices are numbered starting at the !> bottom left of the divide and conquer tree, from left to !> right and bottom to top. !>
[in]	PRMPTR	!> PRMPTR is INTEGER array, dimension (N lg N) !> Contains a list of pointers which indicate where in PERM a !> level's permutation is stored. PRMPTR(i+1) - PRMPTR(i) !> indicates the size of the permutation and also the size of !> the full, non-deflated problem. !>
[in]	PERM	!> PERM is INTEGER array, dimension (N lg N) !> Contains the permutations (from deflation and sorting) to be !> applied to each eigenblock. !>
[in]	GIVPTR	!> GIVPTR is INTEGER array, dimension (N lg N) !> Contains a list of pointers which indicate where in GIVCOL a !> level's Givens rotations are stored. GIVPTR(i+1) - GIVPTR(i) !> indicates the number of Givens rotations. !>
[in]	GIVCOL	!> GIVCOL is INTEGER array, dimension (2, N lg N) !> Each pair of numbers indicates a pair of columns to take place !> in a Givens rotation. !>
[in]	GIVNUM	!> GIVNUM is REAL array, dimension (2, N lg N) !> Each number indicates the S value to be used in the !> corresponding Givens rotation. !>
[out]	WORK	!> WORK is REAL array, dimension (3*N+2*QSIZ*N) !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (4*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: if INFO = 1, an eigenvalue did not converge !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA

Definition at line 256 of file slaed7.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Driver for one merge step.  It calls, in order, SLAEDA, SLAED8
*     and, when SLAED8 returns a nonzero count, SLAED9, optionally
*     SGEMM (ICOMPQ = 1) and SLAMRG, and it advances the pointer
*     arrays QPTR, PRMPTR and GIVPTR for the current tree node.
*
*     .. Scalar Arguments ..
      INTEGER            CURLVL, CURPBM, CUTPNT, ICOMPQ, INFO, LDQ, N,
     $                   QSIZ, TLVLS
      REAL               RHO
*     ..
*     .. Array Arguments ..
      INTEGER            GIVCOL( 2, * ), GIVPTR( * ), INDXQ( * ),
     $                   IWORK( * ), PERM( * ), PRMPTR( * ), QPTR( * )
      REAL               D( * ), GIVNUM( 2, * ), Q( LDQ, * ),
     $                   QSTORE( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      parameter( one = 1.0e0, zero = 0.0e0 )
*     ..
*     .. Local Scalars ..
      INTEGER            J, JIDX, JIDXP, KDLAM, KQ2, KS, KW, KZ, LDWQ,
     $                   LVL, NDEFL, NKEPT, NODE
*     ..
*     .. External Subroutines ..
      EXTERNAL           sgemm, slaed8, slaed9, slaeda, slamrg, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  The checks run from the last argument
*     to the first, each overriding INFO, so that when several are
*     wrong INFO reports the one earliest in the argument list.
*
      info = 0
      IF( cutpnt.LT.min( 1, n ) .OR. cutpnt.GT.n )
     $   info = -12
      IF( ldq.LT.max( 1, n ) )
     $   info = -9
      IF( icompq.EQ.1 .AND. qsiz.LT.n )
     $   info = -3
      IF( n.LT.0 )
     $   info = -2
      IF( icompq.LT.0 .OR. icompq.GT.1 )
     $   info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SLAED7', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty problem.
*
      IF( n.EQ.0 ) RETURN
*
*     Leading dimension of the Q2 workspace: QSIZ when ICOMPQ = 1,
*     N otherwise.
*
      ldwq = n
      IF( icompq.EQ.1 )
     $   ldwq = qsiz
*
*     Offsets into WORK, laid out back to back: three segments of
*     length N starting at KZ, KDLAM and KW, then N*LDWQ entries at
*     KQ2, then the segment starting at KS.
*
      kz = 1
      kdlam = kz + n
      kw = kdlam + n
      kq2 = kw + n
      ks = kq2 + n*ldwq
*
*     Offsets into IWORK handed to SLAED8: the segment at JIDX and
*     the segment 3*N entries further on at JIDXP.
*
      jidx = 1
      jidxp = jidx + 3*n
*
*     Position of the current subproblem in the pointer arrays:
*     1 + 2**TLVLS, plus 2**(TLVLS-LVL) for LVL = 1..CURLVL-1,
*     plus CURPBM.
*
      node = 1 + 2**tlvls
      DO 10 lvl = 1, curlvl - 1
         node = node + 2**( tlvls-lvl )
   10 CONTINUE
      node = node + curpbm
*
*     Form the z-vector which consists of the last row of Q_1 and the
*     first row of Q_2.
*
      CALL slaeda( n, tlvls, curlvl, curpbm, prmptr, perm, givptr,
     $             givcol, givnum, qstore, qptr, work( kz ),
     $             work( kdlam ), info )
*
*     When solving the final problem, we no longer need the stored data,
*     so we will overwrite the data from this level onto the previously
*     used storage space.
*
      IF( curlvl.EQ.tlvls ) THEN
         qptr( node ) = 1
         prmptr( node ) = 1
         givptr( node ) = 1
      END IF
*
*     Sort and deflate.  SLAED8 returns its count in NKEPT and writes
*     GIVPTR( NODE+1 ); the two statements after the call then
*     advance PRMPTR by N and add GIVPTR( NODE ) to GIVPTR( NODE+1 ).
*
      CALL slaed8( icompq, nkept, n, qsiz, d, q, ldq, indxq, rho,
     $             cutpnt, work( kz ), work( kdlam ), work( kq2 ),
     $             ldwq, work( kw ), perm( prmptr( node ) ),
     $             givptr( node+1 ), givcol( 1, givptr( node ) ),
     $             givnum( 1, givptr( node ) ), iwork( jidxp ),
     $             iwork( jidx ), info )
      prmptr( node+1 ) = prmptr( node ) + n
      givptr( node+1 ) = givptr( node+1 ) + givptr( node )
*
      IF( nkept.EQ.0 ) THEN
*
*        SLAED8 returned a zero count: nothing new is stored in
*        QSTORE and INDXQ is the identity permutation.
*
         qptr( node+1 ) = qptr( node )
         DO 20 j = 1, n
            indxq( j ) = j
   20    CONTINUE
      ELSE
*
*        Solve the secular equation.  If SLAED9 reports a failure,
*        return straight away with its INFO.
*
         CALL slaed9( nkept, 1, nkept, n, d, work( ks ), nkept, rho,
     $                work( kdlam ), work( kw ),
     $                qstore( qptr( node ) ), nkept, info )
         IF( info.EQ.0 ) THEN
            IF( icompq.EQ.1 )
     $         CALL sgemm( 'N', 'N', qsiz, nkept, nkept, one,
     $                     work( kq2 ), ldwq, qstore( qptr( node ) ),
     $                     nkept, zero, q, ldq )
            qptr( node+1 ) = qptr( node ) + nkept**2
*
*           Prepare the INDXQ sorting permutation.
*
            ndefl = n - nkept
            CALL slamrg( nkept, ndefl, d, 1, -1, indxq )
         END IF
      END IF
*
      RETURN
*
*     End of SLAED7
*

◆ slaed8()

subroutine slaed8	(	integer	icompq,
		integer	k,
		integer	n,
		integer	qsiz,
		real, dimension( * )	d,
		real, dimension( ldq, * )	q,
		integer	ldq,
		integer, dimension( * )	indxq,
		real	rho,
		integer	cutpnt,
		real, dimension( * )	z,
		real, dimension( * )	dlamda,
		real, dimension( ldq2, * )	q2,
		integer	ldq2,
		real, dimension( * )	w,
		integer, dimension( * )	perm,
		integer	givptr,
		integer, dimension( 2, * )	givcol,
		real, dimension( 2, * )	givnum,
		integer, dimension( * )	indxp,
		integer, dimension( * )	indx,
		integer	info )

SLAED8 used by SSTEDC. Merges eigenvalues and deflates secular equation. Used when the original matrix is dense.

Download SLAED8 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLAED8 merges the two sets of eigenvalues together into a single
!> sorted set.  Then it tries to deflate the size of the problem.
!> There are two ways in which deflation can occur:  when two or more
!> eigenvalues are close together or if there is a tiny element in the
!> Z vector.  For each such occurrence the order of the related secular
!> equation problem is reduced by one.
!>

Parameters

[in]	ICOMPQ	!> ICOMPQ is INTEGER !> = 0: Compute eigenvalues only. !> = 1: Compute eigenvectors of original dense symmetric matrix !> also. On entry, Q contains the orthogonal matrix used !> to reduce the original matrix to tridiagonal form. !>
[out]	K	!> K is INTEGER !> The number of non-deflated eigenvalues, and the order of the !> related secular equation. !>
[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in]	QSIZ	!> QSIZ is INTEGER !> The dimension of the orthogonal matrix used to reduce !> the full matrix to tridiagonal form. QSIZ >= N if ICOMPQ = 1. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the eigenvalues of the two submatrices to be !> combined. On exit, the trailing (N-K) updated eigenvalues !> (those which were deflated) sorted into increasing order. !>
[in,out]	Q	!> Q is REAL array, dimension (LDQ,N) !> If ICOMPQ = 0, Q is not referenced. Otherwise, !> on entry, Q contains the eigenvectors of the partially solved !> system which has been previously updated in matrix !> multiplies with other partially solved eigensystems. !> On exit, Q contains the trailing (N-K) updated eigenvectors !> (those which were deflated) in its last N-K columns. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N). !>
[in]	INDXQ	!> INDXQ is INTEGER array, dimension (N) !> The permutation which separately sorts the two sub-problems !> in D into ascending order. Note that elements in the second !> half of this permutation must first have CUTPNT added to !> their values in order to be accurate. !>
[in,out]	RHO	!> RHO is REAL !> On entry, the off-diagonal element associated with the rank-1 !> cut which originally split the two submatrices which are now !> being recombined. !> On exit, RHO has been modified to the value required by !> SLAED9. !>
[in]	CUTPNT	!> CUTPNT is INTEGER !> The location of the last eigenvalue in the leading !> sub-matrix. min(1,N) <= CUTPNT <= N. !>
[in]	Z	!> Z is REAL array, dimension (N) !> On entry, Z contains the updating vector (the last row of !> the first sub-eigenvector matrix and the first row of the !> second sub-eigenvector matrix). !> On exit, the contents of Z are destroyed by the updating !> process. !>
[out]	DLAMDA	!> DLAMDA is REAL array, dimension (N) !> A copy of the first K eigenvalues which will be used by !> SLAED9 to form the secular equation. !>
[out]	Q2	!> Q2 is REAL array, dimension (LDQ2,N) !> If ICOMPQ = 0, Q2 is not referenced. Otherwise, !> a copy of the first K eigenvectors which will be used by !> SLAED7 in a matrix multiply (SGEMM) to update the new !> eigenvectors. !>
[in]	LDQ2	!> LDQ2 is INTEGER !> The leading dimension of the array Q2. LDQ2 >= max(1,N). !>
[out]	W	!> W is REAL array, dimension (N) !> The first K values of the final deflation-altered z-vector, which !> will be passed to SLAED9. !>
[out]	PERM	!> PERM is INTEGER array, dimension (N) !> The permutations (from deflation and sorting) to be applied !> to each eigenblock. !>
[out]	GIVPTR	!> GIVPTR is INTEGER !> The number of Givens rotations which took place in this !> subproblem. !>
[out]	GIVCOL	!> GIVCOL is INTEGER array, dimension (2, N) !> Each pair of numbers indicates a pair of columns to take place !> in a Givens rotation. !>
[out]	GIVNUM	!> GIVNUM is REAL array, dimension (2, N) !> Each number indicates the S value to be used in the !> corresponding Givens rotation. !>
[out]	INDXP	!> INDXP is INTEGER array, dimension (N) !> The permutation used to place deflated values of D at the end !> of the array. INDXP(1:K) points to the nondeflated D-values !> and INDXP(K+1:N) points to the deflated eigenvalues. !>
[out]	INDX	!> INDX is INTEGER array, dimension (N) !> The permutation used to sort the contents of D into ascending !> order. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA

Definition at line 240 of file slaed8.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     SLAED8 merges the two sorted eigenvalue sets held in D into one
*     ordered set and then deflates the secular equation wherever a
*     Z component is negligible or two neighbouring eigenvalues are
*     close enough to be decoupled by a Givens rotation.  On exit K
*     holds the number of entries that were not deflated.
*
*     .. Scalar Arguments ..
      INTEGER            CUTPNT, GIVPTR, ICOMPQ, INFO, K, LDQ, LDQ2, N,
     $                   QSIZ
      REAL               RHO
*     ..
*     .. Array Arguments ..
      INTEGER            GIVCOL( 2, * ), INDX( * ), INDXP( * ),
     $                   INDXQ( * ), PERM( * )
      REAL               D( * ), DLAMDA( * ), GIVNUM( 2, * ),
     $                   Q( LDQ, * ), Q2( LDQ2, * ), W( * ), Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               MONE, ZERO, ONE, TWO, EIGHT
      parameter( mone = -1.0e0, zero = 0.0e0, one = 1.0e0,
     $                   two = 2.0e0, eight = 8.0e0 )
*     ..
*     .. Local Scalars ..
*
*     JLAM is the index of the pending (not yet classified) entry
*     during the deflation scan; K2 is the front of the list of
*     deflated indices, which grows downwards from INDXP( N ).
*
      INTEGER            I, IMAX, J, JLAM, JMAX, JP, K2, N1, N1P1, N2
      REAL               C, EPS, S, T, TAU, TOL
*     ..
*     .. External Functions ..
      INTEGER            ISAMAX
      REAL               SLAMCH, SLAPY2
      EXTERNAL           isamax, slamch, slapy2
*     ..
*     .. External Subroutines ..
      EXTERNAL           scopy, slacpy, slamrg, srot, sscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.  The INFO value is minus the position
*     of the offending argument in the argument list.
*
      info = 0
*
      IF( icompq.LT.0 .OR. icompq.GT.1 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( icompq.EQ.1 .AND. qsiz.LT.n ) THEN
         info = -4
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -7
      ELSE IF( cutpnt.LT.min( 1, n ) .OR. cutpnt.GT.n ) THEN
         info = -10
      ELSE IF( ldq2.LT.max( 1, n ) ) THEN
         info = -14
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SLAED8', -info )
         RETURN
      END IF
*
*     GIVPTR must be initialized to 0 here, before any quick exit, to
*     prevent unspecified behavior (usually a segmentation fault) when
*     the IWORK array on entry to *stedc is not zeroed (or at least
*     those IWORK entries which are used in *laed7 for GIVPTR).
*
      givptr = 0
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     N1 and N2 are the sizes of the leading and trailing subproblems;
*     N1P1 is the first index of the trailing one.
*
      n1 = cutpnt
      n2 = n - n1
      n1p1 = n1 + 1
*
*     For negative RHO the trailing part of Z is negated; RHO itself
*     is replaced by a non-negative value below.
*
      IF( rho.LT.zero ) THEN
         CALL sscal( n2, mone, z( n1p1 ), 1 )
      END IF
*
*     Normalize z so that norm(z) = 1: Z is scaled by 1/sqrt(2) and
*     RHO is replaced by abs( 2*RHO ).  INDX starts as the identity.
*
      t = one / sqrt( two )
      DO 10 j = 1, n
         indx( j ) = j
   10 CONTINUE
      CALL sscal( n, t, z, 1 )
      rho = abs( two*rho )
*
*     Sort the eigenvalues into increasing order
*
*     The second-half entries of INDXQ are relative to CUTPNT, so they
*     are shifted to index the full arrays.  DLAMDA and W then receive
*     D and Z gathered through INDXQ.
*
      DO 20 i = cutpnt + 1, n
         indxq( i ) = indxq( i ) + cutpnt
   20 CONTINUE
      DO 30 i = 1, n
         dlamda( i ) = d( indxq( i ) )
         w( i ) = z( indxq( i ) )
   30 CONTINUE
*
*     NOTE: the next two assignments are never read; I and J are both
*     reassigned by the DO loops that follow.
*
      i = 1
      j = cutpnt + 1
*
*     Merge the two runs held in DLAMDA; INDX receives the merging
*     permutation, through which D and Z are rewritten.
*
      CALL slamrg( n1, n2, dlamda, 1, 1, indx )
      DO 40 i = 1, n
         d( i ) = dlamda( indx( i ) )
         z( i ) = w( indx( i ) )
   40 CONTINUE
*
*     Calculate the allowable deflation tolerance:
*     TOL = 8 * EPS * abs( D( JMAX ) ), where JMAX is the index returned
*     by ISAMAX for D (IMAX is the corresponding index for Z).
*
      imax = isamax( n, z, 1 )
      jmax = isamax( n, d, 1 )
      eps = slamch( 'Epsilon' )
      tol = eight*eps*abs( d( jmax ) )
*
*     If the rank-1 modifier is small enough, no more needs to be done
*     except to reorganize Q so that its columns correspond with the
*     elements in D.
*
*     In that case K = 0 is returned.  PERM records the composed
*     permutation; for ICOMPQ = 1 the columns of Q are permuted into
*     Q2 and copied back into Q.
*
      IF( rho*abs( z( imax ) ).LE.tol ) THEN
         k = 0
         IF( icompq.EQ.0 ) THEN
            DO 50 j = 1, n
               perm( j ) = indxq( indx( j ) )
   50       CONTINUE
         ELSE
            DO 60 j = 1, n
               perm( j ) = indxq( indx( j ) )
               CALL scopy( qsiz, q( 1, perm( j ) ), 1, q2( 1, j ), 1 )
   60       CONTINUE
            CALL slacpy( 'A', qsiz, n, q2( 1, 1 ), ldq2, q( 1, 1 ),
     $                   ldq )
         END IF
         RETURN
      END IF
*
*     If there are multiple eigenvalues then the problem deflates.  Here
*     the number of equal eigenvalues are found.  As each equal
*     eigenvalue is found, a Givens rotation is computed to rotate
*     the corresponding eigensubspace so that the corresponding
*     components of Z are zero in this new basis.
*
*     First scan (loop 70): skip over leading entries whose Z component
*     is negligible, appending each to the deflated list, until the
*     first entry that is kept pending in JLAM.  If every entry is
*     deflated the scan jumps directly to label 110.
*
      k = 0
      k2 = n + 1
      DO 70 j = 1, n
         IF( rho*abs( z( j ) ).LE.tol ) THEN
*
*           Deflate due to small z component.
*
            k2 = k2 - 1
            indxp( k2 ) = j
            IF( j.EQ.n )
     $         GO TO 110
         ELSE
            jlam = j
            GO TO 80
         END IF
   70 CONTINUE
*
*     Main scan (label 80): advance J and compare entry J with the
*     pending entry JLAM.  The scan ends at label 100 once J exceeds N.
*
   80 CONTINUE
      j = j + 1
      IF( j.GT.n )
     $   GO TO 100
      IF( rho*abs( z( j ) ).LE.tol ) THEN
*
*        Deflate due to small z component.
*
         k2 = k2 - 1
         indxp( k2 ) = j
      ELSE
*
*        Check if eigenvalues are close enough to allow deflation.
*
         s = z( jlam )
         c = z( j )
*
*        Find sqrt(a**2+b**2) without overflow or
*        destructive underflow.
*
         tau = slapy2( c, s )
         t = d( j ) - d( jlam )
         c = c / tau
         s = -s / tau
         IF( abs( t*c*s ).LE.tol ) THEN
*
*           Deflation is possible.
*
            z( j ) = tau
            z( jlam ) = zero
*
*           Record the appropriate Givens rotation
*
*           The column indices are stored in terms of the original
*           ordering (through INDX and INDXQ); for ICOMPQ = 1 the
*           rotation is also applied to the two columns of Q.
*
            givptr = givptr + 1
            givcol( 1, givptr ) = indxq( indx( jlam ) )
            givcol( 2, givptr ) = indxq( indx( j ) )
            givnum( 1, givptr ) = c
            givnum( 2, givptr ) = s
            IF( icompq.EQ.1 ) THEN
               CALL srot( qsiz, q( 1, indxq( indx( jlam ) ) ), 1,
     $                    q( 1, indxq( indx( j ) ) ), 1, c, s )
            END IF
*
*           Update the two diagonal entries.  T is a temporary so that
*           D( JLAM ) is still the old value when D( J ) is formed.
*
            t = d( jlam )*c*c + d( j )*s*s
            d( j ) = d( jlam )*s*s + d( j )*c*c
            d( jlam ) = t
*
*           Insert JLAM into the deflated list INDXP( K2:N ).  While
*           D( JLAM ) is less than the D value of the next list entry,
*           that entry moves one slot towards the front and JLAM one
*           slot towards the back (loop at label 90).
*
            k2 = k2 - 1
            i = 1
   90       CONTINUE
            IF( k2+i.LE.n ) THEN
               IF( d( jlam ).LT.d( indxp( k2+i ) ) ) THEN
                  indxp( k2+i-1 ) = indxp( k2+i )
                  indxp( k2+i ) = jlam
                  i = i + 1
                  GO TO 90
               ELSE
                  indxp( k2+i-1 ) = jlam
               END IF
            ELSE
               indxp( k2+i-1 ) = jlam
            END IF
            jlam = j
         ELSE
*
*           No deflation: the pending entry JLAM is kept as the next
*           non-deflated value and entry J becomes the pending one.
*
            k = k + 1
            w( k ) = z( jlam )
            dlamda( k ) = d( jlam )
            indxp( k ) = jlam
            jlam = j
         END IF
      END IF
      GO TO 80
  100 CONTINUE
*
*     Record the last eigenvalue.
*
      k = k + 1
      w( k ) = z( jlam )
      dlamda( k ) = d( jlam )
      indxp( k ) = jlam
*
  110 CONTINUE
*
*     Sort the eigenvalues and corresponding eigenvectors into DLAMDA
*     and Q2 respectively.  The eigenvalues/vectors which were not
*     deflated go into the first K slots of DLAMDA and Q2 respectively,
*     while those which were deflated go into the last N - K slots.
*
*     PERM( J ) is the original column index of the J-th entry in this
*     final ordering.
*
      IF( icompq.EQ.0 ) THEN
         DO 120 j = 1, n
            jp = indxp( j )
            dlamda( j ) = d( jp )
            perm( j ) = indxq( indx( jp ) )
  120    CONTINUE
      ELSE
         DO 130 j = 1, n
            jp = indxp( j )
            dlamda( j ) = d( jp )
            perm( j ) = indxq( indx( jp ) )
            CALL scopy( qsiz, q( 1, perm( j ) ), 1, q2( 1, j ), 1 )
  130    CONTINUE
      END IF
*
*     The deflated eigenvalues and their corresponding vectors go back
*     into the last N - K slots of D and Q respectively.
*
*     D is updated identically in both branches; only the ICOMPQ = 1
*     branch also copies the trailing columns of Q2 back into Q.
*
      IF( k.LT.n ) THEN
         IF( icompq.EQ.0 ) THEN
            CALL scopy( n-k, dlamda( k+1 ), 1, d( k+1 ), 1 )
         ELSE
            CALL scopy( n-k, dlamda( k+1 ), 1, d( k+1 ), 1 )
            CALL slacpy( 'A', qsiz, n-k, q2( 1, k+1 ), ldq2,
     $                   q( 1, k+1 ), ldq )
         END IF
      END IF
*
      RETURN
*
*     End of SLAED8
*

◆ slaed9()

subroutine slaed9	(	integer	k,
		integer	kstart,
		integer	kstop,
		integer	n,
		real, dimension( * )	d,
		real, dimension( ldq, * )	q,
		integer	ldq,
		real	rho,
		real, dimension( * )	dlamda,
		real, dimension( * )	w,
		real, dimension( lds, * )	s,
		integer	lds,
		integer	info )

SLAED9 used by SSTEDC. Finds the roots of the secular equation and updates the eigenvectors. Used when the original matrix is dense.

Download SLAED9 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLAED9 finds the roots of the secular equation, as defined by the
!> values in D, Z, and RHO, between KSTART and KSTOP.  It makes the
!> appropriate calls to SLAED4 and then stores the new matrix of
!> eigenvectors for use in calculating the next level of Z vectors.
!>

Parameters

[in]	K	!> K is INTEGER !> The number of terms in the rational function to be solved by !> SLAED4. K >= 0. !>
[in]	KSTART	!> KSTART is INTEGER !>
[in]	KSTOP	!> KSTOP is INTEGER !> The updated eigenvalues Lambda(I), KSTART <= I <= KSTOP !> are to be computed. 1 <= KSTART <= KSTOP <= K. !>
[in]	N	!> N is INTEGER !> The number of rows and columns in the Q matrix. !> N >= K (deflation may result in N > K). !>
[out]	D	!> D is REAL array, dimension (N) !> D(I) contains the updated eigenvalues !> for KSTART <= I <= KSTOP. !>
[out]	Q	!> Q is REAL array, dimension (LDQ,N) !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max( 1, K ). !>
[in]	RHO	!> RHO is REAL !> The value of the parameter in the rank one update equation. !> RHO >= 0 required. !>
[in]	DLAMDA	!> DLAMDA is REAL array, dimension (K) !> The first K elements of this array contain the old roots !> of the deflated updating problem. These are the poles !> of the secular equation. !>
[in]	W	!> W is REAL array, dimension (K) !> The first K elements of this array contain the components !> of the deflation-adjusted updating vector. !>
[out]	S	!> S is REAL array, dimension (LDS, K) !> Will contain the eigenvectors of the repaired matrix which !> will be stored for subsequent Z vector calculation and !> multiplied by the previously accumulated eigenvectors !> to update the system. !>
[in]	LDS	!> LDS is INTEGER !> The leading dimension of S. LDS >= max( 1, K ). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: if INFO = 1, an eigenvalue did not converge !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA

Definition at line 154 of file slaed9.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     SLAED9 calls SLAED4 once for each root KSTART..KSTOP of the
*     K-term secular equation defined by DLAMDA, W and RHO, storing the
*     roots in D, and then forms normalized eigenvectors in S.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, KSTART, KSTOP, LDQ, LDS, N
      REAL               RHO
*     ..
*     .. Array Arguments ..
      REAL               D( * ), DLAMDA( * ), Q( LDQ, * ), S( LDS, * ),
     $                   W( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            I, J
      REAL               TEMP
*     ..
*     .. External Functions ..
      REAL               SLAMC3, SNRM2
      EXTERNAL           slamc3, snrm2
*     ..
*     .. External Subroutines ..
      EXTERNAL           scopy, slaed4, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, sign, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.  The INFO value is minus the position
*     of the offending argument in the argument list.
*
      info = 0
*
      IF( k.LT.0 ) THEN
         info = -1
      ELSE IF( kstart.LT.1 .OR. kstart.GT.max( 1, k ) ) THEN
         info = -2
      ELSE IF( max( 1, kstop ).LT.kstart .OR. kstop.GT.max( 1, k ) )
     $          THEN
         info = -3
      ELSE IF( n.LT.k ) THEN
         info = -4
      ELSE IF( ldq.LT.max( 1, k ) ) THEN
         info = -7
      ELSE IF( lds.LT.max( 1, k ) ) THEN
         info = -12
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SLAED9', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( k.EQ.0 )
     $   RETURN
*
*     Modify values DLAMDA(i) to make sure all DLAMDA(i)-DLAMDA(j) can
*     be computed with high relative accuracy (barring over/underflow).
*     This is a problem on machines without a guard digit in
*     add/subtract (Cray XMP, Cray YMP, Cray C 90 and Cray 2).
*     The following code replaces DLAMDA(I) by 2*DLAMDA(I)-DLAMDA(I),
*     which on any of these machines zeros out the bottommost
*     bit of DLAMDA(I) if it is 1; this makes the subsequent
*     subtractions DLAMDA(I)-DLAMDA(J) unproblematic when cancellation
*     occurs. On binary machines with a guard digit (almost all
*     machines) it does not change DLAMDA(I) at all. On hexadecimal
*     and decimal machines with a guard digit, it slightly
*     changes the bottommost bits of DLAMDA(I). It does not account
*     for hexadecimal or decimal machines without guard digits
*     (we know of none). We use a subroutine call to compute
*     2*DLAMBDA(I) to prevent optimizing compilers from eliminating
*     this code.
*
*     Only DLAMDA( 1:K ) is adjusted.  DLAMDA is documented with
*     dimension K, SLAED4 is called with problem size K, and the code
*     below references no entry beyond K, so looping to N (>= K) would
*     read and write outside the documented extent of the array.
*
      DO 10 i = 1, k
         dlamda( i ) = slamc3( dlamda( i ), dlamda( i ) ) - dlamda( i )
   10 CONTINUE
*
*     Solve for the requested roots.  Column J of Q receives the
*     vector output of SLAED4 for root J and D( J ) the root itself.
*
      DO 20 j = kstart, kstop
         CALL slaed4( k, j, dlamda, w, q( 1, j ), rho, d( j ), info )
*
*        If the zero finder fails, the computation is terminated.
*
         IF( info.NE.0 )
     $      GO TO 120
   20 CONTINUE
*
*     For K = 1 or K = 2 the leading K-by-K part of Q is copied to S
*     unchanged and the routine returns.
*
      IF( k.EQ.1 .OR. k.EQ.2 ) THEN
         DO 40 i = 1, k
            DO 30 j = 1, k
               s( j, i ) = q( j, i )
   30       CONTINUE
   40    CONTINUE
         GO TO 120
      END IF
*
*     Compute updated W.
*
*     The incoming W is saved in the first column of S; only its
*     signs are used again (loop 80).
*
      CALL scopy( k, w, 1, s, 1 )
*
*     Initialize W(I) = Q(I,I)
*
*     (a stride of LDQ+1 walks down the diagonal of Q)
*
      CALL scopy( k, q, ldq+1, w, 1 )
*
*     Multiply W( I ) by Q( I, J ) / ( DLAMDA( I )-DLAMDA( J ) ) for
*     every J different from I; the two inner loops skip I = J.
*
      DO 70 j = 1, k
         DO 50 i = 1, j - 1
            w( i ) = w( i )*( q( i, j ) / ( dlamda( i )-dlamda( j ) ) )
   50    CONTINUE
         DO 60 i = j + 1, k
            w( i ) = w( i )*( q( i, j ) / ( dlamda( i )-dlamda( j ) ) )
   60    CONTINUE
   70 CONTINUE
*
*     Take the square root of -W( I ) and give it the sign of the
*     saved original W( I ).
*
      DO 80 i = 1, k
         w( i ) = sign( sqrt( -w( i ) ), s( i, 1 ) )
   80 CONTINUE
*
*     Compute eigenvectors of the modified rank-1 modification.
*
*     Column J is W( I ) / Q( I, J ), normalized to unit 2-norm and
*     stored in S.
*
      DO 110 j = 1, k
         DO 90 i = 1, k
            q( i, j ) = w( i ) / q( i, j )
   90    CONTINUE
         temp = snrm2( k, q( 1, j ), 1 )
         DO 100 i = 1, k
            s( i, j ) = q( i, j ) / temp
  100    CONTINUE
  110 CONTINUE
*
  120 CONTINUE
      RETURN
*
*     End of SLAED9
*

◆ slaeda()

subroutine slaeda	(	integer	n,
		integer	tlvls,
		integer	curlvl,
		integer	curpbm,
		integer, dimension( * )	prmptr,
		integer, dimension( * )	perm,
		integer, dimension( * )	givptr,
		integer, dimension( 2, * )	givcol,
		real, dimension( 2, * )	givnum,
		real, dimension( * )	q,
		integer, dimension( * )	qptr,
		real, dimension( * )	z,
		real, dimension( * )	ztemp,
		integer	info )

SLAEDA used by SSTEDC. Computes the Z vector determining the rank-one modification of the diagonal matrix. Used when the original matrix is dense.

Download SLAEDA + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLAEDA computes the Z vector corresponding to the merge step in the
!> CURLVLth step of the merge process with TLVLS steps for the CURPBMth
!> problem.
!>

Parameters

[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in]	TLVLS	!> TLVLS is INTEGER !> The total number of merging levels in the overall divide and !> conquer tree. !>
[in]	CURLVL	!> CURLVL is INTEGER !> The current level in the overall merge routine, !> 0 <= curlvl <= tlvls. !>
[in]	CURPBM	!> CURPBM is INTEGER !> The current problem in the current level in the overall !> merge routine (counting from upper left to lower right). !>
[in]	PRMPTR	!> PRMPTR is INTEGER array, dimension (N lg N) !> Contains a list of pointers which indicate where in PERM a !> level's permutation is stored. PRMPTR(i+1) - PRMPTR(i) !> indicates the size of the permutation and incidentally the !> size of the full, non-deflated problem. !>
[in]	PERM	!> PERM is INTEGER array, dimension (N lg N) !> Contains the permutations (from deflation and sorting) to be !> applied to each eigenblock. !>
[in]	GIVPTR	!> GIVPTR is INTEGER array, dimension (N lg N) !> Contains a list of pointers which indicate where in GIVCOL a !> level's Givens rotations are stored. GIVPTR(i+1) - GIVPTR(i) !> indicates the number of Givens rotations. !>
[in]	GIVCOL	!> GIVCOL is INTEGER array, dimension (2, N lg N) !> Each pair of numbers indicates a pair of columns to take place !> in a Givens rotation. !>
[in]	GIVNUM	!> GIVNUM is REAL array, dimension (2, N lg N) !> Each number indicates the S value to be used in the !> corresponding Givens rotation. !>
[in]	Q	!> Q is REAL array, dimension (N**2) !> Contains the square eigenblocks from previous levels, the !> starting positions for blocks are given by QPTR. !>
[in]	QPTR	!> QPTR is INTEGER array, dimension (N+2) !> Contains a list of pointers which indicate where in Q an !> eigenblock is stored. SQRT( QPTR(i+1) - QPTR(i) ) indicates !> the size of the block. !>
[out]	Z	!> Z is REAL array, dimension (N) !> On output this vector contains the updating vector (the last !> row of the first sub-eigenvector matrix and the first row of !> the second sub-eigenvector matrix). !>
[out]	ZTEMP	!> ZTEMP is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA

Definition at line 164 of file slaeda.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     SLAEDA assembles the updating vector Z for one merge step from
*     the stored eigenblocks, Givens rotations and permutations of the
*     levels below it.
*
*     .. Scalar Arguments ..
      INTEGER            CURLVL, CURPBM, INFO, N, TLVLS
*     ..
*     .. Array Arguments ..
      INTEGER            GIVCOL( 2, * ), GIVPTR( * ), PERM( * ),
     $                   PRMPTR( * ), QPTR( * )
      REAL               GIVNUM( 2, * ), Q( * ), Z( * ), ZTEMP( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, HALF, ONE
      parameter( zero = 0.0e0, half = 0.5e0, one = 1.0e0 )
*     ..
*     .. Local Scalars ..
*
*     BASE  first slot of the current level in the pointer arrays
*     NODE  slot of the left-hand block of the pair being processed
*     NB1, NB2  orders of the left/right eigenblocks stored in Q
*     NP1, NP2  lengths of the left/right permutations
*     MID   position in Z of the first entry of the right-hand part
*     ZOFF  position in Z of the first entry of the left-hand part
*
      INTEGER            BASE, I, LVL, MID, NB1, NB2, NODE, NP1, NP2,
     $                   ZOFF
*     ..
*     .. External Subroutines ..
      EXTERNAL           scopy, sgemv, srot, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          int, real, sqrt
*     ..
*     .. Executable Statements ..
*
*     Argument check: N is the only argument that is validated.
*
      info = 0
      IF( n.LT.0 ) THEN
         info = -1
         CALL xerbla( 'SLAEDA', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty problem.
*
      IF( n.EQ.0 )
     $   RETURN
*
*     First position of the second half.
*
      mid = n / 2 + 1
*
*     Slot of the lowest-level subproblem in the full storage scheme
*     (the lowest level starts at slot 1).
*
      node = curpbm*2**curlvl + 2**( curlvl-1 )
*
*     Block orders are recovered from the QPTR differences.  HALF is
*     added before truncation in case SQRT slightly underestimates.
*
      nb1 = int( half+sqrt( real( qptr( node+1 )-qptr( node ) ) ) )
      nb2 = int( half+sqrt( real( qptr( node+2 )-qptr( node+1 ) ) ) )
*
*     Build the initial Z: zeros, then the last row of the left block,
*     then the first row of the right block, then zeros.
*
      DO i = 1, mid - nb1 - 1
         z( i ) = zero
      END DO
      CALL scopy( nb1, q( qptr( node )+nb1-1 ), nb1, z( mid-nb1 ), 1 )
      CALL scopy( nb2, q( qptr( node+1 ) ), nb2, z( mid ), 1 )
      DO i = mid + nb2, n
         z( i ) = zero
      END DO
*
*     Walk through the remaining levels 1 .. CURLVL-1.  At each level
*     the stored Givens rotations and permutations are applied to Z
*     and the result is multiplied by the transposed eigenblocks.
*
      base = 2**tlvls + 1
      DO lvl = 1, curlvl - 1
         node = base + curpbm*2**( curlvl-lvl ) +
     $          2**( curlvl-lvl-1 ) - 1
         np1 = prmptr( node+1 ) - prmptr( node )
         np2 = prmptr( node+2 ) - prmptr( node+1 )
         zoff = mid - np1
*
*        Givens rotations of the left block, then of the right block.
*
         DO i = givptr( node ), givptr( node+1 ) - 1
            CALL srot( 1, z( zoff+givcol( 1, i )-1 ), 1,
     $                 z( zoff+givcol( 2, i )-1 ), 1, givnum( 1, i ),
     $                 givnum( 2, i ) )
         END DO
         DO i = givptr( node+1 ), givptr( node+2 ) - 1
            CALL srot( 1, z( mid-1+givcol( 1, i ) ), 1,
     $                 z( mid-1+givcol( 2, i ) ), 1, givnum( 1, i ),
     $                 givnum( 2, i ) )
         END DO
*
*        Gather the permuted entries of both parts into ZTEMP.
*
         DO i = 1, np1
            ztemp( i ) = z( zoff+perm( prmptr( node )+i-1 )-1 )
         END DO
         DO i = 1, np2
            ztemp( np1+i ) = z( mid+perm( prmptr( node+1 )+i-1 )-1 )
         END DO
*
*        Orders of the two eigenblocks at this level (HALF guards
*        against an underestimated square root, as above).
*
         nb1 = int( half+sqrt( real( qptr( node+1 )-
     $         qptr( node ) ) ) )
         nb2 = int( half+sqrt( real( qptr( node+2 )-
     $         qptr( node+1 ) ) ) )
*
*        The leading NB entries of each part are multiplied by the
*        transposed block; the remaining entries are copied unchanged.
*
         IF( nb1.GT.0 ) THEN
            CALL sgemv( 'T', nb1, nb1, one, q( qptr( node ) ), nb1,
     $                  ztemp( 1 ), 1, zero, z( zoff ), 1 )
         END IF
         CALL scopy( np1-nb1, ztemp( nb1+1 ), 1, z( zoff+nb1 ), 1 )
         IF( nb2.GT.0 ) THEN
            CALL sgemv( 'T', nb2, nb2, one, q( qptr( node+1 ) ), nb2,
     $                  ztemp( np1+1 ), 1, zero, z( mid ), 1 )
         END IF
         CALL scopy( np2-nb2, ztemp( np1+nb2+1 ), 1, z( mid+nb2 ), 1 )
*
*        Advance to the first slot of the next level.
*
         base = base + 2**( tlvls-lvl )
      END DO
*
      RETURN
*
*     End of SLAEDA
*

◆ slagtf()

subroutine slagtf	(	integer	n,
		real, dimension( * )	a,
		real	lambda,
		real, dimension( * )	b,
		real, dimension( * )	c,
		real	tol,
		real, dimension( * )	d,
		integer, dimension( * )	in,
		integer	info )

SLAGTF computes an LU factorization of a matrix T-λI, where T is a general tridiagonal matrix, and λ a scalar, using partial pivoting with row interchanges.

Download SLAGTF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLAGTF factorizes the matrix (T - lambda*I), where T is an n by n
!> tridiagonal matrix and lambda is a scalar, as
!>
!>    T - lambda*I = PLU,
!>
!> where P is a permutation matrix, L is a unit lower tridiagonal matrix
!> with at most one non-zero sub-diagonal element per column and U is
!> an upper triangular matrix with at most two non-zero super-diagonal
!> elements per column.
!>
!> The factorization is obtained by Gaussian elimination with partial
!> pivoting and implicit row scaling.
!>
!> The parameter LAMBDA is included in the routine so that SLAGTF may
!> be used, in conjunction with SLAGTS, to obtain eigenvectors of T by
!> inverse iteration.
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the matrix T. !>
[in,out]	A	!> A is REAL array, dimension (N) !> On entry, A must contain the diagonal elements of T. !> !> On exit, A is overwritten by the n diagonal elements of the !> upper triangular matrix U of the factorization of T. !>
[in]	LAMBDA	!> LAMBDA is REAL !> On entry, the scalar lambda. !>
[in,out]	B	!> B is REAL array, dimension (N-1) !> On entry, B must contain the (n-1) super-diagonal elements of !> T. !> !> On exit, B is overwritten by the (n-1) super-diagonal !> elements of the matrix U of the factorization of T. !>
[in,out]	C	!> C is REAL array, dimension (N-1) !> On entry, C must contain the (n-1) sub-diagonal elements of !> T. !> !> On exit, C is overwritten by the (n-1) sub-diagonal elements !> of the matrix L of the factorization of T. !>
[in]	TOL	!> TOL is REAL !> On entry, a relative tolerance used to indicate whether or !> not the matrix (T - lambda*I) is nearly singular. TOL should !> normally be chosen as approximately the largest relative error !> in the elements of T. For example, if the elements of T are !> correct to about 4 significant figures, then TOL should be !> set to about 5*10**(-4). If TOL is supplied as less than eps, !> where eps is the relative machine precision, then the value !> eps is used in place of TOL. !>
[out]	D	!> D is REAL array, dimension (N-2) !> On exit, D is overwritten by the (n-2) second super-diagonal !> elements of the matrix U of the factorization of T. !>
[out]	IN	!> IN is INTEGER array, dimension (N) !> On exit, IN contains details of the permutation matrix P. If !> an interchange occurred at the kth step of the elimination, !> then IN(k) = 1, otherwise IN(k) = 0. The element IN(n) !> returns the smallest positive integer j such that !> !> abs( u(j,j) ) <= norm( (T - lambda*I)(j) )*TOL, !> !> where norm( A(j) ) denotes the sum of the absolute values of !> the jth row of the matrix A. If no such j exists then IN(n) !> is returned as zero. If IN(n) is returned as positive, then a !> diagonal element of U is small, indicating that !> (T - lambda*I) is singular or nearly singular. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -k, the kth argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 155 of file slagtf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     SLAGTF factorizes T - lambda*I in place for a tridiagonal T
*     (diagonal A, super-diagonal B, sub-diagonal C) by elimination
*     with row interchanges chosen on row-scaled pivot sizes.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, N
      REAL               LAMBDA, TOL
*     ..
*     .. Array Arguments ..
      INTEGER            IN( * )
      REAL               A( * ), B( * ), C( * ), D( * )
*     ..
*
* =====================================================================
*
*     .. Parameters ..
      REAL               ZERO
      parameter( zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
*
*     INNER   true while step K is not the last elimination step
*     SWAP    true when rows K and K+1 are interchanged at step K
*     SCUR    sum of absolute values used to scale the current row
*     SNXT    the same sum for row K+1
*     PDIAG   scaled size of the diagonal pivot candidate
*     PSUB    scaled size of the sub-diagonal pivot candidate
*     FACT    elimination multiplier in the interchange case
*     ANXT    saved value of A( K+1 ) in the interchange case
*     THRESH  effective tolerance, max( TOL, machine epsilon )
*
      LOGICAL            INNER, SWAP
      INTEGER            K
      REAL               ANXT, FACT, PDIAG, PSUB, SCUR, SNXT, THRESH
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max
*     ..
*     .. External Functions ..
      REAL               SLAMCH
      EXTERNAL           slamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Executable Statements ..
*
*     Argument check and trivial sizes.
*
      info = 0
      IF( n.LT.0 ) THEN
         info = -1
         CALL xerbla( 'SLAGTF', -info )
         RETURN
      END IF
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Shift the first diagonal entry; IN( N ) = 0 means that no small
*     pivot has been detected so far.
*
      a( 1 ) = a( 1 ) - lambda
      in( n ) = 0
      IF( n.EQ.1 ) THEN
         IF( a( 1 ).EQ.zero )
     $      in( 1 ) = 1
         RETURN
      END IF
*
      thresh = max( tol, slamch( 'Epsilon' ) )
      scur = abs( a( 1 ) ) + abs( b( 1 ) )
*
      DO k = 1, n - 1
         inner = k.LT.( n-1 )
*
*        Shift the next diagonal entry and form the scale of row K+1.
*
         a( k+1 ) = a( k+1 ) - lambda
         snxt = abs( c( k ) ) + abs( a( k+1 ) )
         IF( inner )
     $      snxt = snxt + abs( b( k+1 ) )
*
*        Scaled sizes of the two pivot candidates; a zero entry gives
*        a zero size without dividing.
*
         pdiag = zero
         IF( a( k ).NE.zero )
     $      pdiag = abs( a( k ) ) / scur
         psub = zero
         swap = .false.
         IF( c( k ).NE.zero ) THEN
            psub = abs( c( k ) ) / snxt
            swap = .NOT.( psub.LE.pdiag )
         END IF
*
         IF( swap ) THEN
*
*           Interchange rows K and K+1, then eliminate.  The old
*           B( K+1 ) becomes the second super-diagonal entry D( K ).
*
            in( k ) = 1
            fact = a( k ) / c( k )
            a( k ) = c( k )
            anxt = a( k+1 )
            a( k+1 ) = b( k ) - fact*anxt
            IF( inner ) THEN
               d( k ) = b( k+1 )
               b( k+1 ) = -fact*d( k )
            END IF
            b( k ) = anxt
            c( k ) = fact
         ELSE
*
*           No interchange.  Row K+1 becomes the current row for the
*           scaling; elimination is needed only if C( K ) is nonzero.
*
            in( k ) = 0
            scur = snxt
            IF( c( k ).NE.zero ) THEN
               c( k ) = c( k ) / a( k )
               a( k+1 ) = a( k+1 ) - c( k )*b( k )
            END IF
            IF( inner )
     $         d( k ) = zero
         END IF
*
*        Record the first step at which both candidates are small.
*
         IF( in( n ).EQ.0 ) THEN
            IF( max( pdiag, psub ).LE.thresh )
     $         in( n ) = k
         END IF
      END DO
*
*     Test the last diagonal entry if nothing was flagged earlier.
*
      IF( in( n ).EQ.0 ) THEN
         IF( abs( a( n ) ).LE.scur*thresh )
     $      in( n ) = n
      END IF
*
      RETURN
*
*     End of SLAGTF
*

◆ slamrg()

subroutine slamrg	(	integer	n1,
		integer	n2,
		real, dimension( * )	a,
		integer	strd1,
		integer	strd2,
		integer, dimension( * )	index )

SLAMRG creates a permutation list to merge the entries of two independently sorted sets into a single set sorted in ascending order.

Download SLAMRG + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLAMRG will create a permutation list which will merge the elements
!> of A (which is composed of two independently sorted sets) into a
!> single set which is sorted in ascending order.
!>

Parameters

[in]	N1	!> N1 is INTEGER !>
[in]	N2	!> N2 is INTEGER !> These arguments contain the respective lengths of the two !> sorted lists to be merged. !>
[in]	A	!> A is REAL array, dimension (N1+N2) !> The first N1 elements of A contain a list of numbers which !> are sorted in either ascending or descending order. Likewise !> for the final N2 elements. !>
[in]	STRD1	!> STRD1 is INTEGER !>
[in]	STRD2	!> STRD2 is INTEGER !> These are the strides to be taken through the array A. !> Allowable strides are 1 and -1. They indicate whether a !> subset of A is sorted in ascending (STRDx = 1) or descending !> (STRDx = -1) order. !>
[out]	INDEX	!> INDEX is INTEGER array, dimension (N1+N2) !> On exit this array will contain a permutation such that !> if B( I ) = A( INDEX( I ) ) for I=1,N1+N2, then B will be !> sorted in ascending order. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 98 of file slamrg.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of SLAMRG: two-way merge of the sublists A(1:N1) and
*     A(N1+1:N1+N2), writing positions in A (not values) to INDEX.
*
*     .. Scalar Arguments ..
      INTEGER            N1, N2, STRD1, STRD2
*     ..
*     .. Array Arguments ..
      INTEGER            INDEX( * )
      REAL               A( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            J, LEFT1, LEFT2, NOUT, POS1, POS2
*     ..
*     .. Executable Statements ..
*
*     LEFT1 and LEFT2 count the entries of each sublist that have not
*     yet been written to INDEX.
*
      left1 = n1
      left2 = n2
*
*     POS1 and POS2 are the read positions.  A sublist with a
*     positive stride is read from its first entry, otherwise from
*     its last entry.
*
      pos1 = n1
      IF( strd1.GT.0 )
     $   pos1 = 1
      pos2 = n1 + n2
      IF( strd2.GT.0 )
     $   pos2 = 1 + n1
*
*     NOUT is the number of entries of INDEX written so far.
*
      nout = 0
*
*     Merge while both sublists still have entries.  On a tie the
*     entry of the first sublist is taken.
*
      DO WHILE( left1.GT.0 .AND. left2.GT.0 )
         nout = nout + 1
         IF( a( pos1 ).LE.a( pos2 ) ) THEN
            index( nout ) = pos1
            pos1 = pos1 + strd1
            left1 = left1 - 1
         ELSE
            index( nout ) = pos2
            pos2 = pos2 + strd2
            left2 = left2 - 1
         END IF
      END DO
*
*     At most one sublist has entries left; append its remaining
*     positions in reading order.
*
      IF( left1.EQ.0 ) THEN
         DO j = 1, left2
            index( nout+j ) = pos2 + ( j-1 )*strd2
         END DO
      ELSE
         DO j = 1, left1
            index( nout+j ) = pos1 + ( j-1 )*strd1
         END DO
      END IF
*
      RETURN
*
*     End of SLAMRG
*

◆ slartgs()

subroutine slartgs	(	real	x,
		real	y,
		real	sigma,
		real	cs,
		real	sn )

SLARTGS generates a plane rotation designed to introduce a bulge in implicit QR iteration for the bidiagonal SVD problem.

Download SLARTGS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLARTGS generates a plane rotation designed to introduce a bulge in
!> Golub-Reinsch-style implicit QR iteration for the bidiagonal SVD
!> problem. X and Y are the top-row entries, and SIGMA is the shift.
!> The computed CS and SN define a plane rotation satisfying
!>
!>    [  CS  SN  ]  .  [ X^2 - SIGMA^2 ]  =  [ R ],
!>    [ -SN  CS  ]     [     X * Y     ]     [ 0 ]
!>
!> with R nonnegative.  If X^2 - SIGMA^2 and X * Y are 0, then the
!> rotation is by PI/2.
!>

Parameters

[in]	X	!> X is REAL !> The (1,1) entry of an upper bidiagonal matrix. !>
[in]	Y	!> Y is REAL !> The (1,2) entry of an upper bidiagonal matrix. !>
[in]	SIGMA	!> SIGMA is REAL !> The shift. !>
[out]	CS	!> CS is REAL !> The cosine of the rotation. !>
[out]	SN	!> SN is REAL !> The sine of the rotation. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 89 of file slartgs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of SLARTGS.  A two-vector (Z, W) is formed from X, Y and
*     SIGMA and handed to SLARTGP, which returns the rotation in
*     CS and SN.
*
*     .. Scalar Arguments ..
      REAL                    CS, SIGMA, SN, X, Y
*     ..
*
*  ===================================================================
*
*     .. Parameters ..
      REAL                    NEGONE, ONE, ZERO
      parameter( negone = -1.0e0, one = 1.0e0, zero = 0.0e0 )
*     ..
*     .. Local Scalars ..
      REAL                    R, S, THRESH, W, Z
*     ..
*     .. External Subroutines ..
      EXTERNAL           slartgp
*     ..
*     .. External Functions ..
      REAL                    SLAMCH
      EXTERNAL           slamch
*     .. Executable Statements ..
*
*     THRESH is the value SLAMCH returns for 'E'; ABS(X) below it is
*     treated as zero.  (Presumably the machine epsilon - confirm
*     against SLAMCH.)
*
      thresh = slamch('E')
*
*     Compute the first column of B**T*B - SIGMA^2*I, up to a scale
*     factor.
*
*     In the general (last) branch S is the sign of X, so that
*        Z = ( X**2 - SIGMA**2 ) / ABS( X ),   W = X*Y / ABS( X ),
*     i.e. the scale factor is 1 / ABS( X ).  The earlier branches are
*     the special cases: both components zero, SIGMA = 0, and
*     negligible X (where Z = -SIGMA**2 and W = 0 are not rescaled).
*
      IF( (sigma .EQ. zero .AND. abs(x) .LT. thresh) .OR.
     $          (abs(x) .EQ. sigma .AND. y .EQ. zero) ) THEN
         z = zero
         w = zero
      ELSE IF( sigma .EQ. zero ) THEN
         IF( x .GE. zero ) THEN
            z = x
            w = y
         ELSE
            z = -x
            w = -y
         END IF
      ELSE IF( abs(x) .LT. thresh ) THEN
         z = -sigma*sigma
         w = zero
      ELSE
         IF( x .GE. zero ) THEN
            s = one
         ELSE
            s = negone
         END IF
         z = s * (abs(x)-sigma) * (s+sigma/x)
         w = s * y
      END IF
*
*     Generate the rotation.
*     CALL SLARTGP( Z, W, CS, SN, R ) might seem more natural;
*     reordering the arguments ensures that if Z = 0 then the rotation
*     is by PI/2.
*
*     R is returned by SLARTGP but is not used afterwards.
*
      CALL slartgp( w, z, sn, cs, r )
*
      RETURN
*
*     End SLARTGS
*

◆ slasq1()

subroutine slasq1	(	integer	n,
		real, dimension( * )	d,
		real, dimension( * )	e,
		real, dimension( * )	work,
		integer	info )

SLASQ1 computes the singular values of a real square bidiagonal matrix. Used by sbdsqr.

Download SLASQ1 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLASQ1 computes the singular values of a real N-by-N bidiagonal
!> matrix with diagonal D and off-diagonal E. The singular values
!> are computed to high relative accuracy, in the absence of
!> denormalization, underflow and overflow. The algorithm was first
!> presented in
!>
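!>  "Accurate singular values and differential qd algorithms" by K. V.
!> Fernando and B. N. Parlett, Numer. Math., Vol-67, No. 2, pp. 191-230,
!> 1994,
!>
!> and the present implementation is described in "An implementation of
!> the dqds Algorithm (Positive Case)", LAPACK Working Note.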
!>

Parameters

[in]	N	!> N is INTEGER !> The number of rows and columns in the matrix. N >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, D contains the diagonal elements of the !> bidiagonal matrix whose SVD is desired. On normal exit, !> D contains the singular values in decreasing order. !>
[in,out]	E	!> E is REAL array, dimension (N) !> On entry, elements E(1:N-1) contain the off-diagonal elements !> of the bidiagonal matrix whose SVD is desired. !> On exit, E is overwritten. !>
[out]	WORK	!> WORK is REAL array, dimension (4*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: the algorithm failed !> = 1, a split was marked by a positive value in E !> = 2, current block of Z not diagonalized after 100*N !> iterations (in inner while loop) On exit D and E !> represent a matrix with the same singular values !> which the calling subroutine could use to finish the !> computation, or even feed back into SLASQ1 !> = 3, termination criterion of outer while loop not met !> (program created more than N unreduced blocks) !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 107 of file slasq1.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of SLASQ1: small orders are handled directly; otherwise
*     D and E are interleaved into WORK, scaled, squared and passed
*     to SLASQ2, and the results are converted back.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      REAL               D( * ), E( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO
      parameter( zero = 0.0e0 )
*     ..
*     .. Local Scalars ..
      INTEGER            IERR, J
      REAL               BIGSV, SCLFAC, SFMIN, SMLSV, ULP
*     ..
*     .. External Subroutines ..
      EXTERNAL           scopy, slas2, slascl, slasq2, slasrt, xerbla
*     ..
*     .. External Functions ..
      REAL               SLAMCH
      EXTERNAL           slamch
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, sqrt
*     ..
*     .. Executable Statements ..
*
      info = 0
*
*     Reject a negative order (argument 1).
*
      IF( n.LT.0 ) THEN
         info = -1
         CALL xerbla( 'SLASQ1', -info )
         RETURN
      END IF
*
*     Orders 0, 1 and 2 need no iteration.
*
      IF( n.EQ.0 )
     $   RETURN
      IF( n.EQ.1 ) THEN
         d( 1 ) = abs( d( 1 ) )
         RETURN
      END IF
      IF( n.EQ.2 ) THEN
         CALL slas2( d( 1 ), e( 1 ), d( 2 ), smlsv, bigsv )
         d( 1 ) = bigsv
         d( 2 ) = smlsv
         RETURN
      END IF
*
*     Make D nonnegative and collect the largest ABS( E( J ) ) in
*     BIGSV.
*
      bigsv = zero
      DO j = 1, n - 1
         d( j ) = abs( d( j ) )
         bigsv = max( bigsv, abs( e( j ) ) )
      END DO
      d( n ) = abs( d( n ) )
*
*     All off-diagonals zero: the matrix is already diagonal, so
*     sorting D in decreasing order is all that is left.
*
      IF( bigsv.EQ.zero ) THEN
         CALL slasrt( 'D', n, d, ierr )
         RETURN
      END IF
*
*     Extend BIGSV to the largest entry of D and E together.
*
      DO j = 1, n
         bigsv = max( bigsv, d( j ) )
      END DO
*
*     Interleave D (odd slots) and E (even slots) in WORK and rescale
*     from BIGSV to SCLFAC before squaring.
*
      ulp = slamch( 'Precision' )
      sfmin = slamch( 'Safe minimum' )
      sclfac = sqrt( ulp / sfmin )
      CALL scopy( n, d, 1, work( 1 ), 2 )
      CALL scopy( n-1, e, 1, work( 2 ), 2 )
      CALL slascl( 'G', 0, 0, bigsv, sclfac, 2*n-1, 1, work, 2*n-1,
     $             ierr )
*
*     Square the entries to obtain the q's and e's; the last slot
*     is set to zero.
*
      DO j = 1, 2*n - 1
         work( j ) = work( j )**2
      END DO
      work( 2*n ) = zero
*
      CALL slasq2( n, work, info )
*
      IF( info.EQ.2 ) THEN
*
*        Iteration limit reached in SLASQ2.  Hand the current data
*        back through D and E, undoing the squaring and the scaling,
*        so that the caller can continue from it.
*
         DO j = 1, n
            d( j ) = sqrt( work( 2*j-1 ) )
            e( j ) = sqrt( work( 2*j ) )
         END DO
         CALL slascl( 'G', 0, 0, sclfac, bigsv, n, 1, d, n, ierr )
         CALL slascl( 'G', 0, 0, sclfac, bigsv, n, 1, e, n, ierr )
      ELSE IF( info.EQ.0 ) THEN
*
*        Success: take square roots of the leading N entries of WORK
*        and undo the scaling.
*
         DO j = 1, n
            d( j ) = sqrt( work( j ) )
         END DO
         CALL slascl( 'G', 0, 0, sclfac, bigsv, n, 1, d, n, ierr )
      END IF
*
      RETURN
*
*     End of SLASQ1
*

◆ slasq2()

subroutine slasq2	(	integer	n,
		real, dimension( * )	z,
		integer	info )

SLASQ2 computes all the eigenvalues of the symmetric positive definite tridiagonal matrix associated with the qd Array Z to high relative accuracy. Used by sbdsqr and sstegr.

Download SLASQ2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLASQ2 computes all the eigenvalues of the symmetric positive
!> definite tridiagonal matrix associated with the qd array Z to high
!> relative accuracy, in the absence of denormalization, underflow
!> and overflow.
!>
!> To see the relation of Z to the tridiagonal matrix, let L be a
!> unit lower bidiagonal matrix with subdiagonals Z(2,4,6,...) and
!> let U be an upper bidiagonal matrix with 1's above and diagonal
!> Z(1,3,5,...). The tridiagonal is L*U or, if you prefer, the
!> symmetric tridiagonal to which it is similar.
!>
!> Note : SLASQ2 defines a logical variable, IEEE, which is true
!> on machines which follow ieee-754 floating-point standard in their
!> handling of infinities and NaNs, and false otherwise. This variable
!> is passed to SLASQ3.
!>

Parameters

[in]

N

!>          N is INTEGER
!>        The number of rows and columns in the matrix. N >= 0.
!>

[in,out]

Z

!>          Z is REAL array, dimension ( 4*N )
!>        On entry Z holds the qd array. On exit, entries 1 to N hold
!>        the eigenvalues in decreasing order, Z( 2*N+1 ) holds the
!>        trace, and Z( 2*N+2 ) holds the sum of the eigenvalues. If
!>        N > 2, then Z( 2*N+3 ) holds the iteration count, Z( 2*N+4 )
!>        holds NDIVS/NIN^2, and Z( 2*N+5 ) holds the percentage of
!>        shifts that failed.
!>

[out]

INFO

!>          INFO is INTEGER
!>        = 0: successful exit
!>        < 0: if the i-th argument is a scalar and had an illegal
!>             value, then INFO = -i, if the i-th argument is an
!>             array and the j-entry had an illegal value, then
!>             INFO = -(i*100+j)
!>        > 0: the algorithm failed
!>              = 1, a split was marked by a positive value in E
!>              = 2, current block of Z not diagonalized after 100*N
!>                   iterations (in inner while loop).  On exit Z holds
!>                   a qd array with the same eigenvalues as the given Z.
!>              = 3, termination criterion of outer while loop not met
!>                   (program created more than N unreduced blocks)
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  Local Variables: I0:N0 defines a current unreduced segment of Z.
!>  The shifts are accumulated in SIGMA. Iteration count is in ITER.
!>  Ping-pong is controlled by PP (alternates between 0 and 1).
!>

Definition at line 111 of file slasq2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of SLASQ2.  Outline:
*       1. validate N and the sign of the qd data, handling N = 0, 1
*          and 2 directly;
*       2. spread Z to the 4-entries-per-index layout and run two
*          initial dqd passes with split checking;
*       3. repeatedly isolate the last unreduced segment I0:N0 and
*          call SLASQ3 on it until N0 < 1;
*       4. gather the q's to the front of Z, sort them and store the
*          trace, the sum and the performance counters.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      REAL               Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               CBIAS
      parameter( cbias = 1.50e0 )
      REAL               ZERO, HALF, ONE, TWO, FOUR, HUNDRD
      parameter( zero = 0.0e0, half = 0.5e0, one = 1.0e0,
     $                     two = 2.0e0, four = 4.0e0, hundrd = 100.0e0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            IEEE
      INTEGER            I0, I4, IINFO, IPN4, ITER, IWHILA, IWHILB, K,
     $                   KMIN, N0, NBIG, NDIV, NFAIL, PP, SPLT, TTYPE,
     $                   I1, N1
      REAL               D, DEE, DEEMIN, DESIG, DMIN, DMIN1, DMIN2, DN,
     $                   DN1, DN2, E, EMAX, EMIN, EPS, G, OLDEMN, QMAX,
     $                   QMIN, S, SAFMIN, SIGMA, T, TAU, TEMP, TOL,
     $                   TOL2, TRACE, ZMAX, TEMPE, TEMPQ
*     ..
*     .. External Subroutines ..
      EXTERNAL           slasq3, slasrt, xerbla
*     ..
*     .. External Functions ..
      REAL               SLAMCH
      EXTERNAL           slamch
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, real, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments.
*     (in case SLASQ2 is not called by SLASQ1)
*
*     TOL2 = ( 100*EPS )**2 is the relative threshold used by every
*     negligibility test in this routine.
*
      info = 0
      eps = slamch( 'Precision' )
      safmin = slamch( 'Safe minimum' )
      tol = eps*hundrd
      tol2 = tol**2
*
      IF( n.LT.0 ) THEN
         info = -1
         CALL xerbla( 'SLASQ2', 1 )
         RETURN
      ELSE IF( n.EQ.0 ) THEN
         RETURN
      ELSE IF( n.EQ.1 ) THEN
*
*        1-by-1 case.
*
*        Only the sign of Z(1) is checked; Z is not modified.
*
         IF( z( 1 ).LT.zero ) THEN
            info = -201
            CALL xerbla( 'SLASQ2', 2 )
         END IF
         RETURN
      ELSE IF( n.EQ.2 ) THEN
*
*        2-by-2 case.
*
*        Reject negative data (INFO = -(200+j) for entry j), then
*        order the two q's so that Z(1) >= Z(3).
*
         IF( z( 1 ).LT.zero ) THEN
            info = -201
            CALL xerbla( 'SLASQ2', 2 )
            RETURN
         ELSE IF( z( 2 ).LT.zero ) THEN
            info = -202
            CALL xerbla( 'SLASQ2', 2 )
            RETURN
         ELSE IF( z( 3 ).LT.zero ) THEN
           info = -203
           CALL xerbla( 'SLASQ2', 2 )
           RETURN
         ELSE IF( z( 3 ).GT.z( 1 ) ) THEN
            d = z( 3 )
            z( 3 ) = z( 1 )
            z( 1 ) = d
         END IF
*
*        Z(5) is slot 2*N+1: the sum of the three input entries.
*
         z( 5 ) = z( 1 ) + z( 2 ) + z( 3 )
*
*        The update below is applied only when Z(2) is not
*        negligible relative to Z(3); it overwrites Z(1) and Z(3).
*
         IF( z( 2 ).GT.z( 3 )*tol2 ) THEN
            t = half*( ( z( 1 )-z( 3 ) )+z( 2 ) )
            s = z( 3 )*( z( 2 ) / t )
            IF( s.LE.t ) THEN
               s = z( 3 )*( z( 2 ) / ( t*( one+sqrt( one+s / t ) ) ) )
            ELSE
               s = z( 3 )*( z( 2 ) / ( t+sqrt( t )*sqrt( t+s ) ) )
            END IF
            t = z( 1 ) + ( s+z( 2 ) )
            z( 3 ) = z( 3 )*( z( 1 ) / t )
            z( 1 ) = t
         END IF
*
*        Results go to Z(1:2); Z(6) is slot 2*N+2, their sum.
*
         z( 2 ) = z( 3 )
         z( 6 ) = z( 2 ) + z( 1 )
         RETURN
      END IF
*
*     Check for negative data and compute sums of q's and e's.
*
*     On entry the odd entries of Z are summed into D and the even
*     entries into E.  QMAX, EMIN and ZMAX track the largest odd
*     entry, the smallest even entry and the largest entry overall.
*
      z( 2*n ) = zero
      emin = z( 2 )
      qmax = zero
      zmax = zero
      d = zero
      e = zero
*
      DO 10 k = 1, 2*( n-1 ), 2
         IF( z( k ).LT.zero ) THEN
            info = -( 200+k )
            CALL xerbla( 'SLASQ2', 2 )
            RETURN
         ELSE IF( z( k+1 ).LT.zero ) THEN
            info = -( 200+k+1 )
            CALL xerbla( 'SLASQ2', 2 )
            RETURN
         END IF
         d = d + z( k )
         e = e + z( k+1 )
         qmax = max( qmax, z( k ) )
         emin = min( emin, z( k+1 ) )
         zmax = max( qmax, zmax, z( k+1 ) )
   10 CONTINUE
*
*     The last odd entry has no even partner inside the loop above.
*
      IF( z( 2*n-1 ).LT.zero ) THEN
         info = -( 200+2*n-1 )
         CALL xerbla( 'SLASQ2', 2 )
         RETURN
      END IF
      d = d + z( 2*n-1 )
      qmax = max( qmax, z( 2*n-1 ) )
      zmax = max( qmax, zmax )
*
*     Check for diagonality.
*
*     All even entries were checked to be nonnegative, so a zero sum
*     means each of them is zero.  Pack the odd entries into Z(1:N),
*     sort them in decreasing order and store their sum in Z(2*N-1).
*
      IF( e.EQ.zero ) THEN
         DO 20 k = 2, n
            z( k ) = z( 2*k-1 )
   20    CONTINUE
         CALL slasrt( 'D', n, z, iinfo )
         z( 2*n-1 ) = d
         RETURN
      END IF
*
      trace = d + e
*
*     Check for zero data.
*
      IF( trace.EQ.zero ) THEN
         z( 2*n-1 ) = zero
         RETURN
      END IF
*
*     Check whether the machine is IEEE conformable.
*
*     IEEE = ( ILAENV( 10, 'SLASQ2', 'N', 1, 2, 3, 4 ).EQ.1 )
*
*     [11/15/2008] The case IEEE=.TRUE. has a problem in single precision with
*     some of the test matrices of type 16. The double precision code is fine.
*
      ieee = .false.
*
*     Rearrange data for locality: Z=(q1,qq1,e1,ee1,q2,qq2,e2,ee2,...).
*
*     The loop runs from the top of the array downwards so that each
*     source entry Z(K), Z(K-1) is read before its slot is
*     overwritten.  The qq and ee slots are set to zero.
*
      DO 30 k = 2*n, 2, -2
         z( 2*k ) = zero
         z( 2*k-1 ) = z( k )
         z( 2*k-2 ) = zero
         z( 2*k-3 ) = z( k-1 )
   30 CONTINUE
*
      i0 = 1
      n0 = n
*
*     Reverse the qd-array, if warranted.
*
*     Done when the last q exceeds CBIAS times the first q.  The q
*     slots ( I4-3 ) and e slots ( I4-1 ) are swapped end for end.
*
      IF( cbias*z( 4*i0-3 ).LT.z( 4*n0-3 ) ) THEN
         ipn4 = 4*( i0+n0 )
         DO 40 i4 = 4*i0, 2*( i0+n0-1 ), 4
            temp = z( i4-3 )
            z( i4-3 ) = z( ipn4-i4-3 )
            z( ipn4-i4-3 ) = temp
            temp = z( i4-1 )
            z( i4-1 ) = z( ipn4-i4-5 )
            z( ipn4-i4-5 ) = temp
   40    CONTINUE
      END IF
*
*     Initial split checking via dqd and Li's test.
*
*     Two passes are made, one with PP = 0 and one with PP = 1.
*
      pp = 0
*
      DO 80 k = 1, 2
*
*        Backward sweep: an e entry that is negligible relative to
*        the running D is replaced by -ZERO.
*
         d = z( 4*n0+pp-3 )
         DO 50 i4 = 4*( n0-1 ) + pp, 4*i0 + pp, -4
            IF( z( i4-1 ).LE.tol2*d ) THEN
               z( i4-1 ) = -zero
               d = z( i4-3 )
            ELSE
               d = z( i4-3 )*( d / ( d+z( i4-1 ) ) )
            END IF
   50    CONTINUE
*
*        dqd maps Z to ZZ plus Li's test.
*
*        Forward sweep writing the other set of slots.  The middle
*        branch forms the ratio TEMP first and is taken only when the
*        SAFMIN comparisons hold; otherwise the quotient is formed in
*        a different order.
*
         emin = z( 4*i0+pp+1 )
         d = z( 4*i0+pp-3 )
         DO 60 i4 = 4*i0 + pp, 4*( n0-1 ) + pp, 4
            z( i4-2*pp-2 ) = d + z( i4-1 )
            IF( z( i4-1 ).LE.tol2*d ) THEN
               z( i4-1 ) = -zero
               z( i4-2*pp-2 ) = d
               z( i4-2*pp ) = zero
               d = z( i4+1 )
            ELSE IF( safmin*z( i4+1 ).LT.z( i4-2*pp-2 ) .AND.
     $               safmin*z( i4-2*pp-2 ).LT.z( i4+1 ) ) THEN
               temp = z( i4+1 ) / z( i4-2*pp-2 )
               z( i4-2*pp ) = z( i4-1 )*temp
               d = d*temp
            ELSE
               z( i4-2*pp ) = z( i4+1 )*( z( i4-1 ) / z( i4-2*pp-2 ) )
               d = z( i4+1 )*( d / z( i4-2*pp-2 ) )
            END IF
            emin = min( emin, z( i4-2*pp ) )
   60    CONTINUE
         z( 4*n0-pp-2 ) = d
*
*        Now find qmax.
*
         qmax = z( 4*i0-pp-2 )
         DO 70 i4 = 4*i0 - pp + 2, 4*n0 - pp - 2, 4
            qmax = max( qmax, z( i4 ) )
   70    CONTINUE
*
*        Prepare for the next iteration on K.
*
         pp = 1 - pp
   80 CONTINUE
*
*     Initialise variables to pass to SLASQ3.
*
      ttype = 0
      dmin1 = zero
      dmin2 = zero
      dn    = zero
      dn1   = zero
      dn2   = zero
      g     = zero
      tau   = zero
*
*     Counters reported in Z on exit; they are passed to SLASQ3.
*
      iter = 2
      nfail = 0
      ndiv = 2*( n0-i0 )
*
*     Outer loop: at most N+1 passes.  It is left through label 170
*     once N0 < 1; running out of passes gives INFO = 3.
*
      DO 160 iwhila = 1, n + 1
         IF( n0.LT.1 )
     $      GO TO 170
*
*        While array unfinished do
*
*        E(N0) holds the value of SIGMA when submatrix in I0:N0
*        splits from the rest of the array, but is negated.
*
         desig = zero
         IF( n0.EQ.n ) THEN
            sigma = zero
         ELSE
            sigma = -z( 4*n0-1 )
         END IF
         IF( sigma.LT.zero ) THEN
            info = 1
            RETURN
         END IF
*
*        Find last unreduced submatrix's top index I0, find QMAX and
*        EMIN. Find Gershgorin-type bound if Q's much greater than E's.
*
         emax = zero
         IF( n0.GT.i0 ) THEN
            emin = abs( z( 4*n0-5 ) )
         ELSE
            emin = zero
         END IF
         qmin = z( 4*n0-3 )
         qmax = qmin
*
*        Scan upwards from N0.  A nonpositive e entry ends the scan
*        (jump to 100 with the current I4); if none is found the loop
*        completes and I4 is set to 4, i.e. I0 = 1.
*
         DO 90 i4 = 4*n0, 8, -4
            IF( z( i4-5 ).LE.zero )
     $         GO TO 100
            IF( qmin.GE.four*emax ) THEN
               qmin = min( qmin, z( i4-3 ) )
               emax = max( emax, z( i4-5 ) )
            END IF
            qmax = max( qmax, z( i4-7 )+z( i4-5 ) )
            emin = min( emin, z( i4-5 ) )
   90    CONTINUE
         i4 = 4
*
  100    CONTINUE
         i0 = i4 / 4
         pp = 0
*
*        For segments of more than two indices, run the DEE
*        recurrence to locate its minimum (index KMIN).  If the
*        minimum lies close enough to the top of the segment and is
*        at most HALF*Z(4*N0-3), flip the segment end for end and
*        signal this to SLASQ3 with PP = 2.
*
         IF( n0-i0.GT.1 ) THEN
            dee = z( 4*i0-3 )
            deemin = dee
            kmin = i0
            DO 110 i4 = 4*i0+1, 4*n0-3, 4
               dee = z( i4 )*( dee /( dee+z( i4-2 ) ) )
               IF( dee.LE.deemin ) THEN
                  deemin = dee
                  kmin = ( i4+3 )/4
               END IF
  110       CONTINUE
            IF( (kmin-i0)*2.LT.n0-kmin .AND.
     $         deemin.LE.half*z(4*n0-3) ) THEN
               ipn4 = 4*( i0+n0 )
               pp = 2
               DO 120 i4 = 4*i0, 2*( i0+n0-1 ), 4
                  temp = z( i4-3 )
                  z( i4-3 ) = z( ipn4-i4-3 )
                  z( ipn4-i4-3 ) = temp
                  temp = z( i4-2 )
                  z( i4-2 ) = z( ipn4-i4-2 )
                  z( ipn4-i4-2 ) = temp
                  temp = z( i4-1 )
                  z( i4-1 ) = z( ipn4-i4-5 )
                  z( ipn4-i4-5 ) = temp
                  temp = z( i4 )
                  z( i4 ) = z( ipn4-i4-4 )
                  z( ipn4-i4-4 ) = temp
  120          CONTINUE
            END IF
         END IF
*
*        Put -(initial shift) into DMIN.
*
         dmin = -max( zero, qmin-two*sqrt( qmin )*sqrt( emax ) )
*
*        Now I0:N0 is unreduced.
*        PP = 0 for ping, PP = 1 for pong.
*        PP = 2 indicates that flipping was applied to the Z array
*               and that the tests for deflation upon entry in SLASQ3
*               should not be performed.
*
*        Inner loop: at most 100 SLASQ3 calls per index of the
*        segment.  It is left through label 150 once I0 > N0; running
*        out of iterations falls through to the INFO = 2 path.
*
         nbig = 100*( n0-i0+1 )
         DO 140 iwhilb = 1, nbig
            IF( i0.GT.n0 )
     $         GO TO 150
*
*           While submatrix unfinished take a good dqds step.
*
            CALL slasq3( i0, n0, z, pp, dmin, sigma, desig, qmax, nfail,
     $                   iter, ndiv, ieee, ttype, dmin1, dmin2, dn, dn1,
     $                   dn2, g, tau )
*
            pp = 1 - pp
*
*           When EMIN is very small check for splits.
*
*           Each split found is marked by storing -SIGMA in the e
*           slot; I0 is then moved just past the last split.
*
            IF( pp.EQ.0 .AND. n0-i0.GE.3 ) THEN
               IF( z( 4*n0 ).LE.tol2*qmax .OR.
     $             z( 4*n0-1 ).LE.tol2*sigma ) THEN
                  splt = i0 - 1
                  qmax = z( 4*i0-3 )
                  emin = z( 4*i0-1 )
                  oldemn = z( 4*i0 )
                  DO 130 i4 = 4*i0, 4*( n0-3 ), 4
                     IF( z( i4 ).LE.tol2*z( i4-3 ) .OR.
     $                   z( i4-1 ).LE.tol2*sigma ) THEN
                        z( i4-1 ) = -sigma
                        splt = i4 / 4
                        qmax = zero
                        emin = z( i4+3 )
                        oldemn = z( i4+4 )
                     ELSE
                        qmax = max( qmax, z( i4+1 ) )
                        emin = min( emin, z( i4-1 ) )
                        oldemn = min( oldemn, z( i4 ) )
                     END IF
  130             CONTINUE
                  z( 4*n0-1 ) = emin
                  z( 4*n0 ) = oldemn
                  i0 = splt + 1
               END IF
            END IF
*
  140    CONTINUE
*
         info = 2
*
*        Maximum number of iterations exceeded, restore the shift
*        SIGMA and place the new d's and e's in a qd array.
*        This might need to be done for several blocks
*
*        NOTE(review): the update below is indexed with I0 and N0,
*        while the "previous block" search further down advances I1
*        and N1 only.  As written, each return to label 145 revisits
*        I0:N0 with the new SIGMA - confirm this is intended.
*
         i1 = i0
         n1 = n0
 145     CONTINUE
         tempq = z( 4*i0-3 )
         z( 4*i0-3 ) = z( 4*i0-3 ) + sigma
         DO k = i0+1, n0
            tempe = z( 4*k-5 )
            z( 4*k-5 ) = z( 4*k-5 ) * (tempq / z( 4*k-7 ))
            tempq = z( 4*k-3 )
            z( 4*k-3 ) = z( 4*k-3 ) + sigma + tempe - z( 4*k-5 )
         END DO
*
*        Prepare to do this on the previous block if there is one
*
*        NOTE(review): Fortran does not guarantee short-circuit
*        evaluation of .AND., so Z(4*I1-5) may be referenced with
*        I1 = 1 (index -1) in the DO WHILE condition - confirm.
*
         IF( i1.GT.1 ) THEN
            n1 = i1-1
            DO WHILE( ( i1.GE.2 ) .AND. ( z(4*i1-5).GE.zero ) )
               i1 = i1 - 1
            END DO
            IF( i1.GE.1 ) THEN
               sigma = -z(4*n1-1)
               GO TO 145
            END IF
         END IF
 
*
*        Compress Z back to two entries per index: q's in the odd
*        slots, e's in the even slots.
*
         DO k = 1, n
            z( 2*k-1 ) = z( 4*k-3 )
*
*        Only the block 1..N0 is unfinished.  The rest of the e's
*        must be essentially zero, although sometimes other data
*        has been stored in them.
*
            IF( k.LT.n0 ) THEN
               z( 2*k ) = z( 4*k-1 )
            ELSE
               z( 2*k ) = 0
            END IF
         END DO
         RETURN
*
*        end IWHILB
*
  150    CONTINUE
*
  160 CONTINUE
*
*     The outer loop ran out of passes without N0 dropping below 1.
*
      info = 3
      RETURN
*
*     end IWHILA
*
  170 CONTINUE
*
*     Move q's to the front.
*
      DO 180 k = 2, n
         z( k ) = z( 4*k-3 )
  180 CONTINUE
*
*     Sort and compute sum of eigenvalues.
*
*     The sum is accumulated from Z(N) up to Z(1), i.e. from the
*     smallest sorted value to the largest.
*
      CALL slasrt( 'D', n, z, iinfo )
*
      e = zero
      DO 190 k = n, 1, -1
         e = e + z( k )
  190 CONTINUE
*
*     Store trace, sum(eigenvalues) and information on performance.
*
      z( 2*n+1 ) = trace
      z( 2*n+2 ) = e
      z( 2*n+3 ) = real( iter )
      z( 2*n+4 ) = real( ndiv ) / real( n**2 )
      z( 2*n+5 ) = hundrd*nfail / real( iter )
      RETURN
*
*     End of SLASQ2
*

◆ slasq3()

subroutine slasq3	(	integer	i0,
		integer	n0,
		real, dimension( * )	z,
		integer	pp,
		real	dmin,
		real	sigma,
		real	desig,
		real	qmax,
		integer	nfail,
		integer	iter,
		integer	ndiv,
		logical	ieee,
		integer	ttype,
		real	dmin1,
		real	dmin2,
		real	dn,
		real	dn1,
		real	dn2,
		real	g,
		real	tau )

SLASQ3 checks for deflation, computes a shift and calls dqds. Used by sbdsqr.

Download SLASQ3 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLASQ3 checks for deflation, computes a shift (TAU) and calls dqds.
!> In case of failure it changes shifts, and tries again until output
!> is positive.
!>

Parameters

[in]	I0	!> I0 is INTEGER !> First index. !>
[in,out]	N0	!> N0 is INTEGER !> Last index. !>
[in,out]	Z	!> Z is REAL array, dimension ( 4*N0 ) !> Z holds the qd array. !>
[in,out]	PP	!> PP is INTEGER !> PP=0 for ping, PP=1 for pong. !> PP=2 indicates that flipping was applied to the Z array !> and that the initial tests for deflation should not be !> performed. !>
[out]	DMIN	!> DMIN is REAL !> Minimum value of d. !>
[out]	SIGMA	!> SIGMA is REAL !> Sum of shifts used in current segment. !>
[in,out]	DESIG	!> DESIG is REAL !> Lower order part of SIGMA !>
[in]	QMAX	!> QMAX is REAL !> Maximum value of q. !>
[in,out]	NFAIL	!> NFAIL is INTEGER !> Increment NFAIL by 1 each time the shift was too big. !>
[in,out]	ITER	!> ITER is INTEGER !> Increment ITER by 1 for each iteration. !>
[in,out]	NDIV	!> NDIV is INTEGER !> Increment NDIV by 1 for each division. !>
[in]	IEEE	!> IEEE is LOGICAL !> Flag for IEEE or non IEEE arithmetic (passed to SLASQ5). !>
[in,out]	TTYPE	!> TTYPE is INTEGER !> Shift type. !>
[in,out]	DMIN1	!> DMIN1 is REAL !>
[in,out]	DMIN2	!> DMIN2 is REAL !>
[in,out]	DN	!> DN is REAL !>
[in,out]	DN1	!> DN1 is REAL !>
[in,out]	DN2	!> DN2 is REAL !>
[in,out]	G	!> G is REAL !>
[in,out]	TAU	!> TAU is REAL !> !> These are passed as arguments in order to save their values !> between calls to SLASQ3. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 179 of file slasq3.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of SLASQ3.  In order, the statements below
*    1. deflate one or two values at a time from the bottom of the
*       qd array Z, storing each with SIGMA added (labels 10-40);
*    2. optionally reverse the qd array (after label 50);
*    3. obtain a shift TAU from SLASQ4 and apply SLASQ5 with it,
*       picking a new TAU and retrying while DMIN is negative
*       (label 70);
*    4. fall back to SLASQ6 and TAU = 0 (label 80);
*    5. add TAU to SIGMA, with DESIG updated alongside (label 90).
*
*     .. Scalar Arguments ..
      LOGICAL            IEEE
      INTEGER            I0, ITER, N0, NDIV, NFAIL, PP
      REAL               DESIG, DMIN, DMIN1, DMIN2, DN, DN1, DN2, G,
     $                   QMAX, SIGMA, TAU
*     ..
*     .. Array Arguments ..
      REAL               Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     CBIAS is the factor used in the array-reversal test below.
      REAL               CBIAS
      parameter( cbias = 1.50e0 )
      REAL               ZERO, QURTR, HALF, ONE, TWO, HUNDRD
      parameter( zero = 0.0e0, qurtr = 0.250e0, half = 0.5e0,
     $                     one = 1.0e0, two = 2.0e0, hundrd = 100.0e0 )
*     ..
*     .. Local Scalars ..
*     TTYPE is documented as an [in,out] argument; its type is
*     declared here alongside the locals.
      INTEGER            IPN4, J4, N0IN, NN, TTYPE
      REAL               EPS, S, T, TEMP, TOL, TOL2
*     ..
*     .. External Subroutines ..
      EXTERNAL           slasq4, slasq5, slasq6
*     ..
*     .. External Function ..
      REAL               SLAMCH
      LOGICAL            SISNAN
      EXTERNAL           sisnan, slamch
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     Remember N0 on entry: it is compared with the current N0 in
*     the reversal test and is passed to SLASQ4.
*     TOL = 100*EPS and TOL2 = TOL**2 are the thresholds used in the
*     negligibility and convergence tests.
*
      n0in = n0
      eps = slamch( 'Precision' )
      tol = eps*hundrd
      tol2 = tol**2
*
*     Check for deflation.
*
   10 CONTINUE
*
*     Nothing left (N0 < I0): return.  One value left (N0 = I0):
*     deflate it at label 20.  Two values left (N0 = I0+1): handle
*     them as a pair at label 40.
*
      IF( n0.LT.i0 )
     $   RETURN
      IF( n0.EQ.i0 )
     $   GO TO 20
      nn = 4*n0 + pp
      IF( n0.EQ.( i0+1 ) )
     $   GO TO 40
*
*     Check whether E(N0-1) is negligible, 1 eigenvalue.
*     If both entries exceed their thresholds it is not negligible
*     and the two-value test at label 30 is tried instead.
*
      IF( z( nn-5 ).GT.tol2*( sigma+z( nn-3 ) ) .AND.
     $    z( nn-2*pp-4 ).GT.tol2*z( nn-7 ) )
     $   GO TO 30
*
   20 CONTINUE
*
*     Deflate one value: store it with SIGMA added, shrink N0 and
*     test again.
*
      z( 4*n0-3 ) = z( 4*n0+pp-3 ) + sigma
      n0 = n0 - 1
      GO TO 10
*
*     Check  whether E(N0-2) is negligible, 2 eigenvalues.
*
   30 CONTINUE
*
      IF( z( nn-9 ).GT.tol2*sigma .AND.
     $    z( nn-2*pp-8 ).GT.tol2*z( nn-11 ) )
     $   GO TO 50
*
   40 CONTINUE
*
*     Deflate two values.  First order the pair so that
*     Z(NN-7) >= Z(NN-3), then, unless Z(NN-5) is negligible relative
*     to Z(NN-3) or T is zero, update the pair in place.
*
      IF( z( nn-3 ).GT.z( nn-7 ) ) THEN
         s = z( nn-3 )
         z( nn-3 ) = z( nn-7 )
         z( nn-7 ) = s
      END IF
      t = half*( ( z( nn-7 )-z( nn-3 ) )+z( nn-5 ) )
      IF( z( nn-5 ).GT.z( nn-3 )*tol2.AND.t.NE.zero ) THEN
         s = z( nn-3 )*( z( nn-5 ) / t )
*        Two forms of the same correction S, selected by S <= T.
         IF( s.LE.t ) THEN
            s = z( nn-3 )*( z( nn-5 ) /
     $          ( t*( one+sqrt( one+s / t ) ) ) )
         ELSE
            s = z( nn-3 )*( z( nn-5 ) / ( t+sqrt( t )*sqrt( t+s ) ) )
         END IF
         t = z( nn-7 ) + ( s+z( nn-5 ) )
         z( nn-3 ) = z( nn-3 )*( z( nn-7 ) / t )
         z( nn-7 ) = t
      END IF
*     Store both values with SIGMA added and shrink N0 by two.
      z( 4*n0-7 ) = z( nn-7 ) + sigma
      z( 4*n0-3 ) = z( nn-3 ) + sigma
      n0 = n0 - 2
      GO TO 10
*
   50 CONTINUE
*     PP = 2 is mapped to 0 here.  NOTE(review): the meaning of the
*     value 2 is set by the caller and is not visible in this body.
      IF( pp.EQ.2 )
     $   pp = 0
*
*     Reverse the qd-array, if warranted.
*     Considered only when DMIN <= 0 or something was deflated in
*     this call (N0 < N0IN), and performed only when CBIAS times the
*     entry Z(4*I0+PP-3) is below the entry Z(4*N0+PP-3).
*
      IF( dmin.LE.zero .OR. n0.LT.n0in ) THEN
         IF( cbias*z( 4*i0+pp-3 ).LT.z( 4*n0+pp-3 ) ) THEN
            ipn4 = 4*( i0+n0 )
*           Swap groups of four entries from the two ends of the
*           active range, working towards the middle.
            DO 60 j4 = 4*i0, 2*( i0+n0-1 ), 4
               temp = z( j4-3 )
               z( j4-3 ) = z( ipn4-j4-3 )
               z( ipn4-j4-3 ) = temp
               temp = z( j4-2 )
               z( j4-2 ) = z( ipn4-j4-2 )
               z( ipn4-j4-2 ) = temp
               temp = z( j4-1 )
               z( j4-1 ) = z( ipn4-j4-5 )
               z( ipn4-j4-5 ) = temp
               temp = z( j4 )
               z( j4 ) = z( ipn4-j4-4 )
               z( ipn4-j4-4 ) = temp
   60       CONTINUE
*           Refresh the values kept at the end of the array, DMIN2
*           and QMAX so that they match the reversed array.
            IF( n0-i0.LE.4 ) THEN
               z( 4*n0+pp-1 ) = z( 4*i0+pp-1 )
               z( 4*n0-pp ) = z( 4*i0-pp )
            END IF
            dmin2 = min( dmin2, z( 4*n0+pp-1 ) )
            z( 4*n0+pp-1 ) = min( z( 4*n0+pp-1 ), z( 4*i0+pp-1 ),
     $                            z( 4*i0+pp+3 ) )
            z( 4*n0-pp ) = min( z( 4*n0-pp ), z( 4*i0-pp ),
     $                          z( 4*i0-pp+4 ) )
            qmax = max( qmax, z( 4*i0+pp-3 ), z( 4*i0+pp+1 ) )
*           DMIN is set to (minus) zero; SLASQ4 returns TAU = -DMIN
*           whenever DMIN <= 0.
            dmin = -zero
         END IF
      END IF
*
*     Choose a shift.
*
      CALL slasq4( i0, n0, z, pp, n0in, dmin, dmin1, dmin2, dn, dn1,
     $             dn2, tau, ttype, g )
*
*     Call dqds until DMIN > 0.
*
   70 CONTINUE
*
      CALL slasq5( i0, n0, z, pp, tau, sigma, dmin, dmin1, dmin2, dn,
     $             dn1, dn2, ieee, eps )
*
*     Bookkeeping: each SLASQ5 call counts as one iteration and
*     N0-I0+2 divisions.
*
      ndiv = ndiv + ( n0-i0+2 )
      iter = iter + 1
*
*     Check status.
*
      IF( dmin.GE.zero .AND. dmin1.GE.zero ) THEN
*
*        Success.
*
         GO TO 90
*
      ELSE IF( dmin.LT.zero .AND. dmin1.GT.zero .AND.
     $         z( 4*( n0-1 )-pp ).LT.tol*( sigma+dn1 ) .AND.
     $         abs( dn ).LT.tol*sigma ) THEN
*
*        Convergence hidden by negative DN.
*        Accept the step: zero the entry Z(4*(N0-1)-PP+2) and DMIN.
*
         z( 4*( n0-1 )-pp+2 ) = zero
         dmin = zero
         GO TO 90
      ELSE IF( dmin.LT.zero ) THEN
*
*        TAU too big. Select new TAU and try again.
*        Each retry lowers TTYPE by 11 or 12, which is what the
*        TTYPE < -22 test below detects.
*
         nfail = nfail + 1
         IF( ttype.LT.-22 ) THEN
*
*           Failed twice. Play it safe.
*
            tau = zero
         ELSE IF( dmin1.GT.zero ) THEN
*
*           Late failure. Gives excellent shift.
*
            tau = ( tau+dmin )*( one-two*eps )
            ttype = ttype - 11
         ELSE
*
*           Early failure. Divide by 4.
*
            tau = qurtr*tau
            ttype = ttype - 12
         END IF
         GO TO 70
      ELSE IF( sisnan( dmin ) ) THEN
*
*        NaN.
*        Retry once with a zero shift; if the shift was already zero
*        go to the SLASQ6 fallback instead.
*
         IF( tau.EQ.zero ) THEN
            GO TO 80
         ELSE
            tau = zero
            GO TO 70
         END IF
      ELSE
*
*        Possible underflow. Play it safe.
*
         GO TO 80
      END IF
*
*     Risk of underflow.
*     Redo the step with SLASQ6 (no shift argument) and record
*     TAU = 0; the counters are advanced as for SLASQ5.
*
   80 CONTINUE
      CALL slasq6( i0, n0, z, pp, dmin, dmin1, dmin2, dn, dn1, dn2 )
      ndiv = ndiv + ( n0-i0+2 )
      iter = iter + 1
      tau = zero
*
   90 CONTINUE
*
*     Accumulate the shift: SIGMA <- SIGMA + TAU.  In both branches
*     DESIG is adjusted by the difference between the rounded sum T
*     and its operands, i.e. it carries what the addition dropped.
*
      IF( tau.LT.sigma ) THEN
         desig = desig + tau
         t = sigma + desig
         desig = desig - ( t-sigma )
      ELSE
         t = sigma + tau
         desig = sigma - ( t-tau ) + desig
      END IF
      sigma = t
*
      RETURN
*
*     End of SLASQ3
*

◆ slasq4()

subroutine slasq4	(	integer	i0,
		integer	n0,
		real, dimension( * )	z,
		integer	pp,
		integer	n0in,
		real	dmin,
		real	dmin1,
		real	dmin2,
		real	dn,
		real	dn1,
		real	dn2,
		real	tau,
		integer	ttype,
		real	g )

SLASQ4 computes an approximation to the smallest eigenvalue using values of d from the previous transform. Used by sbdsqr.

Download SLASQ4 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLASQ4 computes an approximation TAU to the smallest eigenvalue
!> using values of d from the previous transform.
!>

Parameters

[in]	I0	!> I0 is INTEGER !> First index. !>
[in]	N0	!> N0 is INTEGER !> Last index. !>
[in]	Z	!> Z is REAL array, dimension ( 4*N0 ) !> Z holds the qd array. !>
[in]	PP	!> PP is INTEGER !> PP=0 for ping, PP=1 for pong. !>
[in]	N0IN	!> N0IN is INTEGER !> The value of N0 at start of EIGTEST. !>
[in]	DMIN	!> DMIN is REAL !> Minimum value of d. !>
[in]	DMIN1	!> DMIN1 is REAL !> Minimum value of d, excluding D( N0 ). !>
[in]	DMIN2	!> DMIN2 is REAL !> Minimum value of d, excluding D( N0 ) and D( N0-1 ). !>
[in]	DN	!> DN is REAL !> d(N) !>
[in]	DN1	!> DN1 is REAL !> d(N-1) !>
[in]	DN2	!> DN2 is REAL !> d(N-2) !>
[out]	TAU	!> TAU is REAL !> This is the shift. !>
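[in,out]	TTYPE	!> TTYPE is INTEGER !> Shift type. On entry, the value left by the previous call (it is examined in Case 6); on exit, the type of the shift chosen. !>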
[in,out]	G	!> G is REAL !> G is passed as an argument in order to save its value between !> calls to SLASQ4. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  CNST1 = 9/16
!>

Definition at line 149 of file slasq4.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of SLASQ4.  A candidate shift S is selected by one of the
*  numbered cases below and copied to TAU by the final assignment;
*  TTYPE is set to minus the case number (-1 when DMIN <= 0).
*  The case is chosen from how many values were deflated since the
*  start (N0IN - N0 = 0, 1, 2 or more) and from which of DN, DN1,
*  DN2 equals the corresponding minimum.
*
*  NOTE(review): the RETURN statements inside Cases 4, 5, 7 and 10
*  leave before TAU = S is executed, so on those paths TTYPE is
*  updated but TAU keeps whatever value it had on entry.
*
*     .. Scalar Arguments ..
      INTEGER            I0, N0, N0IN, PP, TTYPE
      REAL               DMIN, DMIN1, DMIN2, DN, DN1, DN2, G, TAU
*     ..
*     .. Array Arguments ..
      REAL               Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     CNST1 is the bound tested against A2 before the Rayleigh
*     quotient formula is used; CNST2 and CNST3 are safety factors
*     slightly above one applied inside the shift formulas.
      REAL               CNST1, CNST2, CNST3
      parameter( cnst1 = 0.5630e0, cnst2 = 1.010e0,
     $                   cnst3 = 1.050e0 )
      REAL               QURTR, THIRD, HALF, ZERO, ONE, TWO, HUNDRD
      parameter( qurtr = 0.250e0, third = 0.3330e0,
     $                   half = 0.50e0, zero = 0.0e0, one = 1.0e0,
     $                   two = 2.0e0, hundrd = 100.0e0 )
*     ..
*     .. Local Scalars ..
      INTEGER            I4, NN, NP
      REAL               A2, B1, B2, GAM, GAP1, GAP2, S
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     A negative DMIN forces the shift to take that absolute value
*     TTYPE records the type of shift.
*
      IF( dmin.LE.zero ) THEN
         tau = -dmin
         ttype = -1
         RETURN
      END IF
*
      nn = 4*n0 + pp
      IF( n0in.EQ.n0 ) THEN
*
*        No eigenvalues deflated.
*
         IF( dmin.EQ.dn .OR. dmin.EQ.dn1 ) THEN
*
            b1 = sqrt( z( nn-3 ) )*sqrt( z( nn-5 ) )
            b2 = sqrt( z( nn-7 ) )*sqrt( z( nn-9 ) )
            a2 = z( nn-7 ) + z( nn-5 )
*
*           Cases 2 and 3.
*
            IF( dmin.EQ.dn .AND. dmin1.EQ.dn1 ) THEN
               gap2 = dmin2 - a2 - dmin2*qurtr
               IF( gap2.GT.zero .AND. gap2.GT.b2 ) THEN
                  gap1 = a2 - dn - ( b2 / gap2 )*b2
               ELSE
                  gap1 = a2 - dn - ( b1+b2 )
               END IF
               IF( gap1.GT.zero .AND. gap1.GT.b1 ) THEN
*                 Case 2: shift is at least HALF*DMIN.
                  s = max( dn-( b1 / gap1 )*b1, half*dmin )
                  ttype = -2
               ELSE
*                 Case 3: shift is at least THIRD*DMIN.
                  s = zero
                  IF( dn.GT.b1 )
     $               s = dn - b1
                  IF( a2.GT.( b1+b2 ) )
     $               s = min( s, a2-( b1+b2 ) )
                  s = max( s, third*dmin )
                  ttype = -3
               END IF
            ELSE
*
*              Case 4.
*              S starts as QURTR*DMIN and is replaced further down
*              only if A2 < CNST1.  Each RETURN in this case exits
*              without assigning TAU.
*
               ttype = -4
               s = qurtr*dmin
               IF( dmin.EQ.dn ) THEN
                  gam = dn
                  a2 = zero
                  IF( z( nn-5 ) .GT. z( nn-7 ) )
     $               RETURN
                  b2 = z( nn-5 ) / z( nn-7 )
                  np = nn - 9
               ELSE
                  np = nn - 2*pp
                  gam = dn1
                  IF( z( np-4 ) .GT. z( np-2 ) )
     $               RETURN
                  a2 = z( np-4 ) / z( np-2 )
                  IF( z( nn-9 ) .GT. z( nn-11 ) )
     $               RETURN
                  b2 = z( nn-9 ) / z( nn-11 )
                  np = nn - 13
               END IF
*
*              Approximate contribution to norm squared from I < NN-1.
*              The loop walks towards I0 accumulating the running
*              product B2 into A2; it stops when B2 is zero, when the
*              latest terms are below A2/100, or when A2 > CNST1.
*
               a2 = a2 + b2
               DO 10 i4 = np, 4*i0 - 1 + pp, -4
                  IF( b2.EQ.zero )
     $               GO TO 20
                  b1 = b2
                  IF( z( i4 ) .GT. z( i4-2 ) )
     $               RETURN
                  b2 = b2*( z( i4 ) / z( i4-2 ) )
                  a2 = a2 + b2
                  IF( hundrd*max( b2, b1 ).LT.a2 .OR. cnst1.LT.a2 )
     $               GO TO 20
   10          CONTINUE
   20          CONTINUE
               a2 = cnst3*a2
*
*              Rayleigh quotient residual bound.
*
               IF( a2.LT.cnst1 )
     $            s = gam*( one-sqrt( a2 ) ) / ( one+a2 )
            END IF
         ELSE IF( dmin.EQ.dn2 ) THEN
*
*           Case 5.
*           Same scheme as Case 4 with GAM = DN2.  Each RETURN in
*           this case exits without assigning TAU.
*
            ttype = -5
            s = qurtr*dmin
*
*           Compute contribution to norm squared from I > NN-2.
*
            np = nn - 2*pp
            b1 = z( np-2 )
            b2 = z( np-6 )
            gam = dn2
            IF( z( np-8 ).GT.b2 .OR. z( np-4 ).GT.b1 )
     $         RETURN
            a2 = ( z( np-8 ) / b2 )*( one+z( np-4 ) / b1 )
*
*           Approximate contribution to norm squared from I < NN-2.
*
            IF( n0-i0.GT.2 ) THEN
               b2 = z( nn-13 ) / z( nn-15 )
               a2 = a2 + b2
               DO 30 i4 = nn - 17, 4*i0 - 1 + pp, -4
                  IF( b2.EQ.zero )
     $               GO TO 40
                  b1 = b2
                  IF( z( i4 ) .GT. z( i4-2 ) )
     $               RETURN
                  b2 = b2*( z( i4 ) / z( i4-2 ) )
                  a2 = a2 + b2
                  IF( hundrd*max( b2, b1 ).LT.a2 .OR. cnst1.LT.a2 )
     $               GO TO 40
   30          CONTINUE
   40          CONTINUE
               a2 = cnst3*a2
            END IF
*
            IF( a2.LT.cnst1 )
     $         s = gam*( one-sqrt( a2 ) ) / ( one+a2 )
         ELSE
*
*           Case 6, no information to guide us.
*           The fraction G of DMIN depends on the TTYPE value passed
*           in: -6 moves G a third of the way towards one, -18 sets
*           it to QURTR*THIRD, anything else sets it to QURTR.
*
            IF( ttype.EQ.-6 ) THEN
               g = g + third*( one-g )
            ELSE IF( ttype.EQ.-18 ) THEN
               g = qurtr*third
            ELSE
               g = qurtr
            END IF
            s = g*dmin
            ttype = -6
         END IF
*
      ELSE IF( n0in.EQ.( n0+1 ) ) THEN
*
*        One eigenvalue just deflated. Use DMIN1, DN1 for DMIN and DN.
*
         IF( dmin1.EQ.dn1 .AND. dmin2.EQ.dn2 ) THEN
*
*           Cases 7 and 8.
*           S starts as THIRD*DMIN1 and can only be increased by the
*           MAX calls below.  Each RETURN here exits without
*           assigning TAU.
*
            ttype = -7
            s = third*dmin1
            IF( z( nn-5 ).GT.z( nn-7 ) )
     $         RETURN
            b1 = z( nn-5 ) / z( nn-7 )
            b2 = b1
            IF( b2.EQ.zero )
     $         GO TO 60
            DO 50 i4 = 4*n0 - 9 + pp, 4*i0 - 1 + pp, -4
               a2 = b1
               IF( z( i4 ).GT.z( i4-2 ) )
     $            RETURN
               b1 = b1*( z( i4 ) / z( i4-2 ) )
               b2 = b2 + b1
               IF( hundrd*max( b1, a2 ).LT.b2 )
     $            GO TO 60
   50       CONTINUE
   60       CONTINUE
            b2 = sqrt( cnst3*b2 )
            a2 = dmin1 / ( one+b2**2 )
            gap2 = half*dmin2 - a2
            IF( gap2.GT.zero .AND. gap2.GT.b2*a2 ) THEN
               s = max( s, a2*( one-cnst2*a2*( b2 / gap2 )*b2 ) )
            ELSE
*              Case 8: the gap estimate is not usable.
               s = max( s, a2*( one-cnst2*b2 ) )
               ttype = -8
            END IF
         ELSE
*
*           Case 9.
*
            s = qurtr*dmin1
            IF( dmin1.EQ.dn1 )
     $         s = half*dmin1
            ttype = -9
         END IF
*
      ELSE IF( n0in.EQ.( n0+2 ) ) THEN
*
*        Two eigenvalues deflated. Use DMIN2, DN2 for DMIN and DN.
*
*        Cases 10 and 11.
*
         IF( dmin2.EQ.dn2 .AND. two*z( nn-5 ).LT.z( nn-7 ) ) THEN
*           Case 10.  Each RETURN here exits without assigning TAU.
            ttype = -10
            s = third*dmin2
            IF( z( nn-5 ).GT.z( nn-7 ) )
     $         RETURN
            b1 = z( nn-5 ) / z( nn-7 )
            b2 = b1
            IF( b2.EQ.zero )
     $         GO TO 80
            DO 70 i4 = 4*n0 - 9 + pp, 4*i0 - 1 + pp, -4
               IF( z( i4 ).GT.z( i4-2 ) )
     $            RETURN
               b1 = b1*( z( i4 ) / z( i4-2 ) )
               b2 = b2 + b1
               IF( hundrd*b1.LT.b2 )
     $            GO TO 80
   70       CONTINUE
   80       CONTINUE
            b2 = sqrt( cnst3*b2 )
            a2 = dmin2 / ( one+b2**2 )
            gap2 = z( nn-7 ) + z( nn-9 ) -
     $             sqrt( z( nn-11 ) )*sqrt( z( nn-9 ) ) - a2
            IF( gap2.GT.zero .AND. gap2.GT.b2*a2 ) THEN
               s = max( s, a2*( one-cnst2*a2*( b2 / gap2 )*b2 ) )
            ELSE
               s = max( s, a2*( one-cnst2*b2 ) )
            END IF
         ELSE
*           Case 11.
            s = qurtr*dmin2
            ttype = -11
         END IF
      ELSE IF( n0in.GT.( n0+2 ) ) THEN
*
*        Case 12, more than two eigenvalues deflated. No information.
*
         s = zero
         ttype = -12
      END IF
*
*     NOTE(review): if N0IN < N0 none of the branches above runs and
*     S has not been assigned at this point; presumably callers never
*     pass such values - confirm.
*
      tau = s
      RETURN
*
*     End of SLASQ4
*

◆ slasq5()

subroutine slasq5	(	integer	i0,
		integer	n0,
		real, dimension( * )	z,
		integer	pp,
		real	tau,
		real	sigma,
		real	dmin,
		real	dmin1,
		real	dmin2,
		real	dn,
		real	dnm1,
		real	dnm2,
		logical	ieee,
		real	eps )

SLASQ5 computes one dqds transform in ping-pong form. Used by sbdsqr and sstegr.

Download SLASQ5 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLASQ5 computes one dqds transform in ping-pong form, one
!> version for IEEE machines another for non IEEE machines.
!>

Parameters

[in]	I0	!> I0 is INTEGER !> First index. !>
[in]	N0	!> N0 is INTEGER !> Last index. !>
[in,out]	Z	!> Z is REAL array, dimension ( 4*N ) !> Z holds the qd array; the transformed entries are written back into it. EMIN is stored in Z(4*N0-PP) to avoid !> an extra argument. !>
[in]	PP	!> PP is INTEGER !> PP=0 for ping, PP=1 for pong. !>
[in,out]	TAU	!> TAU is REAL !> This is the shift. It is reset to zero if it is smaller than EPS*(SIGMA+TAU)/2. !>
[in]	SIGMA	!> SIGMA is REAL !> This is the accumulated shift up to this step. !>
[out]	DMIN	!> DMIN is REAL !> Minimum value of d. !>
[out]	DMIN1	!> DMIN1 is REAL !> Minimum value of d, excluding D( N0 ). !>
[out]	DMIN2	!> DMIN2 is REAL !> Minimum value of d, excluding D( N0 ) and D( N0-1 ). !>
[out]	DN	!> DN is REAL !> d(N0), the last value of d. !>
[out]	DNM1	!> DNM1 is REAL !> d(N0-1). !>
[out]	DNM2	!> DNM2 is REAL !> d(N0-2). !>
[in]	IEEE	!> IEEE is LOGICAL !> Flag for IEEE or non IEEE arithmetic. !>
[in]	EPS	!> EPS is REAL !> This is the value of epsilon used. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 142 of file slasq5.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of SLASQ5.  One sweep over Z from index I0 to N0 with shift
*  TAU.  The same recurrence appears four times, selected by
*    - TAU .NE. 0  versus  TAU .EQ. 0 (the latter also replaces any
*      D below DTHRESH by zero inside the main loop), and
*    - IEEE = .TRUE. (no sign tests inside the loop) versus
*      IEEE = .FALSE. (RETURN as soon as a negative D is seen).
*  With PP = 0 the loops read Z(J4-1), Z(J4+1) and write Z(J4-2),
*  Z(J4); with PP = 1 they read Z(J4), Z(J4+2) and write Z(J4-3),
*  Z(J4-1).
*
*  On the early RETURNs of the non-IEEE code the negative value has
*  already been folded into DMIN, and the two stores at the end of
*  the routine (DN and EMIN into Z) are skipped.
*
*     .. Scalar Arguments ..
      LOGICAL            IEEE
      INTEGER            I0, N0, PP
      REAL               DMIN, DMIN1, DMIN2, DN, DNM1, DNM2, TAU,
     $                   SIGMA, EPS
*     ..
*     .. Array Arguments ..
      REAL               Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameter ..
      REAL               ZERO, HALF
      parameter( zero = 0.0e0, half = 0.5 )
*     ..
*     .. Local Scalars ..
      INTEGER            J4, J4P2
      REAL               D, EMIN, TEMP, DTHRESH
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          min
*     ..
*     .. Executable Statements ..
*
*     Fewer than three indices in I0..N0: nothing is done and no
*     output argument is assigned.
*
      IF( ( n0-i0-1 ).LE.0 )
     $   RETURN
*
*     A shift below half of DTHRESH = EPS*(SIGMA+TAU) is replaced by
*     zero; note that this modifies the argument TAU.
*
      dthresh = eps*(sigma+tau)
      IF( tau.LT.dthresh*half ) tau = zero
      IF( tau.NE.zero ) THEN
*        Start-up: D from the first entry, EMIN from the entry four
*        places on; DMIN1 starts at minus the first entry.
         j4 = 4*i0 + pp - 3
         emin = z( j4+4 )
         d = z( j4 ) - tau
         dmin = d
         dmin1 = -z( j4 )
*
         IF( ieee ) THEN
*
*     Code for IEEE arithmetic.
*
            IF( pp.EQ.0 ) THEN
               DO 10 j4 = 4*i0, 4*( n0-3 ), 4
                  z( j4-2 ) = d + z( j4-1 )
                  temp = z( j4+1 ) / z( j4-2 )
                  d = d*temp - tau
                  dmin = min( dmin, d )
                  z( j4 ) = z( j4-1 )*temp
                  emin = min( z( j4 ), emin )
 10            CONTINUE
            ELSE
               DO 20 j4 = 4*i0, 4*( n0-3 ), 4
                  z( j4-3 ) = d + z( j4 )
                  temp = z( j4+2 ) / z( j4-3 )
                  d = d*temp - tau
                  dmin = min( dmin, d )
                  z( j4-1 ) = z( j4 )*temp
                  emin = min( z( j4-1 ), emin )
 20            CONTINUE
            END IF
*
*     Unroll last two steps.
*     They are kept out of the loop so that DNM2/DMIN2 and
*     DNM1/DMIN1 can be recorded on the way to DN/DMIN.
*
            dnm2 = d
            dmin2 = dmin
            j4 = 4*( n0-2 ) - pp
            j4p2 = j4 + 2*pp - 1
            z( j4-2 ) = dnm2 + z( j4p2 )
            z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
            dnm1 = z( j4p2+2 )*( dnm2 / z( j4-2 ) ) - tau
            dmin = min( dmin, dnm1 )
*
            dmin1 = dmin
            j4 = j4 + 4
            j4p2 = j4 + 2*pp - 1
            z( j4-2 ) = dnm1 + z( j4p2 )
            z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
            dn = z( j4p2+2 )*( dnm1 / z( j4-2 ) ) - tau
            dmin = min( dmin, dn )
*
         ELSE
*
*     Code for non IEEE arithmetic.
*     Same recurrence, but a negative D stops the sweep at once.
*
            IF( pp.EQ.0 ) THEN
               DO 30 j4 = 4*i0, 4*( n0-3 ), 4
                  z( j4-2 ) = d + z( j4-1 )
                  IF( d.LT.zero ) THEN
                     RETURN
                  ELSE
                     z( j4 ) = z( j4+1 )*( z( j4-1 ) / z( j4-2 ) )
                     d = z( j4+1 )*( d / z( j4-2 ) ) - tau
                  END IF
                  dmin = min( dmin, d )
                  emin = min( emin, z( j4 ) )
 30            CONTINUE
            ELSE
               DO 40 j4 = 4*i0, 4*( n0-3 ), 4
                  z( j4-3 ) = d + z( j4 )
                  IF( d.LT.zero ) THEN
                     RETURN
                  ELSE
                     z( j4-1 ) = z( j4+2 )*( z( j4 ) / z( j4-3 ) )
                     d = z( j4+2 )*( d / z( j4-3 ) ) - tau
                  END IF
                  dmin = min( dmin, d )
                  emin = min( emin, z( j4-1 ) )
 40            CONTINUE
            END IF
*
*     Unroll last two steps.
*
            dnm2 = d
            dmin2 = dmin
            j4 = 4*( n0-2 ) - pp
            j4p2 = j4 + 2*pp - 1
            z( j4-2 ) = dnm2 + z( j4p2 )
            IF( dnm2.LT.zero ) THEN
               RETURN
            ELSE
               z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
               dnm1 = z( j4p2+2 )*( dnm2 / z( j4-2 ) ) - tau
            END IF
            dmin = min( dmin, dnm1 )
*
            dmin1 = dmin
            j4 = j4 + 4
            j4p2 = j4 + 2*pp - 1
            z( j4-2 ) = dnm1 + z( j4p2 )
            IF( dnm1.LT.zero ) THEN
               RETURN
            ELSE
               z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
               dn = z( j4p2+2 )*( dnm1 / z( j4-2 ) ) - tau
            END IF
            dmin = min( dmin, dn )
*
         END IF
*
      ELSE
*     This is the version that sets d's to zero if they are small enough
*     (TAU is zero here; inside the main loops any D below DTHRESH is
*     replaced by zero.  The unrolled last two steps do not apply
*     that threshold.)
         j4 = 4*i0 + pp - 3
         emin = z( j4+4 )
         d = z( j4 ) - tau
         dmin = d
         dmin1 = -z( j4 )
         IF( ieee ) THEN
*
*     Code for IEEE arithmetic.
*
            IF( pp.EQ.0 ) THEN
               DO 50 j4 = 4*i0, 4*( n0-3 ), 4
                  z( j4-2 ) = d + z( j4-1 )
                  temp = z( j4+1 ) / z( j4-2 )
                  d = d*temp - tau
                  IF( d.LT.dthresh ) d = zero
                  dmin = min( dmin, d )
                  z( j4 ) = z( j4-1 )*temp
                  emin = min( z( j4 ), emin )
 50            CONTINUE
            ELSE
               DO 60 j4 = 4*i0, 4*( n0-3 ), 4
                  z( j4-3 ) = d + z( j4 )
                  temp = z( j4+2 ) / z( j4-3 )
                  d = d*temp - tau
                  IF( d.LT.dthresh ) d = zero
                  dmin = min( dmin, d )
                  z( j4-1 ) = z( j4 )*temp
                  emin = min( z( j4-1 ), emin )
 60            CONTINUE
            END IF
*
*     Unroll last two steps.
*
            dnm2 = d
            dmin2 = dmin
            j4 = 4*( n0-2 ) - pp
            j4p2 = j4 + 2*pp - 1
            z( j4-2 ) = dnm2 + z( j4p2 )
            z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
            dnm1 = z( j4p2+2 )*( dnm2 / z( j4-2 ) ) - tau
            dmin = min( dmin, dnm1 )
*
            dmin1 = dmin
            j4 = j4 + 4
            j4p2 = j4 + 2*pp - 1
            z( j4-2 ) = dnm1 + z( j4p2 )
            z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
            dn = z( j4p2+2 )*( dnm1 / z( j4-2 ) ) - tau
            dmin = min( dmin, dn )
*
         ELSE
*
*     Code for non IEEE arithmetic.
*
            IF( pp.EQ.0 ) THEN
               DO 70 j4 = 4*i0, 4*( n0-3 ), 4
                  z( j4-2 ) = d + z( j4-1 )
                  IF( d.LT.zero ) THEN
                     RETURN
                  ELSE
                     z( j4 ) = z( j4+1 )*( z( j4-1 ) / z( j4-2 ) )
                     d = z( j4+1 )*( d / z( j4-2 ) ) - tau
                  END IF
                  IF( d.LT.dthresh ) d = zero
                  dmin = min( dmin, d )
                  emin = min( emin, z( j4 ) )
 70            CONTINUE
            ELSE
               DO 80 j4 = 4*i0, 4*( n0-3 ), 4
                  z( j4-3 ) = d + z( j4 )
                  IF( d.LT.zero ) THEN
                     RETURN
                  ELSE
                     z( j4-1 ) = z( j4+2 )*( z( j4 ) / z( j4-3 ) )
                     d = z( j4+2 )*( d / z( j4-3 ) ) - tau
                  END IF
                  IF( d.LT.dthresh ) d = zero
                  dmin = min( dmin, d )
                  emin = min( emin, z( j4-1 ) )
 80            CONTINUE
            END IF
*
*     Unroll last two steps.
*
            dnm2 = d
            dmin2 = dmin
            j4 = 4*( n0-2 ) - pp
            j4p2 = j4 + 2*pp - 1
            z( j4-2 ) = dnm2 + z( j4p2 )
            IF( dnm2.LT.zero ) THEN
               RETURN
            ELSE
               z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
               dnm1 = z( j4p2+2 )*( dnm2 / z( j4-2 ) ) - tau
            END IF
            dmin = min( dmin, dnm1 )
*
            dmin1 = dmin
            j4 = j4 + 4
            j4p2 = j4 + 2*pp - 1
            z( j4-2 ) = dnm1 + z( j4p2 )
            IF( dnm1.LT.zero ) THEN
               RETURN
            ELSE
               z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
               dn = z( j4p2+2 )*( dnm1 / z( j4-2 ) ) - tau
            END IF
            dmin = min( dmin, dn )
*
         END IF
*
      END IF
*
*     Common exit of all four variants.  J4 is 4*( N0-1 ) - PP here,
*     so DN goes to Z( 4*N0-PP-2 ); EMIN goes to Z( 4*N0-PP ).
*
      z( j4+2 ) = dn
      z( 4*n0-pp ) = emin
      RETURN
*
*     End of SLASQ5
*

◆ slasq6()

subroutine slasq6	(	integer	i0,
		integer	n0,
		real, dimension( * )	z,
		integer	pp,
		real	dmin,
		real	dmin1,
		real	dmin2,
		real	dn,
		real	dnm1,
		real	dnm2 )

SLASQ6 computes one dqd transform in ping-pong form. Used by sbdsqr and sstegr.

Download SLASQ6 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLASQ6 computes one dqd (shift equal to zero) transform in
!> ping-pong form, with protection against underflow and overflow.
!>

Parameters

[in]	I0	!> I0 is INTEGER !> First index. !>
[in]	N0	!> N0 is INTEGER !> Last index. !>
[in,out]	Z	!> Z is REAL array, dimension ( 4*N ) !> Z holds the qd array; the transformed entries are written back into it. EMIN is stored in Z(4*N0-PP) to avoid !> an extra argument. !>
[in]	PP	!> PP is INTEGER !> PP=0 for ping, PP=1 for pong. !>
[out]	DMIN	!> DMIN is REAL !> Minimum value of d. !>
[out]	DMIN1	!> DMIN1 is REAL !> Minimum value of d, excluding D( N0 ). !>
[out]	DMIN2	!> DMIN2 is REAL !> Minimum value of d, excluding D( N0 ) and D( N0-1 ). !>
[out]	DN	!> DN is REAL !> d(N0), the last value of d. !>
[out]	DNM1	!> DNM1 is REAL !> d(N0-1). !>
[out]	DNM2	!> DNM2 is REAL !> d(N0-2). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 117 of file slasq6.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of SLASQ6.  One sweep over Z from index I0 to N0 with no
*  shift.  Every step has three alternatives:
*    - the newly formed sum is exactly zero: the companion entry is
*      set to zero, D restarts from the next input entry, DMIN is
*      reset to that D and EMIN to zero;
*    - numerator and denominator are within a factor SAFMIN of each
*      other: the quotient TEMP is formed once and reused;
*    - otherwise: each product is formed with the division done
*      inside it, so the quotient TEMP is never formed on its own.
*  With PP = 0 the loop reads Z(J4-1), Z(J4+1) and writes Z(J4-2),
*  Z(J4); with PP = 1 it reads Z(J4), Z(J4+2) and writes Z(J4-3),
*  Z(J4-1).
*
*     .. Scalar Arguments ..
      INTEGER            I0, N0, PP
      REAL               DMIN, DMIN1, DMIN2, DN, DNM1, DNM2
*     ..
*     .. Array Arguments ..
      REAL               Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameter ..
      REAL               ZERO
      parameter( zero = 0.0e0 )
*     ..
*     .. Local Scalars ..
      INTEGER            J4, J4P2
      REAL               D, EMIN, SAFMIN, TEMP
*     ..
*     .. External Function ..
      REAL               SLAMCH
      EXTERNAL           slamch
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          min
*     ..
*     .. Executable Statements ..
*
*     Fewer than three indices in I0..N0: nothing is done and no
*     output argument is assigned.
*
      IF( ( n0-i0-1 ).LE.0 )
     $   RETURN
*
*     Start-up: D and DMIN from the first entry, EMIN from the entry
*     four places on.
*
      safmin = slamch( 'Safe minimum' )
      j4 = 4*i0 + pp - 3
      emin = z( j4+4 )
      d = z( j4 )
      dmin = d
*
      IF( pp.EQ.0 ) THEN
         DO 10 j4 = 4*i0, 4*( n0-3 ), 4
            z( j4-2 ) = d + z( j4-1 )
            IF( z( j4-2 ).EQ.zero ) THEN
*              Exact zero sum: restart D, DMIN and EMIN.
               z( j4 ) = zero
               d = z( j4+1 )
               dmin = d
               emin = zero
            ELSE IF( safmin*z( j4+1 ).LT.z( j4-2 ) .AND.
     $               safmin*z( j4-2 ).LT.z( j4+1 ) ) THEN
*              Quotient is safe to form once and reuse.
               temp = z( j4+1 ) / z( j4-2 )
               z( j4 ) = z( j4-1 )*temp
               d = d*temp
            ELSE
*              Guarded form: divide inside each product.
               z( j4 ) = z( j4+1 )*( z( j4-1 ) / z( j4-2 ) )
               d = z( j4+1 )*( d / z( j4-2 ) )
            END IF
            dmin = min( dmin, d )
            emin = min( emin, z( j4 ) )
   10    CONTINUE
      ELSE
         DO 20 j4 = 4*i0, 4*( n0-3 ), 4
            z( j4-3 ) = d + z( j4 )
            IF( z( j4-3 ).EQ.zero ) THEN
*              Exact zero sum: restart D, DMIN and EMIN.
               z( j4-1 ) = zero
               d = z( j4+2 )
               dmin = d
               emin = zero
            ELSE IF( safmin*z( j4+2 ).LT.z( j4-3 ) .AND.
     $               safmin*z( j4-3 ).LT.z( j4+2 ) ) THEN
*              Quotient is safe to form once and reuse.
               temp = z( j4+2 ) / z( j4-3 )
               z( j4-1 ) = z( j4 )*temp
               d = d*temp
            ELSE
*              Guarded form: divide inside each product.
               z( j4-1 ) = z( j4+2 )*( z( j4 ) / z( j4-3 ) )
               d = z( j4+2 )*( d / z( j4-3 ) )
            END IF
            dmin = min( dmin, d )
            emin = min( emin, z( j4-1 ) )
   20    CONTINUE
      END IF
*
*     Unroll last two steps.
*     They are kept out of the loop so that DNM2/DMIN2 and
*     DNM1/DMIN1 can be recorded on the way to DN/DMIN.  J4P2 picks
*     the input entry for either value of PP.
*
      dnm2 = d
      dmin2 = dmin
      j4 = 4*( n0-2 ) - pp
      j4p2 = j4 + 2*pp - 1
      z( j4-2 ) = dnm2 + z( j4p2 )
      IF( z( j4-2 ).EQ.zero ) THEN
         z( j4 ) = zero
         dnm1 = z( j4p2+2 )
         dmin = dnm1
         emin = zero
      ELSE IF( safmin*z( j4p2+2 ).LT.z( j4-2 ) .AND.
     $         safmin*z( j4-2 ).LT.z( j4p2+2 ) ) THEN
         temp = z( j4p2+2 ) / z( j4-2 )
         z( j4 ) = z( j4p2 )*temp
         dnm1 = dnm2*temp
      ELSE
         z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
         dnm1 = z( j4p2+2 )*( dnm2 / z( j4-2 ) )
      END IF
      dmin = min( dmin, dnm1 )
*
      dmin1 = dmin
      j4 = j4 + 4
      j4p2 = j4 + 2*pp - 1
      z( j4-2 ) = dnm1 + z( j4p2 )
      IF( z( j4-2 ).EQ.zero ) THEN
         z( j4 ) = zero
         dn = z( j4p2+2 )
         dmin = dn
         emin = zero
      ELSE IF( safmin*z( j4p2+2 ).LT.z( j4-2 ) .AND.
     $         safmin*z( j4-2 ).LT.z( j4p2+2 ) ) THEN
         temp = z( j4p2+2 ) / z( j4-2 )
         z( j4 ) = z( j4p2 )*temp
         dn = dnm1*temp
      ELSE
         z( j4 ) = z( j4p2+2 )*( z( j4p2 ) / z( j4-2 ) )
         dn = z( j4p2+2 )*( dnm1 / z( j4-2 ) )
      END IF
      dmin = min( dmin, dn )
*
*     J4 is 4*( N0-1 ) - PP here, so DN goes to Z( 4*N0-PP-2 );
*     EMIN goes to Z( 4*N0-PP ).
*
      z( j4+2 ) = dn
      z( 4*n0-pp ) = emin
      RETURN
*
*     End of SLASQ6
*

◆ slasrt()

subroutine slasrt	(	character	id,
		integer	n,
		real, dimension( * )	d,
		integer	info )

SLASRT sorts numbers in increasing or decreasing order.

Download SLASRT + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> Sort the numbers in D in increasing order (if ID = 'I') or
!> in decreasing order (if ID = 'D' ).
!>
!> Use Quick Sort, reverting to Insertion sort on arrays of
!> size <= 20. Dimension of STACK limits N to about 2**32.
!>

Parameters

[in]	ID	!> ID is CHARACTER*1 !> = 'I': sort D in increasing order; !> = 'D': sort D in decreasing order. !>
[in]	N	!> N is INTEGER !> The length of the array D. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the array to be sorted. !> On exit, D has been sorted into increasing order !> (D(1) <= ... <= D(N) ) or into decreasing order !> (D(1) >= ... >= D(N) ), depending on ID. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 87 of file slasrt.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of SLASRT: sorts D( 1:N ) in place.  ID = 'D' requests
*     decreasing order, ID = 'I' increasing order.  Segments whose
*     index span exceeds CUTOFF are split around a median-of-three
*     pivot and both parts are queued on an explicit stack; shorter
*     segments are finished with an insertion sort.
*
*     .. Scalar Arguments ..
      CHARACTER          ID
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      REAL               D( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     CUTOFF is the largest index span (last - first) that is handed
*     to the insertion sort.
      INTEGER            CUTOFF
      parameter( CUTOFF = 20 )
*     ..
*     .. Local Scalars ..
      LOGICAL            DESCND
      INTEGER            HI, LEFT, LO, NEXT, POS, RIGHT, SPAN, TOP
      REAL               HELD, PIVOT, VMAX, VMID, VMIN
*     ..
*     .. Local Arrays ..
*     SEG( 1, k ) / SEG( 2, k ) are the first / last index of the
*     k-th pending segment.
      INTEGER            SEG( 2, 32 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  ID is examined before N, so an
*     illegal ID is reported even when N is negative as well.
*
      info = 0
      descnd = lsame( id, 'D' )
      IF( .NOT.descnd ) THEN
         IF( .NOT.lsame( id, 'I' ) )
     $      info = -1
      END IF
      IF( info.EQ.0 .AND. n.LT.0 )
     $   info = -2
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SLASRT', -info )
         RETURN
      END IF
*
*     Fewer than two elements: nothing to sort.
*
      IF( n.LE.1 )
     $   RETURN
*
*     Start with the whole array as the only pending segment.
*
      top = 1
      seg( 1, 1 ) = 1
      seg( 2, 1 ) = n
*
      DO WHILE( top.GT.0 )
*
*        Pop the next pending segment D( LO:HI ).
*
         lo = seg( 1, top )
         hi = seg( 2, top )
         top = top - 1
         span = hi - lo
*
         IF( span.GT.CUTOFF ) THEN
*
*           Long segment.  The pivot is the median of the first,
*           middle and last entries.
*
            IF( d( lo ).LT.d( hi ) ) THEN
               vmin = d( lo )
               vmax = d( hi )
            ELSE
               vmin = d( hi )
               vmax = d( lo )
            END IF
            vmid = d( ( lo+hi ) / 2 )
            IF( vmid.LT.vmin ) THEN
               pivot = vmin
            ELSE IF( vmid.LT.vmax ) THEN
               pivot = vmid
            ELSE
               pivot = vmax
            END IF
*
*           Scan RIGHT downwards and LEFT upwards, exchanging each
*           out-of-place pair, until the two scans meet.  The tests
*           are written as negations of the "keep scanning"
*           comparison so that unordered operands stop the scan.
*
            left = lo - 1
            right = hi + 1
            IF( descnd ) THEN
               DO
                  DO
                     right = right - 1
                     IF( .NOT.( d( right ).LT.pivot ) ) EXIT
                  END DO
                  DO
                     left = left + 1
                     IF( .NOT.( d( left ).GT.pivot ) ) EXIT
                  END DO
                  IF( left.GE.right ) EXIT
                  held = d( left )
                  d( left ) = d( right )
                  d( right ) = held
               END DO
            ELSE
               DO
                  DO
                     right = right - 1
                     IF( .NOT.( d( right ).GT.pivot ) ) EXIT
                  END DO
                  DO
                     left = left + 1
                     IF( .NOT.( d( left ).LT.pivot ) ) EXIT
                  END DO
                  IF( left.GE.right ) EXIT
                  held = d( left )
                  d( left ) = d( right )
                  d( right ) = held
               END DO
            END IF
*
*           Queue D( LO:RIGHT ) and D( RIGHT+1:HI ), the longer part
*           first, so that the shorter part is the next one popped.
*
            IF( right-lo.GT.hi-right-1 ) THEN
               seg( 1, top+1 ) = lo
               seg( 2, top+1 ) = right
               seg( 1, top+2 ) = right + 1
               seg( 2, top+2 ) = hi
            ELSE
               seg( 1, top+1 ) = right + 1
               seg( 2, top+1 ) = hi
               seg( 1, top+2 ) = lo
               seg( 2, top+2 ) = right
            END IF
            top = top + 2
*
         ELSE IF( span.GT.0 ) THEN
*
*           Short segment: insertion sort.  Each new entry is
*           exchanged with its lower neighbour until the pair is
*           already in the requested order.
*
            IF( descnd ) THEN
               DO next = lo + 1, hi
                  DO pos = next, lo + 1, -1
                     IF( .NOT.( d( pos ).GT.d( pos-1 ) ) ) EXIT
                     held = d( pos )
                     d( pos ) = d( pos-1 )
                     d( pos-1 ) = held
                  END DO
               END DO
            ELSE
               DO next = lo + 1, hi
                  DO pos = next, lo + 1, -1
                     IF( .NOT.( d( pos ).LT.d( pos-1 ) ) ) EXIT
                     held = d( pos )
                     d( pos ) = d( pos-1 )
                     d( pos-1 ) = held
                  END DO
               END DO
            END IF
*
         END IF
      END DO
      RETURN
*
*     End of SLASRT
*

◆ spttrf()

subroutine spttrf	(	integer	n,
		real, dimension( * )	d,
		real, dimension( * )	e,
		integer	info )

SPTTRF

Download SPTTRF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SPTTRF computes the L*D*L**T factorization of a real symmetric
!> positive definite tridiagonal matrix A.  The factorization may also
!> be regarded as having the form A = U**T*D*U.
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the n diagonal elements of the tridiagonal matrix !> A. On exit, the n diagonal elements of the diagonal matrix !> D from the LDL**T factorization of A. !>
[in,out]	E	!> E is REAL array, dimension (N-1) !> On entry, the (n-1) subdiagonal elements of the tridiagonal !> matrix A. On exit, the (n-1) subdiagonal elements of the !> unit bidiagonal factor L from the L*D*L**T factorization of A. !> E can also be regarded as the superdiagonal of the unit !> bidiagonal factor U from the U**T*D*U factorization of A. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -k, the k-th argument had an illegal value !> > 0: if INFO = k, the leading minor of order k is not !> positive definite; if k < N, the factorization could not !> be completed, while if k = N, the factorization was !> completed, but D(N) <= 0. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 90 of file spttrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of SPTTRF: overwrites D and E with the factors of the
*     L*D*L**T factorization of the tridiagonal matrix they hold on
*     entry.  INFO = k > 0 reports the first pivot D( k ) found to
*     be <= 0.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      REAL               D( * ), E( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO
      parameter( zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
*     NPEEL : number of leading steps done before the groups of four
*     JBLK  : first pivot index of the current group of four
*     K     : pivot index of the current elimination step
*     OFFD  : original off-diagonal entry E( K )
      INTEGER            JBLK, K, NPEEL
      REAL               OFFD
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          mod
*     ..
*     .. Executable Statements ..
*
*     Argument check: N is the only argument that can be illegal.
*
      info = 0
      IF( n.LT.0 ) THEN
         info = -1
         CALL xerbla( 'SPTTRF', -info )
         RETURN
      END IF
*
*     Empty matrix: nothing to factor.
*
      IF( n.EQ.0 ) RETURN
*
*     The N-1 elimination steps are done as MOD( N-1, 4 ) leading
*     steps followed by whole groups of four.  Every step first
*     requires a positive pivot D( K ), then forms the multiplier
*     E( K ) and updates D( K+1 ).
*
      npeel = mod( n-1, 4 )
      DO k = 1, npeel
         IF( d( k ).LE.zero ) THEN
            info = k
            RETURN
         END IF
         offd = e( k )
         e( k ) = offd / d( k )
         d( k+1 ) = d( k+1 ) - e( k )*offd
      END DO
*
      DO jblk = npeel + 1, n - 4, 4
         DO k = jblk, jblk + 3
*
*           Stop at the first non-positive pivot: the matrix is not
*           positive definite.
*
            IF( d( k ).LE.zero ) THEN
               info = k
               RETURN
            END IF
            offd = e( k )
            e( k ) = offd / d( k )
            d( k+1 ) = d( k+1 ) - e( k )*offd
         END DO
      END DO
*
*     The last pivot is never used as a divisor above, so test it
*     here.
*
      IF( d( n ).LE.zero ) info = n
      RETURN
*
*     End of SPTTRF
*

◆ sstebz()

subroutine sstebz	(	character	range,
		character	order,
		integer	n,
		real	vl,
		real	vu,
		integer	il,
		integer	iu,
		real	abstol,
		real, dimension( * )	d,
		real, dimension( * )	e,
		integer	m,
		integer	nsplit,
		real, dimension( * )	w,
		integer, dimension( * )	iblock,
		integer, dimension( * )	isplit,
		real, dimension( * )	work,
		integer, dimension( * )	iwork,
		integer	info )

SSTEBZ

Download SSTEBZ + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SSTEBZ computes the eigenvalues of a symmetric tridiagonal
!> matrix T.  The user may ask for all eigenvalues, all eigenvalues
!> in the half-open interval (VL, VU], or the IL-th through IU-th
!> eigenvalues.
!>
!> To avoid overflow, the matrix must be scaled so that its
!> largest element is no greater than overflow**(1/2) * underflow**(1/4) in absolute value, and for greatest
!> accuracy, it should not be much smaller than that.
!>
!> See W. Kahan , Report CS41, Computer Science Dept., Stanford
!> University, July 21, 1966.
!>

Parameters

[in]	RANGE	!> RANGE is CHARACTER*1 !> = 'A': ("All") all eigenvalues will be found. !> = 'V': ("Value") all eigenvalues in the half-open interval !> (VL, VU] will be found. !> = 'I': ("Index") the IL-th through IU-th eigenvalues (of the !> entire matrix) will be found. !>
[in]	ORDER	!> ORDER is CHARACTER*1 !> = 'B': ("By Block") the eigenvalues will be grouped by !> split-off block (see IBLOCK, ISPLIT) and !> ordered from smallest to largest within !> the block. !> = 'E': ("Entire matrix") !> the eigenvalues for the entire matrix !> will be ordered from smallest to !> largest. !>
[in]	N	!> N is INTEGER !> The order of the tridiagonal matrix T. N >= 0. !>
[in]	VL	!> VL is REAL !> !> If RANGE='V', the lower bound of the interval to !> be searched for eigenvalues. Eigenvalues less than or equal !> to VL, or greater than VU, will not be returned. VL < VU. !> Not referenced if RANGE = 'A' or 'I'. !>
[in]	VU	!> VU is REAL !> !> If RANGE='V', the upper bound of the interval to !> be searched for eigenvalues. Eigenvalues less than or equal !> to VL, or greater than VU, will not be returned. VL < VU. !> Not referenced if RANGE = 'A' or 'I'. !>
[in]	IL	!> IL is INTEGER !> !> If RANGE='I', the index of the !> smallest eigenvalue to be returned. !> 1 <= IL <= IU <= N, if N > 0; IL = 1 and IU = 0 if N = 0. !> Not referenced if RANGE = 'A' or 'V'. !>
[in]	IU	!> IU is INTEGER !> !> If RANGE='I', the index of the !> largest eigenvalue to be returned. !> 1 <= IL <= IU <= N, if N > 0; IL = 1 and IU = 0 if N = 0. !> Not referenced if RANGE = 'A' or 'V'. !>
[in]	ABSTOL	!> ABSTOL is REAL !> The absolute tolerance for the eigenvalues. An eigenvalue !> (or cluster) is considered to be located if it has been !> determined to lie in an interval whose width is ABSTOL or !> less. If ABSTOL is less than or equal to zero, then ULP*|T| !> will be used, where |T| means the 1-norm of T. !> !> Eigenvalues will be computed most accurately when ABSTOL is !> set to twice the underflow threshold 2*SLAMCH('S'), not zero. !>
[in]	D	!> D is REAL array, dimension (N) !> The n diagonal elements of the tridiagonal matrix T. !>
[in]	E	!> E is REAL array, dimension (N-1) !> The (n-1) off-diagonal elements of the tridiagonal matrix T. !>
[out]	M	!> M is INTEGER !> The actual number of eigenvalues found. 0 <= M <= N. !> (See also the description of INFO=2,3.) !>
[out]	NSPLIT	!> NSPLIT is INTEGER !> The number of diagonal blocks in the matrix T. !> 1 <= NSPLIT <= N. !>
[out]	W	!> W is REAL array, dimension (N) !> On exit, the first M elements of W will contain the !> eigenvalues. (SSTEBZ may use the remaining N-M elements as !> workspace.) !>
[out]	IBLOCK	!> IBLOCK is INTEGER array, dimension (N) !> At each row/column j where E(j) is zero or small, the !> matrix T is considered to split into a block diagonal !> matrix. On exit, if INFO = 0, IBLOCK(i) specifies to which !> block (from 1 to the number of blocks) the eigenvalue W(i) !> belongs. (SSTEBZ may use the remaining N-M elements as !> workspace.) !>
[out]	ISPLIT	!> ISPLIT is INTEGER array, dimension (N) !> The splitting points, at which T breaks up into submatrices. !> The first submatrix consists of rows/columns 1 to ISPLIT(1), !> the second of rows/columns ISPLIT(1)+1 through ISPLIT(2), !> etc., and the NSPLIT-th consists of rows/columns !> ISPLIT(NSPLIT-1)+1 through ISPLIT(NSPLIT)=N. !> (Only the first NSPLIT elements will actually be used, but !> since the user cannot know a priori what value NSPLIT will !> have, N words must be reserved for ISPLIT.) !>
[out]	WORK	!> WORK is REAL array, dimension (4*N) !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (3*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: some or all of the eigenvalues failed to converge or !> were not computed: !> =1 or 3: Bisection failed to converge for some !> eigenvalues; these eigenvalues are flagged by a !> negative block number. The effect is that the !> eigenvalues may not be as accurate as the !> absolute and relative tolerances. This is !> generally caused by unexpectedly inaccurate !> arithmetic. !> =2 or 3: RANGE='I' only: Not all of the eigenvalues !> IL:IU were found. !> Effect: M < IU+1-IL !> Cause: non-monotonic arithmetic, causing the !> Sturm sequence to be non-monotonic. !> Cure: recalculate, using RANGE='A', and pick !> out eigenvalues IL:IU. In some cases, !> increasing the PARAMETER "FUDGE" may !> make things work. !> = 4: RANGE='I', and the Gershgorin interval !> initially used was too small. No eigenvalues !> were computed. !> Probable cause: your machine has sloppy !> floating-point arithmetic. !> Cure: Increase the PARAMETER "FUDGE", !> recompile, and try again. !>

Internal Parameters:

!>  RELFAC  REAL, default = 2.0e0
!>          The relative tolerance.  An interval (a,b] lies within
!>          "relative tolerance" if  b-a < RELFAC*ulp*max(|a|,|b|),
!>          where "ulp" is the machine precision (distance from 1 to
!>          the next larger floating point number.)
!>
!>  FUDGE   REAL, default = 2.1e0
!>          A "fudge factor" to widen the Gershgorin intervals.  Ideally,
!>          a value of 1 should work, but on machines with sloppy
!>          arithmetic, this needs to be larger.  The default for
!>          publicly released versions should be large enough to handle
!>          the worst machine around.  Note that this has no effect
!>          on accuracy of the solution.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 270 of file sstebz.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of SSTEBZ.  Outline of the statements below:
*       1. decode RANGE / ORDER and validate the arguments;
*       2. find the split points of T, storing E(j)**2 (zero at a
*          split) in WORK( 1:N-1 ) and the split rows in ISPLIT;
*       3. RANGE='I' only: call SLAEBZ on the whole matrix to get
*          the search bounds WL, WU;
*       4. for each diagonal block, either handle it directly (1-by-1
*          block) or call SLAEBZ twice to count and then refine the
*          eigenvalues between the bounds;
*       5. RANGE='I' only: drop surplus eigenvalues;
*       6. ORDER='E' only: sort W (carrying IBLOCK) into increasing
*          order;
*       7. encode non-convergence / too-few-eigenvalues into INFO.
*     NOTE(review): the meaning of the SLAEBZ arguments and outputs
*     is defined in SLAEBZ, which is not visible in this listing.
*
*     .. Scalar Arguments ..
      CHARACTER          ORDER, RANGE
      INTEGER            IL, INFO, IU, M, N, NSPLIT
      REAL               ABSTOL, VL, VU
*     ..
*     .. Array Arguments ..
      INTEGER            IBLOCK( * ), ISPLIT( * ), IWORK( * )
      REAL               D( * ), E( * ), W( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE, TWO, HALF
      parameter( zero = 0.0e0, one = 1.0e0, two = 2.0e0,
     $                   half = 1.0e0 / two )
*     FUDGE scales the widening applied to the Gershgorin bounds
*     GL / GU below; RELFAC scales ULP to form RTOLI.
      REAL               FUDGE, RELFAC
      parameter( fudge = 2.1e0, relfac = 2.0e0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            NCNVRG, TOOFEW
      INTEGER            IB, IBEGIN, IDISCL, IDISCU, IE, IEND, IINFO,
     $                   IM, IN, IOFF, IORDER, IOUT, IRANGE, ITMAX,
     $                   ITMP1, IW, IWOFF, J, JB, JDISC, JE, NB, NWL,
     $                   NWU
      REAL               ATOLI, BNORM, GL, GU, PIVMIN, RTOLI, SAFEMN,
     $                   TMP1, TMP2, TNORM, ULP, WKILL, WL, WLU, WU, WUL
*     ..
*     .. Local Arrays ..
      INTEGER            IDUMMA( 1 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      REAL               SLAMCH
      EXTERNAL           lsame, ilaenv, slamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           slaebz, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, int, log, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
      info = 0
*
*     Decode RANGE
*     (IRANGE = 1 / 2 / 3 for 'A' / 'V' / 'I', 0 if unrecognised)
*
      IF( lsame( range, 'A' ) ) THEN
         irange = 1
      ELSE IF( lsame( range, 'V' ) ) THEN
         irange = 2
      ELSE IF( lsame( range, 'I' ) ) THEN
         irange = 3
      ELSE
         irange = 0
      END IF
*
*     Decode ORDER
*     (IORDER = 2 for 'B', 1 for 'E', 0 if unrecognised)
*
      IF( lsame( order, 'B' ) ) THEN
         iorder = 2
      ELSE IF( lsame( order, 'E' ) ) THEN
         iorder = 1
      ELSE
         iorder = 0
      END IF
*
*     Check for Errors
*     Only the first failing test sets INFO.  For RANGE='V' the
*     only further test is VL < VU, reported as argument 5; the
*     IL / IU tests are reached only for RANGE='I'.
*
      IF( irange.LE.0 ) THEN
         info = -1
      ELSE IF( iorder.LE.0 ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( irange.EQ.2 ) THEN
         IF( vl.GE.vu ) info = -5
      ELSE IF( irange.EQ.3 .AND. ( il.LT.1 .OR. il.GT.max( 1, n ) ) )
     $          THEN
         info = -6
      ELSE IF( irange.EQ.3 .AND. ( iu.LT.min( n, il ) .OR. iu.GT.n ) )
     $          THEN
         info = -7
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SSTEBZ', -info )
         RETURN
      END IF
*
*     Initialize error flags
*
      info = 0
      ncnvrg = .false.
      toofew = .false.
*
*     Quick return if possible
*     (M is set to zero before returning; NSPLIT is not assigned on
*     this path)
*
      m = 0
      IF( n.EQ.0 )
     $   RETURN
*
*     Simplifications:
*     an index range covering 1..N is treated as RANGE='A'.
*
      IF( irange.EQ.3 .AND. il.EQ.1 .AND. iu.EQ.n )
     $   irange = 1
*
*     Get machine constants
*     NB is the minimum vector length for vector bisection, or 0
*     if only scalar is to be done.
*
      safemn = slamch( 'S' )
      ulp = slamch( 'P' )
      rtoli = ulp*relfac
      nb = ilaenv( 1, 'SSTEBZ', ' ', n, -1, -1, -1 )
      IF( nb.LE.1 )
     $   nb = 0
*
*     Special Case when N=1
*     The single eigenvalue D(1) is returned unless RANGE='V' and
*     D(1) lies outside (VL,VU].
*
      IF( n.EQ.1 ) THEN
         nsplit = 1
         isplit( 1 ) = 1
         IF( irange.EQ.2 .AND. ( vl.GE.d( 1 ) .OR. vu.LT.d( 1 ) ) ) THEN
            m = 0
         ELSE
            w( 1 ) = d( 1 )
            iblock( 1 ) = 1
            m = 1
         END IF
         RETURN
      END IF
*
*     Compute Splitting Points
*     T is split after row J-1 when E(J-1)**2 is smaller than
*     |D(J)*D(J-1)|*ULP**2 + SAFEMN.  WORK( 1:N-1 ) receives
*     E(j)**2, or zero at a split.  On exit from the loop PIVMIN is
*     SAFEMN * max( 1, largest retained E(j)**2 ).
*
      nsplit = 1
      work( n ) = zero
      pivmin = one
*
      DO 10 j = 2, n
         tmp1 = e( j-1 )**2
         IF( abs( d( j )*d( j-1 ) )*ulp**2+safemn.GT.tmp1 ) THEN
            isplit( nsplit ) = j - 1
            nsplit = nsplit + 1
            work( j-1 ) = zero
         ELSE
            work( j-1 ) = tmp1
            pivmin = max( pivmin, tmp1 )
         END IF
   10 CONTINUE
      isplit( nsplit ) = n
      pivmin = pivmin*safemn
*
*     Compute Interval and ATOLI
*
      IF( irange.EQ.3 ) THEN
*
*        RANGE='I': Compute the interval containing eigenvalues
*                   IL through IU.
*
*        Compute Gershgorin interval for entire (split) matrix
*        and use it as the initial interval
*        (SQRT( WORK( J ) ) is |E(J)|, or zero at a split point)
*
         gu = d( 1 )
         gl = d( 1 )
         tmp1 = zero
*
         DO 20 j = 1, n - 1
            tmp2 = sqrt( work( j ) )
            gu = max( gu, d( j )+tmp1+tmp2 )
            gl = min( gl, d( j )-tmp1-tmp2 )
            tmp1 = tmp2
   20    CONTINUE
*
         gu = max( gu, d( n )+tmp1 )
         gl = min( gl, d( n )-tmp1 )
         tnorm = max( abs( gl ), abs( gu ) )
*        Widen the interval; note the lower bound is moved by
*        2*FUDGE*PIVMIN while the upper bound is moved by
*        FUDGE*PIVMIN.
         gl = gl - fudge*tnorm*ulp*n - fudge*two*pivmin
         gu = gu + fudge*tnorm*ulp*n + fudge*pivmin
*
*        Compute Iteration parameters
*        ITMAX = INT( log2( (TNORM+PIVMIN)/PIVMIN ) ) + 2
*
         itmax = int( ( log( tnorm+pivmin )-log( pivmin ) ) /
     $           log( two ) ) + 2
         IF( abstol.LE.zero ) THEN
            atoli = ulp*tnorm
         ELSE
            atoli = abstol
         END IF
*
*        Set up two search intervals, both equal to [GL,GU], in
*        WORK( N+1:N+4 ), with WORK( N+5:N+6 ) = (GL,GU) and
*        IWORK( 1:4 ) = (-1,-1,N+1,N+1).  IWORK( 5:6 ) carry the
*        target counts IL-1 and IU passed to SLAEBZ.
*        NOTE(review): exact roles of these arrays are defined by
*        SLAEBZ (IJOB=3) -- confirm against that routine.
*
         work( n+1 ) = gl
         work( n+2 ) = gl
         work( n+3 ) = gu
         work( n+4 ) = gu
         work( n+5 ) = gl
         work( n+6 ) = gu
         iwork( 1 ) = -1
         iwork( 2 ) = -1
         iwork( 3 ) = n + 1
         iwork( 4 ) = n + 1
         iwork( 5 ) = il - 1
         iwork( 6 ) = iu
*
         CALL slaebz( 3, itmax, n, 2, 2, nb, atoli, rtoli, pivmin, d, e,
     $                work, iwork( 5 ), work( n+1 ), work( n+5 ), iout,
     $                iwork, w, iblock, iinfo )
*
*        Pick WL/WLU/NWL and WU/WUL/NWU from the two returned
*        intervals; which interval supplies which bound depends on
*        whether IWORK( 6 ) still equals IU.
*        NOTE(review): IINFO from this call is not examined.
*
         IF( iwork( 6 ).EQ.iu ) THEN
            wl = work( n+1 )
            wlu = work( n+3 )
            nwl = iwork( 1 )
            wu = work( n+4 )
            wul = work( n+2 )
            nwu = iwork( 4 )
         ELSE
            wl = work( n+2 )
            wlu = work( n+4 )
            nwl = iwork( 2 )
            wu = work( n+3 )
            wul = work( n+1 )
            nwu = iwork( 3 )
         END IF
*
*        Counts outside 0 <= NWL < N and 1 <= NWU <= N mean the
*        initial interval was unusable: give up with INFO = 4
*        (M is still zero at this point).
*
         IF( nwl.LT.0 .OR. nwl.GE.n .OR. nwu.LT.1 .OR. nwu.GT.n ) THEN
            info = 4
            RETURN
         END IF
      ELSE
*
*        RANGE='A' or 'V' -- Set ATOLI
*        TNORM is the largest of |D(j)| + |E(j-1)| + |E(j)| over
*        all rows (with the missing E term dropped at the ends).
*
         tnorm = max( abs( d( 1 ) )+abs( e( 1 ) ),
     $           abs( d( n ) )+abs( e( n-1 ) ) )
*
         DO 30 j = 2, n - 1
            tnorm = max( tnorm, abs( d( j ) )+abs( e( j-1 ) )+
     $              abs( e( j ) ) )
   30    CONTINUE
*
         IF( abstol.LE.zero ) THEN
            atoli = ulp*tnorm
         ELSE
            atoli = abstol
         END IF
*
*        For RANGE='A' WL and WU are only placeholders: every use
*        below is bypassed when IRANGE = 1.
*
         IF( irange.EQ.2 ) THEN
            wl = vl
            wu = vu
         ELSE
            wl = zero
            wu = zero
         END IF
      END IF
*
*     Find Eigenvalues -- Loop Over Blocks and recompute NWL and NWU.
*     NWL accumulates the number of eigenvalues .le. WL,
*     NWU accumulates the number of eigenvalues .le. WU
*
      m = 0
      iend = 0
      info = 0
      nwl = 0
      nwu = 0
*
      DO 70 jb = 1, nsplit
*        Block JB occupies rows/columns IBEGIN..IEND; IN is its
*        order.
         ioff = iend
         ibegin = ioff + 1
         iend = isplit( jb )
         in = iend - ioff
*
         IF( in.EQ.1 ) THEN
*
*           Special Case -- IN=1
*           The eigenvalue is D( IBEGIN ); it is counted / accepted
*           by comparing D( IBEGIN )-PIVMIN with WL and WU.
*
            IF( irange.EQ.1 .OR. wl.GE.d( ibegin )-pivmin )
     $         nwl = nwl + 1
            IF( irange.EQ.1 .OR. wu.GE.d( ibegin )-pivmin )
     $         nwu = nwu + 1
            IF( irange.EQ.1 .OR. ( wl.LT.d( ibegin )-pivmin .AND. wu.GE.
     $          d( ibegin )-pivmin ) ) THEN
               m = m + 1
               w( m ) = d( ibegin )
               iblock( m ) = jb
            END IF
         ELSE
*
*           General Case -- IN > 1
*
*           Compute Gershgorin Interval
*           and use it as the initial interval
*
            gu = d( ibegin )
            gl = d( ibegin )
            tmp1 = zero
*
            DO 40 j = ibegin, iend - 1
               tmp2 = abs( e( j ) )
               gu = max( gu, d( j )+tmp1+tmp2 )
               gl = min( gl, d( j )-tmp1-tmp2 )
               tmp1 = tmp2
   40       CONTINUE
*
            gu = max( gu, d( iend )+tmp1 )
            gl = min( gl, d( iend )-tmp1 )
            bnorm = max( abs( gl ), abs( gu ) )
            gl = gl - fudge*bnorm*ulp*in - fudge*pivmin
            gu = gu + fudge*bnorm*ulp*in + fudge*pivmin
*
*           Compute ATOLI for the current submatrix
*
            IF( abstol.LE.zero ) THEN
               atoli = ulp*max( abs( gl ), abs( gu ) )
            ELSE
               atoli = abstol
            END IF
*
*           RANGE='V' or 'I': clip the block interval to [WL,WU].
*           A block lying wholly below WL contributes IN to both
*           counts and is skipped; a block whose clipped interval
*           is empty is skipped without changing the counts.
*
            IF( irange.GT.1 ) THEN
               IF( gu.LT.wl ) THEN
                  nwl = nwl + in
                  nwu = nwu + in
                  GO TO 70
               END IF
               gl = max( gl, wl )
               gu = min( gu, wu )
               IF( gl.GE.gu )
     $            GO TO 70
            END IF
*
*           Set Up Initial Interval
*           (endpoints GL and GU go to WORK( N+1 ) and
*           WORK( N+IN+1 ); the first SLAEBZ call, IJOB=1, returns
*           IM and fills IWORK( 1 ) and IWORK( IN+1 ), which are
*           added to NWL and NWU)
*
            work( n+1 ) = gl
            work( n+in+1 ) = gu
            CALL slaebz( 1, 0, in, in, 1, nb, atoli, rtoli, pivmin,
     $                   d( ibegin ), e( ibegin ), work( ibegin ),
     $                   idumma, work( n+1 ), work( n+2*in+1 ), im,
     $                   iwork, w( m+1 ), iblock( m+1 ), iinfo )
*
            nwl = nwl + iwork( 1 )
            nwu = nwu + iwork( in+1 )
*           IWOFF converts the per-block values in IWORK to
*           positions in W / IBLOCK (used in loop 50 below).
            iwoff = m - iwork( 1 )
*
*           Compute Eigenvalues
*           ITMAX = INT( log2( (GU-GL+PIVMIN)/PIVMIN ) ) + 2
*
            itmax = int( ( log( gu-gl+pivmin )-log( pivmin ) ) /
     $              log( two ) ) + 2
            CALL slaebz( 2, itmax, in, in, 1, nb, atoli, rtoli, pivmin,
     $                   d( ibegin ), e( ibegin ), work( ibegin ),
     $                   idumma, work( n+1 ), work( n+2*in+1 ), iout,
     $                   iwork, w( m+1 ), iblock( m+1 ), iinfo )
*
*           Copy Eigenvalues Into W and IBLOCK
*           Use -JB for block number for unconverged eigenvalues.
*           Each of the IOUT returned intervals contributes its
*           midpoint TMP1, stored in positions
*           IWORK( J )+1+IWOFF .. IWORK( J+IN )+IWOFF of W.
*
            DO 60 j = 1, iout
               tmp1 = half*( work( j+n )+work( j+in+n ) )
*
*              Flag non-convergence.
*              (the last IINFO intervals are treated as
*              unconverged)
*
               IF( j.GT.iout-iinfo ) THEN
                  ncnvrg = .true.
                  ib = -jb
               ELSE
                  ib = jb
               END IF
               DO 50 je = iwork( j ) + 1 + iwoff,
     $                 iwork( j+in ) + iwoff
                  w( je ) = tmp1
                  iblock( je ) = ib
   50          CONTINUE
   60       CONTINUE
*
*           IM is the value returned by the IJOB=1 call above.
*
            m = m + im
         END IF
   70 CONTINUE
*
*     If RANGE='I', then (WL,WU) contains eigenvalues NWL+1,...,NWU
*     If NWL+1 < IL or NWU > IU, discard extra eigenvalues.
*
      IF( irange.EQ.3 ) THEN
         im = 0
*        IDISCL / IDISCU: number of surplus eigenvalues at the low /
*        high end; a negative value means too few were found.
         idiscl = il - 1 - nwl
         idiscu = nwu - iu
*
*        First pass: compact W in place, dropping values <= WLU
*        while IDISCL > 0 and values >= WUL while IDISCU > 0.
*
         IF( idiscl.GT.0 .OR. idiscu.GT.0 ) THEN
            DO 80 je = 1, m
               IF( w( je ).LE.wlu .AND. idiscl.GT.0 ) THEN
                  idiscl = idiscl - 1
               ELSE IF( w( je ).GE.wul .AND. idiscu.GT.0 ) THEN
                  idiscu = idiscu - 1
               ELSE
                  im = im + 1
                  w( im ) = w( je )
                  iblock( im ) = iblock( je )
               END IF
   80       CONTINUE
            m = im
         END IF
         IF( idiscl.GT.0 .OR. idiscu.GT.0 ) THEN
*
*           Code to deal with effects of bad arithmetic:
*           Some low eigenvalues to be discarded are not in (WL,WLU],
*           or high eigenvalues to be discarded are not in (WUL,WU]
*           so just kill off the smallest IDISCL/largest IDISCU
*           eigenvalues, by simply finding the smallest/largest
*           eigenvalue(s).
*
*           (If N(w) is monotone non-decreasing, this should never
*               happen.)
*
*           Entries to be removed are marked with IBLOCK = 0 and
*           squeezed out in loop 130.
*           NOTE(review): if a search finds no live entry, IW stays
*           0 and IBLOCK( 0 ) is written -- confirm this cannot
*           occur for valid input.
*
            IF( idiscl.GT.0 ) THEN
               wkill = wu
               DO 100 jdisc = 1, idiscl
                  iw = 0
                  DO 90 je = 1, m
                     IF( iblock( je ).NE.0 .AND.
     $                   ( w( je ).LT.wkill .OR. iw.EQ.0 ) ) THEN
                        iw = je
                        wkill = w( je )
                     END IF
   90             CONTINUE
                  iblock( iw ) = 0
  100          CONTINUE
            END IF
            IF( idiscu.GT.0 ) THEN
*
               wkill = wl
               DO 120 jdisc = 1, idiscu
                  iw = 0
                  DO 110 je = 1, m
                     IF( iblock( je ).NE.0 .AND.
     $                   ( w( je ).GT.wkill .OR. iw.EQ.0 ) ) THEN
                        iw = je
                        wkill = w( je )
                     END IF
  110             CONTINUE
                  iblock( iw ) = 0
  120          CONTINUE
            END IF
            im = 0
            DO 130 je = 1, m
               IF( iblock( je ).NE.0 ) THEN
                  im = im + 1
                  w( im ) = w( je )
                  iblock( im ) = iblock( je )
               END IF
  130       CONTINUE
            m = im
         END IF
         IF( idiscl.LT.0 .OR. idiscu.LT.0 ) THEN
            toofew = .true.
         END IF
      END IF
*
*     If ORDER='B', do nothing -- the eigenvalues are already sorted
*        by block.
*     If ORDER='E', sort the eigenvalues from smallest to largest
*     (selection sort: position JE is exchanged with the smallest
*     later entry that is below it, IBLOCK moving with W; skipped
*     when there is only one block)
*
      IF( iorder.EQ.1 .AND. nsplit.GT.1 ) THEN
         DO 150 je = 1, m - 1
            ie = 0
            tmp1 = w( je )
            DO 140 j = je + 1, m
               IF( w( j ).LT.tmp1 ) THEN
                  ie = j
                  tmp1 = w( j )
               END IF
  140       CONTINUE
*
            IF( ie.NE.0 ) THEN
               itmp1 = iblock( ie )
               w( ie ) = w( je )
               iblock( ie ) = iblock( je )
               w( je ) = tmp1
               iblock( je ) = itmp1
            END IF
  150    CONTINUE
      END IF
*
*     Build the return code: 1 for non-convergence, 2 for too few
*     eigenvalues, 3 for both.
*
      info = 0
      IF( ncnvrg )
     $   info = info + 1
      IF( toofew )
     $   info = info + 2
      RETURN
*
*     End of SSTEBZ
*

◆ sstedc()

subroutine sstedc	(	character	compz,
		integer	n,
		real, dimension( * )	d,
		real, dimension( * )	e,
		real, dimension( ldz, * )	z,
		integer	ldz,
		real, dimension( * )	work,
		integer	lwork,
		integer, dimension( * )	iwork,
		integer	liwork,
		integer	info )

SSTEDC

Download SSTEDC + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SSTEDC computes all eigenvalues and, optionally, eigenvectors of a
!> symmetric tridiagonal matrix using the divide and conquer method.
!> The eigenvectors of a full or band real symmetric matrix can also be
!> found if SSYTRD or SSPTRD or SSBTRD has been used to reduce this
!> matrix to tridiagonal form.
!>
!> This code makes very mild assumptions about floating point
!> arithmetic. It will work on machines with a guard digit in
!> add/subtract, or on those binary machines without guard digits
!> which subtract like the Cray X-MP, Cray Y-MP, Cray C-90, or Cray-2.
!> It could conceivably fail on hexadecimal or decimal machines
!> without guard digits, but we know of none.  See SLAED3 for details.
!>

Parameters

[in]	COMPZ	!> COMPZ is CHARACTER*1 !> = 'N': Compute eigenvalues only. !> = 'I': Compute eigenvectors of tridiagonal matrix also. !> = 'V': Compute eigenvectors of original dense symmetric !> matrix also. On entry, Z contains the orthogonal !> matrix used to reduce the original matrix to !> tridiagonal form. !>
[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the diagonal elements of the tridiagonal matrix. !> On exit, if INFO = 0, the eigenvalues in ascending order. !>
[in,out]	E	!> E is REAL array, dimension (N-1) !> On entry, the subdiagonal elements of the tridiagonal matrix. !> On exit, E has been destroyed. !>
[in,out]	Z	!> Z is REAL array, dimension (LDZ,N) !> On entry, if COMPZ = 'V', then Z contains the orthogonal !> matrix used in the reduction to tridiagonal form. !> On exit, if INFO = 0, then if COMPZ = 'V', Z contains the !> orthonormal eigenvectors of the original symmetric matrix, !> and if COMPZ = 'I', Z contains the orthonormal eigenvectors !> of the symmetric tridiagonal matrix. !> If COMPZ = 'N', then Z is not referenced. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. LDZ >= 1. !> If eigenvectors are desired, then LDZ >= max(1,N). !>
[out]	WORK	!> WORK is REAL array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If COMPZ = 'N' or N <= 1 then LWORK must be at least 1. !> If COMPZ = 'V' and N > 1 then LWORK must be at least !> ( 1 + 3*N + 2*N*lg N + 4*N**2 ), !> where lg( N ) = smallest integer k such !> that 2**k >= N. !> If COMPZ = 'I' and N > 1 then LWORK must be at least !> ( 1 + 4*N + N**2 ). !> Note that for COMPZ = 'I' or 'V', then if N is less than or !> equal to the minimum divide size, usually 25, then LWORK need !> only be max(1,2*(N-1)). !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (MAX(1,LIWORK)) !> On exit, if INFO = 0, IWORK(1) returns the optimal LIWORK. !>
[in]	LIWORK	!> LIWORK is INTEGER !> The dimension of the array IWORK. !> If COMPZ = 'N' or N <= 1 then LIWORK must be at least 1. !> If COMPZ = 'V' and N > 1 then LIWORK must be at least !> ( 6 + 6*N + 5*N*lg N ). !> If COMPZ = 'I' and N > 1 then LIWORK must be at least !> ( 3 + 5*N ). !> Note that for COMPZ = 'I' or 'V', then if N is less than or !> equal to the minimum divide size, usually 25, then LIWORK !> need only be 1. !> !> If LIWORK = -1, then a workspace query is assumed; the !> routine only calculates the optimal size of the IWORK array, !> returns this value as the first entry of the IWORK array, and !> no error message related to LIWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: The algorithm failed to compute an eigenvalue while !> working on the submatrix lying in rows and columns !> INFO/(N+1) through mod(INFO,N+1). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA
Modified by Francoise Tisseur, University of Tennessee

Definition at line 186 of file sstedc.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd.--
*
*  Body of SSTEDC.  Overview of the statements below:
*    1. Decode COMPZ into ICOMPZ (0 = 'N', 1 = 'V', 2 = 'I') and
*       check N and LDZ.
*    2. Compute the minimum WORK / IWORK sizes (LWMIN, LIWMIN), store
*       them in WORK(1) / IWORK(1), and return early on a workspace
*       query (LWORK = -1 or LIWORK = -1).
*    3. COMPZ = 'N': eigenvalues only, via SSTERF.
*       N <= SMLSIZ: the whole problem is handed to SSTEQR.
*       Otherwise: split the matrix at negligible off-diagonal
*       entries and solve each independent block with SLAED0 (block
*       larger than SMLSIZ) or SSTEQR (smaller block), then sort the
*       eigenvalues into ascending order, swapping columns of Z.
*    4. Every exit through label 50 rewrites WORK(1) and IWORK(1)
*       with LWMIN and LIWMIN, since WORK is handed to the solvers
*       below as scratch space.
*
*     .. Scalar Arguments ..
      CHARACTER          COMPZ
      INTEGER            INFO, LDZ, LIWORK, LWORK, N
*     ..
*     .. Array Arguments ..
      INTEGER            IWORK( * )
      REAL               D( * ), E( * ), WORK( * ), Z( LDZ, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE, TWO
      parameter( zero = 0.0e0, one = 1.0e0, two = 2.0e0 )
*     ..
*     .. Local Scalars ..
*     START/FINISH delimit the current independent sub-problem, M is
*     its order, STOREZ is an offset into WORK, STRTRW is the first
*     row of Z passed to SLAED0.
      LOGICAL            LQUERY
      INTEGER            FINISH, I, ICOMPZ, II, J, K, LGN, LIWMIN,
     $                   LWMIN, M, SMLSIZ, START, STOREZ, STRTRW
      REAL               EPS, ORGNRM, P, TINY
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      REAL               SLAMCH, SLANST
      EXTERNAL           ilaenv, lsame, slamch, slanst
*     ..
*     .. External Subroutines ..
      EXTERNAL           sgemm, slacpy, slaed0, slascl, slaset, slasrt,
     $                   ssteqr, ssterf, sswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, int, log, max, mod, real, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*     A query is requested if either size argument is -1.
      lquery = ( lwork.EQ.-1 .OR. liwork.EQ.-1 )
*
      IF( lsame( compz, 'N' ) ) THEN
         icompz = 0
      ELSE IF( lsame( compz, 'V' ) ) THEN
         icompz = 1
      ELSE IF( lsame( compz, 'I' ) ) THEN
         icompz = 2
      ELSE
         icompz = -1
      END IF
*     INFO = -1 flags COMPZ, -2 flags N, -6 flags LDZ.
      IF( icompz.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ( ldz.LT.1 ) .OR.
     $         ( icompz.GT.0 .AND. ldz.LT.max( 1, n ) ) ) THEN
         info = -6
      END IF
*
      IF( info.EQ.0 ) THEN
*
*        Compute the workspace requirements
*
*        SMLSIZ is the largest order that is not divided further
*        (see the test N <= SMLSIZ below); it is obtained from ILAENV
*        with ISPEC = 9.
*
         smlsiz = ilaenv( 9, 'SSTEDC', ' ', 0, 0, 0, 0 )
         IF( n.LE.1 .OR. icompz.EQ.0 ) THEN
            liwmin = 1
            lwmin = 1
         ELSE IF( n.LE.smlsiz ) THEN
            liwmin = 1
            lwmin = 2*( n - 1 )
         ELSE
*           LGN = smallest integer with 2**LGN >= N.  The truncated
*           log ratio is bumped up to twice; NOTE(review): the second
*           bump presumably guards against rounding in the LOG
*           quotient - confirm.
            lgn = int( log( real( n ) )/log( two ) )
            IF( 2**lgn.LT.n )
     $         lgn = lgn + 1
            IF( 2**lgn.LT.n )
     $         lgn = lgn + 1
            IF( icompz.EQ.1 ) THEN
               lwmin = 1 + 3*n + 2*n*lgn + 4*n**2
               liwmin = 6 + 6*n + 5*n*lgn
            ELSE IF( icompz.EQ.2 ) THEN
               lwmin = 1 + 4*n + n**2
               liwmin = 3 + 5*n
            END IF
         END IF
*        Report the minimum sizes (LWMIN is converted to REAL here).
         work( 1 ) = lwmin
         iwork( 1 ) = liwmin
*
*        INFO = -8 flags LWORK, -10 flags LIWORK; neither is raised
*        for a workspace query.
         IF( lwork.LT.lwmin .AND. .NOT. lquery ) THEN
            info = -8
         ELSE IF( liwork.LT.liwmin .AND. .NOT. lquery ) THEN
            info = -10
         END IF
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SSTEDC', -info )
         RETURN
      ELSE IF (lquery) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
      IF( n.EQ.1 ) THEN
*        A 1-by-1 problem: D(1) is already the eigenvalue; for both
*        COMPZ = 'V' and 'I' the single entry of Z is set to one.
         IF( icompz.NE.0 )
     $      z( 1, 1 ) = one
         RETURN
      END IF
*
*     If the following conditional clause is removed, then the routine
*     will use the Divide and Conquer routine to compute only the
*     eigenvalues, which requires (3N + 3N**2) real workspace and
*     (2 + 5N + 2N lg(N)) integer workspace.
*     Since on many architectures SSTERF is much faster than any other
*     algorithm for finding eigenvalues only, it is used here
*     as the default. If the conditional clause is removed, then
*     information on the size of workspace needs to be changed.
*
*     If COMPZ = 'N', use SSTERF to compute the eigenvalues.
*
      IF( icompz.EQ.0 ) THEN
         CALL ssterf( n, d, e, info )
         GO TO 50
      END IF
*
*     If N is smaller than the minimum divide size (SMLSIZ+1), then
*     solve the problem with another solver.
*
      IF( n.LE.smlsiz ) THEN
*
         CALL ssteqr( compz, n, d, e, z, ldz, work, info )
*
      ELSE
*
*        If COMPZ = 'V', the Z matrix must be stored elsewhere for later
*        use.
*
*        STOREZ is the offset in WORK that follows an N*N block
*        starting at WORK(1) when COMPZ = 'V'; otherwise it is 1.
*
         IF( icompz.EQ.1 ) THEN
            storez = 1 + n*n
         ELSE
            storez = 1
         END IF
*
*        COMPZ = 'I': start from Z = identity.
*
         IF( icompz.EQ.2 ) THEN
            CALL slaset( 'Full', n, n, zero, one, z, ldz )
         END IF
*
*        Scale.
*
*        Only the norm is computed here; a zero matrix needs no
*        further work, so jump straight to the exit.
*
         orgnrm = slanst( 'M', n, d, e )
         IF( orgnrm.EQ.zero )
     $      GO TO 50
*
         eps = slamch( 'Epsilon' )
*
         start = 1
*
*        while ( START <= N )
*
   10    CONTINUE
         IF( start.LE.n ) THEN
*
*           Let FINISH be the position of the next subdiagonal entry
*           such that E( FINISH ) <= TINY or FINISH = N if no such
*           subdiagonal exists.  The matrix identified by the elements
*           between START and FINISH constitutes an independent
*           sub-problem.
*
*           TINY = EPS*sqrt(|D(FINISH)|)*sqrt(|D(FINISH+1)|) is
*           recomputed for every candidate position.
*
            finish = start
   20       CONTINUE
            IF( finish.LT.n ) THEN
               tiny = eps*sqrt( abs( d( finish ) ) )*
     $                    sqrt( abs( d( finish+1 ) ) )
               IF( abs( e( finish ) ).GT.tiny ) THEN
                  finish = finish + 1
                  GO TO 20
               END IF
            END IF
*
*           (Sub) Problem determined.  Compute its size and solve it.
*
            m = finish - start + 1
*           A 1-by-1 block needs no work: skip to the next block.
            IF( m.EQ.1 ) THEN
               start = finish + 1
               GO TO 10
            END IF
            IF( m.GT.smlsiz ) THEN
*
*              Scale.
*
*              Divide D and E of this block by its max-abs norm.
*
               orgnrm = slanst( 'M', m, d( start ), e( start ) )
               CALL slascl( 'G', 0, 0, orgnrm, one, m, 1, d( start ), m,
     $                      info )
               CALL slascl( 'G', 0, 0, orgnrm, one, m-1, 1, e( start ),
     $                      m-1, info )
*
*              COMPZ = 'V' passes all N rows of the column block of Z
*              (starting at row 1); COMPZ = 'I' passes the diagonal
*              block starting at row START.
*
               IF( icompz.EQ.1 ) THEN
                  strtrw = 1
               ELSE
                  strtrw = start
               END IF
*              WORK(1) is passed with leading dimension N and
*              WORK(STOREZ) as the real workspace.  NOTE(review):
*              argument roles presumably match DLAED0 (QSTORE/LDQS
*              and WORK) - confirm against the SLAED0 interface.
               CALL slaed0( icompz, n, m, d( start ), e( start ),
     $                      z( strtrw, start ), ldz, work( 1 ), n,
     $                      work( storez ), iwork, info )
               IF( info.NE.0 ) THEN
*                 Re-encode the block-relative failure code
*                 (quotient and remainder modulo M+1) as global
*                 indices: quotient and remainder modulo N+1, each
*                 shifted by START-1.
                  info = ( info / ( m+1 )+start-1 )*( n+1 ) +
     $                   mod( info, ( m+1 ) ) + start - 1
                  GO TO 50
               END IF
*
*              Scale back.
*
*              Only D is rescaled; E is not restored here.
*
               CALL slascl( 'G', 0, 0, one, orgnrm, m, 1, d( start ), m,
     $                      info )
*
            ELSE
               IF( icompz.EQ.1 ) THEN
*
*                 Since QR won't update a Z matrix which is larger than
*                 the length of D, we must solve the sub-problem in a
*                 workspace and then multiply back into Z.
*
*                 The M-by-M eigenvector matrix of the block is formed
*                 in WORK(1:M*M) (scratch from WORK(M*M+1)); the
*                 N-by-M column block of Z is copied to WORK(STOREZ)
*                 and Z(:,START:FINISH) is overwritten by the product
*                 copy * eigenvectors.
*
                  CALL ssteqr( 'I', m, d( start ), e( start ), work, m,
     $                         work( m*m+1 ), info )
                  CALL slacpy( 'A', n, m, z( 1, start ), ldz,
     $                         work( storez ), n )
                  CALL sgemm( 'N', 'N', n, m, m, one,
     $                        work( storez ), n, work, m, zero,
     $                        z( 1, start ), ldz )
               ELSE IF( icompz.EQ.2 ) THEN
*                 COMPZ = 'I': work directly in the diagonal block
*                 of Z.
                  CALL ssteqr( 'I', m, d( start ), e( start ),
     $                         z( start, start ), ldz, work, info )
               ELSE
*                 Not reached while the COMPZ = 'N' clause above
*                 jumps to label 50 first.
                  CALL ssterf( m, d( start ), e( start ), info )
               END IF
               IF( info.NE.0 ) THEN
*                 Encode the failing block as START*(N+1) + FINISH.
                  info = start*( n+1 ) + finish
                  GO TO 50
               END IF
            END IF
*
            start = finish + 1
            GO TO 10
         END IF
*
*        endwhile
*
*        The blocks were solved independently, so the eigenvalues in
*        D still have to be ordered across blocks.
*
         IF( icompz.EQ.0 ) THEN
*
*          Use Quick Sort
*
*          (Not reached while the COMPZ = 'N' clause above jumps to
*          label 50 first.)
*
           CALL slasrt( 'I', n, d, info )
*
         ELSE
*
*          Use Selection Sort to minimize swaps of eigenvectors
*
*          For each position I, find the smallest remaining
*          eigenvalue D(K) and, if K differs from I, swap the two
*          eigenvalues and columns I and K of Z.
*
           DO 40 ii = 2, n
              i = ii - 1
              k = i
              p = d( i )
              DO 30 j = ii, n
                 IF( d( j ).LT.p ) THEN
                    k = j
                    p = d( j )
                 END IF
   30         CONTINUE
              IF( k.NE.i ) THEN
                 d( k ) = d( i )
                 d( i ) = p
                 CALL sswap( n, z( 1, i ), 1, z( 1, k ), 1 )
              END IF
   40      CONTINUE
         END IF
      END IF
*
*     Common exit: report the minimum workspace sizes again, since
*     WORK(1) may have been overwritten while used as scratch.
*
   50 CONTINUE
      work( 1 ) = lwmin
      iwork( 1 ) = liwmin
*
      RETURN
*
*     End of SSTEDC
*

◆ ssteqr()

subroutine ssteqr	(	character	compz,
		integer	n,
		real, dimension( * )	d,
		real, dimension( * )	e,
		real, dimension( ldz, * )	z,
		integer	ldz,
		real, dimension( * )	work,
		integer	info )

SSTEQR

Download SSTEQR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SSTEQR computes all eigenvalues and, optionally, eigenvectors of a
!> symmetric tridiagonal matrix using the implicit QL or QR method.
!> The eigenvectors of a full or band symmetric matrix can also be found
!> if SSYTRD or SSPTRD or SSBTRD has been used to reduce this matrix to
!> tridiagonal form.
!>

Parameters

[in]	COMPZ	!> COMPZ is CHARACTER*1 !> = 'N': Compute eigenvalues only. !> = 'V': Compute eigenvalues and eigenvectors of the original !> symmetric matrix. On entry, Z must contain the !> orthogonal matrix used to reduce the original matrix !> to tridiagonal form. !> = 'I': Compute eigenvalues and eigenvectors of the !> tridiagonal matrix. Z is initialized to the identity !> matrix. !>
[in]	N	!> N is INTEGER !> The order of the matrix. N >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the diagonal elements of the tridiagonal matrix. !> On exit, if INFO = 0, the eigenvalues in ascending order. !>
[in,out]	E	!> E is REAL array, dimension (N-1) !> On entry, the (n-1) subdiagonal elements of the tridiagonal !> matrix. !> On exit, E has been destroyed. !>
[in,out]	Z	!> Z is REAL array, dimension (LDZ, N) !> On entry, if COMPZ = 'V', then Z contains the orthogonal !> matrix used in the reduction to tridiagonal form. !> On exit, if INFO = 0, then if COMPZ = 'V', Z contains the !> orthonormal eigenvectors of the original symmetric matrix, !> and if COMPZ = 'I', Z contains the orthonormal eigenvectors !> of the symmetric tridiagonal matrix. !> If COMPZ = 'N', then Z is not referenced. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. LDZ >= 1, and if !> eigenvectors are desired, then LDZ >= max(1,N). !>
[out]	WORK	!> WORK is REAL array, dimension (max(1,2*N-2)) !> If COMPZ = 'N', then WORK is not referenced. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: the algorithm has failed to find all the eigenvalues in !> a total of 30*N iterations; if INFO = i, then i !> elements of E have not converged to zero; on exit, D !> and E contain the elements of a symmetric tridiagonal !> matrix which is orthogonally similar to the original !> matrix. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 130 of file ssteqr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd.--
*
*  Body of SSTEQR.  Overview of the statements below:
*    1. Decode COMPZ into ICOMPZ (0 = 'N', 1 = 'V', 2 = 'I') and
*       check N and LDZ.
*    2. Repeatedly (label 10) locate the next unreduced block
*       L1..M of the tridiagonal matrix, scale it if its norm is
*       outside [SSFMIN, SSFMAX], and run implicit QL (labels 40-80)
*       or QR (labels 90-130) iterations on it.
*    3. When eigenvectors are wanted (ICOMPZ > 0) the plane
*       rotations of each sweep are saved in WORK - cosines in
*       WORK(I), sines in WORK(N-1+I) - and applied to Z by SLASR.
*    4. After all blocks are done (label 160) the eigenvalues are
*       sorted into ascending order.  If the total iteration count
*       reaches N*MAXIT, INFO returns the number of nonzero E(I)
*       and no sorting is done.
*
*     .. Scalar Arguments ..
      CHARACTER          COMPZ
      INTEGER            INFO, LDZ, N
*     ..
*     .. Array Arguments ..
      REAL               D( * ), E( * ), WORK( * ), Z( LDZ, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     MAXIT is the per-row iteration allowance; the total budget is
*     N*MAXIT (see NMAXIT below).
      REAL               ZERO, ONE, TWO, THREE
      parameter( zero = 0.0e0, one = 1.0e0, two = 2.0e0,
     $                   three = 3.0e0 )
      INTEGER            MAXIT
      parameter( maxit = 30 )
*     ..
*     .. Local Scalars ..
*     L/LEND are the current ends of the active block (LSV/LENDSV
*     keep the original ends for unscaling), L1 is the start of the
*     next block, JTOT counts iterations over all blocks.
      INTEGER            I, ICOMPZ, II, ISCALE, J, JTOT, K, L, L1, LEND,
     $                   LENDM1, LENDP1, LENDSV, LM1, LSV, M, MM, MM1,
     $                   NM1, NMAXIT
      REAL               ANORM, B, C, EPS, EPS2, F, G, P, R, RT1, RT2,
     $                   S, SAFMAX, SAFMIN, SSFMAX, SSFMIN, TST
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SLAMCH, SLANST, SLAPY2
      EXTERNAL           lsame, slamch, slanst, slapy2
*     ..
*     .. External Subroutines ..
      EXTERNAL           slae2, slaev2, slartg, slascl, slaset, slasr,
     $                   slasrt, sswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, sign, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
      IF( lsame( compz, 'N' ) ) THEN
         icompz = 0
      ELSE IF( lsame( compz, 'V' ) ) THEN
         icompz = 1
      ELSE IF( lsame( compz, 'I' ) ) THEN
         icompz = 2
      ELSE
         icompz = -1
      END IF
*     INFO = -1 flags COMPZ, -2 flags N, -6 flags LDZ.
      IF( icompz.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ( ldz.LT.1 ) .OR. ( icompz.GT.0 .AND. ldz.LT.max( 1,
     $         n ) ) ) THEN
         info = -6
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SSTEQR', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
      IF( n.EQ.1 ) THEN
*        Only COMPZ = 'I' initializes Z here; for COMPZ = 'V' the
*        caller-supplied Z(1,1) is left as is.
         IF( icompz.EQ.2 )
     $      z( 1, 1 ) = one
         RETURN
      END IF
*
*     Determine the unit roundoff and over/underflow thresholds.
*
*     SSFMAX / SSFMIN bound the block norm; blocks outside this
*     range are rescaled before iterating.
*
      eps = slamch( 'E' )
      eps2 = eps**2
      safmin = slamch( 'S' )
      safmax = one / safmin
      ssfmax = sqrt( safmax ) / three
      ssfmin = sqrt( safmin ) / eps2
*
*     Compute the eigenvalues and eigenvectors of the tridiagonal
*     matrix.
*
      IF( icompz.EQ.2 )
     $   CALL slaset( 'Full', n, n, zero, one, z, ldz )
*
      nmaxit = n*maxit
      jtot = 0
*
*     Determine where the matrix splits and choose QL or QR iteration
*     for each block, according to whether top or bottom diagonal
*     element is smaller.
*
      l1 = 1
      nm1 = n - 1
*
*     Top of the outer loop over unreduced blocks.  L1 > N means
*     every block has been processed.
*
   10 CONTINUE
      IF( l1.GT.n )
     $   GO TO 160
      IF( l1.GT.1 )
     $   e( l1-1 ) = zero
      IF( l1.LE.nm1 ) THEN
*        Find the first M >= L1 whose E(M) is zero or negligible
*        relative to sqrt(|D(M)|)*sqrt(|D(M+1)|)*EPS; negligible
*        entries are set to exactly zero.
         DO 20 m = l1, nm1
            tst = abs( e( m ) )
            IF( tst.EQ.zero )
     $         GO TO 30
            IF( tst.LE.( sqrt( abs( d( m ) ) )*sqrt( abs( d( m+
     $          1 ) ) ) )*eps ) THEN
               e( m ) = zero
               GO TO 30
            END IF
   20    CONTINUE
      END IF
      m = n
*
*     The block is rows L1..M.  A 1-by-1 block is already done.
*
   30 CONTINUE
      l = l1
      lsv = l
      lend = m
      lendsv = lend
      l1 = m + 1
      IF( lend.EQ.l )
     $   GO TO 10
*
*     Scale submatrix in rows and columns L to LEND
*
      anorm = slanst( 'M', lend-l+1, d( l ), e( l ) )
      iscale = 0
      IF( anorm.EQ.zero )
     $   GO TO 10
*     ISCALE records which threshold was used so the scaling can be
*     undone at label 140.
      IF( anorm.GT.ssfmax ) THEN
         iscale = 1
         CALL slascl( 'G', 0, 0, anorm, ssfmax, lend-l+1, 1, d( l ), n,
     $                info )
         CALL slascl( 'G', 0, 0, anorm, ssfmax, lend-l, 1, e( l ), n,
     $                info )
      ELSE IF( anorm.LT.ssfmin ) THEN
         iscale = 2
         CALL slascl( 'G', 0, 0, anorm, ssfmin, lend-l+1, 1, d( l ), n,
     $                info )
         CALL slascl( 'G', 0, 0, anorm, ssfmin, lend-l, 1, e( l ), n,
     $                info )
      END IF
*
*     Choose between QL and QR iteration
*
*     If the bottom diagonal entry is smaller in magnitude than the
*     top one, swap the roles of L and LEND; LEND > L then selects
*     QL, otherwise QR.
*
      IF( abs( d( lend ) ).LT.abs( d( l ) ) ) THEN
         lend = lsv
         l = lendsv
      END IF
*
      IF( lend.GT.l ) THEN
*
*        QL Iteration
*
*        Look for small subdiagonal element.
*
   40    CONTINUE
         IF( l.NE.lend ) THEN
            lendm1 = lend - 1
            DO 50 m = l, lendm1
               tst = abs( e( m ) )**2
               IF( tst.LE.( eps2*abs( d( m ) ) )*abs( d( m+1 ) )+
     $             safmin )GO TO 60
   50       CONTINUE
         END IF
*
         m = lend
*
*        Rows L..M form the current unreduced sub-block.  M = L
*        means D(L) has converged.
*
   60    CONTINUE
         IF( m.LT.lend )
     $      e( m ) = zero
         p = d( l )
         IF( m.EQ.l )
     $      GO TO 80
*
*        If remaining matrix is 2-by-2, use SLAE2 or SLAEV2
*        to compute its eigensystem.
*
         IF( m.EQ.l+1 ) THEN
            IF( icompz.GT.0 ) THEN
*              The single rotation (C,S) is stored in WORK and
*              applied to columns L and L+1 of Z.
               CALL slaev2( d( l ), e( l ), d( l+1 ), rt1, rt2, c, s )
               work( l ) = c
               work( n-1+l ) = s
               CALL slasr( 'R', 'V', 'B', n, 2, work( l ),
     $                     work( n-1+l ), z( 1, l ), ldz )
            ELSE
               CALL slae2( d( l ), e( l ), d( l+1 ), rt1, rt2 )
            END IF
            d( l ) = rt1
            d( l+1 ) = rt2
            e( l ) = zero
            l = l + 2
            IF( l.LE.lend )
     $         GO TO 40
            GO TO 140
         END IF
*
*        Stop iterating once the global budget is exhausted.
*
         IF( jtot.EQ.nmaxit )
     $      GO TO 140
         jtot = jtot + 1
*
*        Form shift.
*
         g = ( d( l+1 )-p ) / ( two*e( l ) )
         r = slapy2( g, one )
         g = d( m ) - p + ( e( l ) / ( g+sign( r, g ) ) )
*
         s = one
         c = one
         p = zero
*
*        Inner loop
*
*        One sweep of rotations, running from row M-1 up to row L.
*
         mm1 = m - 1
         DO 70 i = mm1, l, -1
            f = s*e( i )
            b = c*e( i )
            CALL slartg( g, f, c, s, r )
            IF( i.NE.m-1 )
     $         e( i+1 ) = r
            g = d( i+1 ) - p
            r = ( d( i )-g )*s + two*c*b
            p = s*r
            d( i+1 ) = g + p
            g = c*r - b
*
*           If eigenvectors are desired, then save rotations.
*
*           Note the sign: the QL sweep stores -S.
*
            IF( icompz.GT.0 ) THEN
               work( i ) = c
               work( n-1+i ) = -s
            END IF
*
   70    CONTINUE
*
*        If eigenvectors are desired, then apply saved rotations.
*
         IF( icompz.GT.0 ) THEN
            mm = m - l + 1
            CALL slasr( 'R', 'V', 'B', n, mm, work( l ), work( n-1+l ),
     $                  z( 1, l ), ldz )
         END IF
*
         d( l ) = d( l ) - p
         e( l ) = g
         GO TO 40
*
*        Eigenvalue found.
*
   80    CONTINUE
         d( l ) = p
*
         l = l + 1
         IF( l.LE.lend )
     $      GO TO 40
         GO TO 140
*
      ELSE
*
*        QR Iteration
*
*        Look for small superdiagonal element.
*
*        Mirror image of the QL branch: L starts at the bottom of
*        the block and decreases towards LEND.
*
   90    CONTINUE
         IF( l.NE.lend ) THEN
            lendp1 = lend + 1
            DO 100 m = l, lendp1, -1
               tst = abs( e( m-1 ) )**2
               IF( tst.LE.( eps2*abs( d( m ) ) )*abs( d( m-1 ) )+
     $             safmin )GO TO 110
  100       CONTINUE
         END IF
*
         m = lend
*
*        Rows M..L form the current unreduced sub-block.  M = L
*        means D(L) has converged.
*
  110    CONTINUE
         IF( m.GT.lend )
     $      e( m-1 ) = zero
         p = d( l )
         IF( m.EQ.l )
     $      GO TO 130
*
*        If remaining matrix is 2-by-2, use SLAE2 or SLAEV2
*        to compute its eigensystem.
*
         IF( m.EQ.l-1 ) THEN
            IF( icompz.GT.0 ) THEN
*              The single rotation (C,S) is stored in WORK and
*              applied to columns L-1 and L of Z.
               CALL slaev2( d( l-1 ), e( l-1 ), d( l ), rt1, rt2, c, s )
               work( m ) = c
               work( n-1+m ) = s
               CALL slasr( 'R', 'V', 'F', n, 2, work( m ),
     $                     work( n-1+m ), z( 1, l-1 ), ldz )
            ELSE
               CALL slae2( d( l-1 ), e( l-1 ), d( l ), rt1, rt2 )
            END IF
            d( l-1 ) = rt1
            d( l ) = rt2
            e( l-1 ) = zero
            l = l - 2
            IF( l.GE.lend )
     $         GO TO 90
            GO TO 140
         END IF
*
*        Stop iterating once the global budget is exhausted.
*
         IF( jtot.EQ.nmaxit )
     $      GO TO 140
         jtot = jtot + 1
*
*        Form shift.
*
         g = ( d( l-1 )-p ) / ( two*e( l-1 ) )
         r = slapy2( g, one )
         g = d( m ) - p + ( e( l-1 ) / ( g+sign( r, g ) ) )
*
         s = one
         c = one
         p = zero
*
*        Inner loop
*
*        One sweep of rotations, running from row M down to row L-1.
*
         lm1 = l - 1
         DO 120 i = m, lm1
            f = s*e( i )
            b = c*e( i )
            CALL slartg( g, f, c, s, r )
            IF( i.NE.m )
     $         e( i-1 ) = r
            g = d( i ) - p
            r = ( d( i+1 )-g )*s + two*c*b
            p = s*r
            d( i ) = g + p
            g = c*r - b
*
*           If eigenvectors are desired, then save rotations.
*
*           Unlike the QL sweep, S is stored without a sign change.
*
            IF( icompz.GT.0 ) THEN
               work( i ) = c
               work( n-1+i ) = s
            END IF
*
  120    CONTINUE
*
*        If eigenvectors are desired, then apply saved rotations.
*
         IF( icompz.GT.0 ) THEN
            mm = l - m + 1
            CALL slasr( 'R', 'V', 'F', n, mm, work( m ), work( n-1+m ),
     $                  z( 1, m ), ldz )
         END IF
*
         d( l ) = d( l ) - p
         e( lm1 ) = g
         GO TO 90
*
*        Eigenvalue found.
*
  130    CONTINUE
         d( l ) = p
*
         l = l - 1
         IF( l.GE.lend )
     $      GO TO 90
         GO TO 140
*
      END IF
*
*     Undo scaling if necessary
*
*     Both D and E of the original block LSV..LENDSV are rescaled.
*
  140 CONTINUE
      IF( iscale.EQ.1 ) THEN
         CALL slascl( 'G', 0, 0, ssfmax, anorm, lendsv-lsv+1, 1,
     $                d( lsv ), n, info )
         CALL slascl( 'G', 0, 0, ssfmax, anorm, lendsv-lsv, 1, e( lsv ),
     $                n, info )
      ELSE IF( iscale.EQ.2 ) THEN
         CALL slascl( 'G', 0, 0, ssfmin, anorm, lendsv-lsv+1, 1,
     $                d( lsv ), n, info )
         CALL slascl( 'G', 0, 0, ssfmin, anorm, lendsv-lsv, 1, e( lsv ),
     $                n, info )
      END IF
*
*     Check for no convergence to an eigenvalue after a total
*     of N*MAXIT iterations.
*
*     With budget left, continue with the next block.  Otherwise
*     count the off-diagonal entries that are still nonzero into
*     INFO and return without sorting.
*
      IF( jtot.LT.nmaxit )
     $   GO TO 10
      DO 150 i = 1, n - 1
         IF( e( i ).NE.zero )
     $      info = info + 1
  150 CONTINUE
      GO TO 190
*
*     Order eigenvalues and eigenvectors.
*
  160 CONTINUE
      IF( icompz.EQ.0 ) THEN
*
*        Use Quick Sort
*
         CALL slasrt( 'I', n, d, info )
*
      ELSE
*
*        Use Selection Sort to minimize swaps of eigenvectors
*
*        For each position I, find the smallest remaining
*        eigenvalue D(K) and, if K differs from I, swap the two
*        eigenvalues and columns I and K of Z.
*
         DO 180 ii = 2, n
            i = ii - 1
            k = i
            p = d( i )
            DO 170 j = ii, n
               IF( d( j ).LT.p ) THEN
                  k = j
                  p = d( j )
               END IF
  170       CONTINUE
            IF( k.NE.i ) THEN
               d( k ) = d( i )
               d( i ) = p
               CALL sswap( n, z( 1, i ), 1, z( 1, k ), 1 )
            END IF
  180    CONTINUE
      END IF
*
  190 CONTINUE
      RETURN
*
*     End of SSTEQR
*

◆ ssterf()

subroutine ssterf	(	integer	n,
		real, dimension( * )	d,
		real, dimension( * )	e,
		integer	info )

SSTERF

Download SSTERF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SSTERF computes all eigenvalues of a symmetric tridiagonal matrix
!> using the Pal-Walker-Kahan variant of the QL or QR algorithm.
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the matrix. N >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the n diagonal elements of the tridiagonal matrix. !> On exit, if INFO = 0, the eigenvalues in ascending order. !>
[in,out]	E	!> E is REAL array, dimension (N-1) !> On entry, the (n-1) subdiagonal elements of the tridiagonal !> matrix. !> On exit, E has been destroyed. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: the algorithm failed to find all of the eigenvalues in !> a total of 30*N iterations; if INFO = i, then i !> elements of E have not converged to zero. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 85 of file ssterf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd.--
*
*  Body of SSTERF (eigenvalues only).  Overview of the statements
*  below:
*    1. Check N; return at once for N <= 1.
*    2. Repeatedly (label 10) locate the next unreduced block
*       L1..M, scale it if its norm is outside [SSFMIN, SSFMAX],
*       and replace its off-diagonal entries E(I) by their squares.
*    3. Run QL (labels 50-90) or QR (labels 100-140) iterations on
*       the block, working with the squared off-diagonals; square
*       roots are taken only to form the shift and for the 2-by-2
*       case.
*    4. After all blocks are done (label 170) the eigenvalues are
*       sorted into ascending order by SLASRT.  If the total
*       iteration count reaches N*MAXIT, INFO returns the number of
*       nonzero E(I) and no sorting is done.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      REAL               D( * ), E( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     MAXIT is the per-row iteration allowance; the total budget is
*     N*MAXIT (see NMAXIT below).
      REAL               ZERO, ONE, TWO, THREE
      parameter( zero = 0.0e0, one = 1.0e0, two = 2.0e0,
     $                   three = 3.0e0 )
      INTEGER            MAXIT
      parameter( maxit = 30 )
*     ..
*     .. Local Scalars ..
*     L/LEND are the current ends of the active block (LSV/LENDSV
*     keep the original ends for unscaling), L1 is the start of the
*     next block, JTOT counts iterations over all blocks.
      INTEGER            I, ISCALE, JTOT, L, L1, LEND, LENDSV, LSV, M,
     $                   NMAXIT
      REAL               ALPHA, ANORM, BB, C, EPS, EPS2, GAMMA, OLDC,
     $                   OLDGAM, P, R, RT1, RT2, RTE, S, SAFMAX, SAFMIN,
     $                   SIGMA, SSFMAX, SSFMIN
*     ..
*     .. External Functions ..
      REAL               SLAMCH, SLANST, SLAPY2
      EXTERNAL           slamch, slanst, slapy2
*     ..
*     .. External Subroutines ..
      EXTERNAL           slae2, slascl, slasrt, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, sign, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
*     Reject negative N (INFO = -1), then quick return if possible
*
      IF( n.LT.0 ) THEN
         info = -1
         CALL xerbla( 'SSTERF', -info )
         RETURN
      END IF
      IF( n.LE.1 )
     $   RETURN
*
*     Determine the unit roundoff for this environment.
*
*     SSFMAX / SSFMIN bound the block norm; blocks outside this
*     range are rescaled before iterating.
*
      eps = slamch( 'E' )
      eps2 = eps**2
      safmin = slamch( 'S' )
      safmax = one / safmin
      ssfmax = sqrt( safmax ) / three
      ssfmin = sqrt( safmin ) / eps2
*
*     Compute the eigenvalues of the tridiagonal matrix.
*
      nmaxit = n*maxit
      sigma = zero
      jtot = 0
*
*     Determine where the matrix splits and choose QL or QR iteration
*     for each block, according to whether top or bottom diagonal
*     element is smaller.
*
      l1 = 1
*
*     Top of the outer loop over unreduced blocks.  L1 > N means
*     every block has been processed.
*
   10 CONTINUE
      IF( l1.GT.n )
     $   GO TO 170
      IF( l1.GT.1 )
     $   e( l1-1 ) = zero
*     Find the first M >= L1 whose E(M) is negligible relative to
*     sqrt(|D(M)|)*sqrt(|D(M+1)|)*EPS and set it to exactly zero.
      DO 20 m = l1, n - 1
         IF( abs( e( m ) ).LE.( sqrt( abs( d( m ) ) )*
     $       sqrt( abs( d( m+1 ) ) ) )*eps ) THEN
            e( m ) = zero
            GO TO 30
         END IF
   20 CONTINUE
      m = n
*
*     The block is rows L1..M.  A 1-by-1 block is already done.
*
   30 CONTINUE
      l = l1
      lsv = l
      lend = m
      lendsv = lend
      l1 = m + 1
      IF( lend.EQ.l )
     $   GO TO 10
*
*     Scale submatrix in rows and columns L to LEND
*
      anorm = slanst( 'M', lend-l+1, d( l ), e( l ) )
      iscale = 0
      IF( anorm.EQ.zero )
     $   GO TO 10
*     ISCALE records which threshold was used so the scaling can be
*     undone at label 150.
      IF( anorm.GT.ssfmax ) THEN
         iscale = 1
         CALL slascl( 'G', 0, 0, anorm, ssfmax, lend-l+1, 1, d( l ), n,
     $                info )
         CALL slascl( 'G', 0, 0, anorm, ssfmax, lend-l, 1, e( l ), n,
     $                info )
      ELSE IF( anorm.LT.ssfmin ) THEN
         iscale = 2
         CALL slascl( 'G', 0, 0, anorm, ssfmin, lend-l+1, 1, d( l ), n,
     $                info )
         CALL slascl( 'G', 0, 0, anorm, ssfmin, lend-l, 1, e( l ), n,
     $                info )
      END IF
*
*     From here on E(I) holds the SQUARE of the off-diagonal entry
*     for every I in the block.
*
      DO 40 i = l, lend - 1
         e( i ) = e( i )**2
   40 CONTINUE
*
*     Choose between QL and QR iteration
*
*     If the bottom diagonal entry is smaller in magnitude than the
*     top one, swap the roles of L and LEND; LEND >= L then selects
*     QL, otherwise QR.
*
      IF( abs( d( lend ) ).LT.abs( d( l ) ) ) THEN
         lend = lsv
         l = lendsv
      END IF
*
      IF( lend.GE.l ) THEN
*
*        QL Iteration
*
*        Look for small subdiagonal element.
*
*        E is squared, so the test compares against
*        EPS2*|D(M)*D(M+1)|.
*
   50    CONTINUE
         IF( l.NE.lend ) THEN
            DO 60 m = l, lend - 1
               IF( abs( e( m ) ).LE.eps2*abs( d( m )*d( m+1 ) ) )
     $            GO TO 70
   60       CONTINUE
         END IF
         m = lend
*
*        Rows L..M form the current unreduced sub-block.  M = L
*        means D(L) has converged.
*
   70    CONTINUE
         IF( m.LT.lend )
     $      e( m ) = zero
         p = d( l )
         IF( m.EQ.l )
     $      GO TO 90
*
*        If remaining matrix is 2 by 2, use SLAE2 to compute its
*        eigenvalues.
*
         IF( m.EQ.l+1 ) THEN
*           RTE recovers the off-diagonal magnitude from its square.
            rte = sqrt( e( l ) )
            CALL slae2( d( l ), rte, d( l+1 ), rt1, rt2 )
            d( l ) = rt1
            d( l+1 ) = rt2
            e( l ) = zero
            l = l + 2
            IF( l.LE.lend )
     $         GO TO 50
            GO TO 150
         END IF
*
*        Stop iterating once the global budget is exhausted.
*
         IF( jtot.EQ.nmaxit )
     $      GO TO 150
         jtot = jtot + 1
*
*        Form shift.
*
         rte = sqrt( e( l ) )
         sigma = ( d( l+1 )-p ) / ( two*rte )
         r = slapy2( sigma, one )
         sigma = p - ( rte / ( sigma+sign( r, sigma ) ) )
*
         c = one
         s = zero
         gamma = d( m ) - sigma
         p = gamma*gamma
*
*        Inner loop
*
*        One sweep from row M-1 up to row L.  C and S are formed as
*        the ratios P/R and BB/R of squared quantities; when C is
*        exactly zero, P is formed from OLDC*BB to avoid dividing
*        by C.
*
         DO 80 i = m - 1, l, -1
            bb = e( i )
            r = p + bb
            IF( i.NE.m-1 )
     $         e( i+1 ) = s*r
            oldc = c
            c = p / r
            s = bb / r
            oldgam = gamma
            alpha = d( i )
            gamma = c*( alpha-sigma ) - s*oldgam
            d( i+1 ) = oldgam + ( alpha-gamma )
            IF( c.NE.zero ) THEN
               p = ( gamma*gamma ) / c
            ELSE
               p = oldc*bb
            END IF
   80    CONTINUE
*
         e( l ) = s*p
         d( l ) = sigma + gamma
         GO TO 50
*
*        Eigenvalue found.
*
   90    CONTINUE
         d( l ) = p
*
         l = l + 1
         IF( l.LE.lend )
     $      GO TO 50
         GO TO 150
*
      ELSE
*
*        QR Iteration
*
*        Look for small superdiagonal element.
*
*        Mirror image of the QL branch: L starts at the bottom of
*        the block and decreases towards LEND.
*
  100    CONTINUE
         DO 110 m = l, lend + 1, -1
            IF( abs( e( m-1 ) ).LE.eps2*abs( d( m )*d( m-1 ) ) )
     $         GO TO 120
  110    CONTINUE
         m = lend
*
*        Rows M..L form the current unreduced sub-block.  M = L
*        means D(L) has converged.
*
  120    CONTINUE
         IF( m.GT.lend )
     $      e( m-1 ) = zero
         p = d( l )
         IF( m.EQ.l )
     $      GO TO 140
*
*        If remaining matrix is 2 by 2, use SLAE2 to compute its
*        eigenvalues.
*
         IF( m.EQ.l-1 ) THEN
*           RTE recovers the off-diagonal magnitude from its square.
            rte = sqrt( e( l-1 ) )
            CALL slae2( d( l ), rte, d( l-1 ), rt1, rt2 )
            d( l ) = rt1
            d( l-1 ) = rt2
            e( l-1 ) = zero
            l = l - 2
            IF( l.GE.lend )
     $         GO TO 100
            GO TO 150
         END IF
*
*        Stop iterating once the global budget is exhausted.
*
         IF( jtot.EQ.nmaxit )
     $      GO TO 150
         jtot = jtot + 1
*
*        Form shift.
*
         rte = sqrt( e( l-1 ) )
         sigma = ( d( l-1 )-p ) / ( two*rte )
         r = slapy2( sigma, one )
         sigma = p - ( rte / ( sigma+sign( r, sigma ) ) )
*
         c = one
         s = zero
         gamma = d( m ) - sigma
         p = gamma*gamma
*
*        Inner loop
*
*        One sweep from row M down to row L-1; same recurrences as
*        the QL sweep with the index direction reversed.
*
         DO 130 i = m, l - 1
            bb = e( i )
            r = p + bb
            IF( i.NE.m )
     $         e( i-1 ) = s*r
            oldc = c
            c = p / r
            s = bb / r
            oldgam = gamma
            alpha = d( i+1 )
            gamma = c*( alpha-sigma ) - s*oldgam
            d( i ) = oldgam + ( alpha-gamma )
            IF( c.NE.zero ) THEN
               p = ( gamma*gamma ) / c
            ELSE
               p = oldc*bb
            END IF
  130    CONTINUE
*
         e( l-1 ) = s*p
         d( l ) = sigma + gamma
         GO TO 100
*
*        Eigenvalue found.
*
  140    CONTINUE
         d( l ) = p
*
         l = l - 1
         IF( l.GE.lend )
     $      GO TO 100
         GO TO 150
*
      END IF
*
*     Undo scaling if necessary
*
*     Only D of the original block LSV..LENDSV is rescaled; E is
*     left as is.
*
  150 CONTINUE
      IF( iscale.EQ.1 )
     $   CALL slascl( 'G', 0, 0, ssfmax, anorm, lendsv-lsv+1, 1,
     $                d( lsv ), n, info )
      IF( iscale.EQ.2 )
     $   CALL slascl( 'G', 0, 0, ssfmin, anorm, lendsv-lsv+1, 1,
     $                d( lsv ), n, info )
*
*     Check for no convergence to an eigenvalue after a total
*     of N*MAXIT iterations.
*
*     With budget left, continue with the next block.  Otherwise
*     count the off-diagonal entries that are still nonzero into
*     INFO and return without sorting.
*
      IF( jtot.LT.nmaxit )
     $   GO TO 10
      DO 160 i = 1, n - 1
         IF( e( i ).NE.zero )
     $      info = info + 1
  160 CONTINUE
      GO TO 180
*
*     Sort eigenvalues in increasing order.
*
  170 CONTINUE
      CALL slasrt( 'I', n, d, info )
*
  180 CONTINUE
      RETURN
*
*     End of SSTERF
*

OpenRadioss 2025.1.11 OpenRadioss project