Functions
subroutine	cbbcsd (jobu1, jobu2, jobv1t, jobv2t, trans, m, p, q, theta, phi, u1, ldu1, u2, ldu2, v1t, ldv1t, v2t, ldv2t, b11d, b11e, b12d, b12e, b21d, b21e, b22d, b22e, rwork, lrwork, info)
	CBBCSD
subroutine	cbdsqr (uplo, n, ncvt, nru, ncc, d, e, vt, ldvt, u, ldu, c, ldc, rwork, info)
	CBDSQR
subroutine	cgghd3 (compq, compz, n, ilo, ihi, a, lda, b, ldb, q, ldq, z, ldz, work, lwork, info)
	CGGHD3
subroutine	cgghrd (compq, compz, n, ilo, ihi, a, lda, b, ldb, q, ldq, z, ldz, info)
	CGGHRD
subroutine	cggqrf (n, m, p, a, lda, taua, b, ldb, taub, work, lwork, info)
	CGGQRF
subroutine	cggrqf (m, p, n, a, lda, taua, b, ldb, taub, work, lwork, info)
	CGGRQF
subroutine	cggsvp3 (jobu, jobv, jobq, m, p, n, a, lda, b, ldb, tola, tolb, k, l, u, ldu, v, ldv, q, ldq, iwork, rwork, tau, work, lwork, info)
	CGGSVP3
subroutine	cgsvj0 (jobv, m, n, a, lda, d, sva, mv, v, ldv, eps, sfmin, tol, nsweep, work, lwork, info)
	CGSVJ0 pre-processor for the routine cgesvj.
subroutine	cgsvj1 (jobv, m, n, n1, a, lda, d, sva, mv, v, ldv, eps, sfmin, tol, nsweep, work, lwork, info)
	CGSVJ1 pre-processor for the routine cgesvj, applies Jacobi rotations targeting only particular pivots.
subroutine	chbgst (vect, uplo, n, ka, kb, ab, ldab, bb, ldbb, x, ldx, work, rwork, info)
	CHBGST
subroutine	chbtrd (vect, uplo, n, kd, ab, ldab, d, e, q, ldq, work, info)
	CHBTRD
subroutine	chetrd_hb2st (stage1, vect, uplo, n, kd, ab, ldab, d, e, hous, lhous, work, lwork, info)
	CHETRD_HB2ST reduces a complex Hermitian band matrix A to real symmetric tridiagonal form T
subroutine	chfrk (transr, uplo, trans, n, k, alpha, a, lda, beta, c)
	CHFRK performs a Hermitian rank-k operation for matrix in RFP format.
subroutine	chpcon (uplo, n, ap, ipiv, anorm, rcond, work, info)
	CHPCON
subroutine	chpgst (itype, uplo, n, ap, bp, info)
	CHPGST
subroutine	chprfs (uplo, n, nrhs, ap, afp, ipiv, b, ldb, x, ldx, ferr, berr, work, rwork, info)
	CHPRFS
subroutine	chptrd (uplo, n, ap, d, e, tau, info)
	CHPTRD
subroutine	chptrf (uplo, n, ap, ipiv, info)
	CHPTRF
subroutine	chptri (uplo, n, ap, ipiv, work, info)
	CHPTRI
subroutine	chptrs (uplo, n, nrhs, ap, ipiv, b, ldb, info)
	CHPTRS
subroutine	chsein (side, eigsrc, initv, select, n, h, ldh, w, vl, ldvl, vr, ldvr, mm, m, work, rwork, ifaill, ifailr, info)
	CHSEIN
subroutine	chseqr (job, compz, n, ilo, ihi, h, ldh, w, z, ldz, work, lwork, info)
	CHSEQR
subroutine	cla_lin_berr (n, nz, nrhs, res, ayb, berr)
	CLA_LIN_BERR computes a component-wise relative backward error.
subroutine	cla_wwaddw (n, x, y, w)
	CLA_WWADDW adds a vector into a doubled-single vector.
subroutine	claed0 (qsiz, n, d, e, q, ldq, qstore, ldqs, rwork, iwork, info)
	CLAED0 used by CSTEDC. Computes all eigenvalues and corresponding eigenvectors of an unreduced symmetric tridiagonal matrix using the divide and conquer method.
subroutine	claed7 (n, cutpnt, qsiz, tlvls, curlvl, curpbm, d, q, ldq, rho, indxq, qstore, qptr, prmptr, perm, givptr, givcol, givnum, work, rwork, iwork, info)
	CLAED7 used by CSTEDC. Computes the updated eigensystem of a diagonal matrix after modification by a rank-one symmetric matrix. Used when the original matrix is dense.
subroutine	claed8 (k, n, qsiz, q, ldq, d, rho, cutpnt, z, dlamda, q2, ldq2, w, indxp, indx, indxq, perm, givptr, givcol, givnum, info)
	CLAED8 used by CSTEDC. Merges eigenvalues and deflates secular equation. Used when the original matrix is dense.
subroutine	clals0 (icompq, nl, nr, sqre, nrhs, b, ldb, bx, ldbx, perm, givptr, givcol, ldgcol, givnum, ldgnum, poles, difl, difr, z, k, c, s, rwork, info)
	CLALS0 applies back multiplying factors in solving the least squares problem using divide and conquer SVD approach. Used by cgelsd.
subroutine	clalsa (icompq, smlsiz, n, nrhs, b, ldb, bx, ldbx, u, ldu, vt, k, difl, difr, z, poles, givptr, givcol, ldgcol, perm, givnum, c, s, rwork, iwork, info)
	CLALSA computes the SVD of the coefficient matrix in compact form. Used by cgelsd.
subroutine	clalsd (uplo, smlsiz, n, nrhs, d, e, b, ldb, rcond, rank, work, rwork, iwork, info)
	CLALSD uses the singular value decomposition of A to solve the least squares problem.
real function	clanhf (norm, transr, uplo, n, a, work)
	CLANHF returns the value of the 1-norm, or the Frobenius norm, or the infinity norm, or the element of largest absolute value of a Hermitian matrix in RFP format.
subroutine	clarscl2 (m, n, d, x, ldx)
	CLARSCL2 performs reciprocal diagonal scaling on a vector.
subroutine	clarz (side, m, n, l, v, incv, tau, c, ldc, work)
	CLARZ applies an elementary reflector (as returned by ctzrzf) to a general matrix.
subroutine	clarzb (side, trans, direct, storev, m, n, k, l, v, ldv, t, ldt, c, ldc, work, ldwork)
	CLARZB applies a block reflector or its conjugate-transpose to a general matrix.
subroutine	clarzt (direct, storev, n, k, v, ldv, tau, t, ldt)
	CLARZT forms the triangular factor T of a block reflector H = I - V*T*V**H.
subroutine	clascl2 (m, n, d, x, ldx)
	CLASCL2 performs diagonal scaling on a vector.
subroutine	clatrz (m, n, l, a, lda, tau, work)
	CLATRZ factors an upper trapezoidal matrix by means of unitary transformations.
subroutine	cpbcon (uplo, n, kd, ab, ldab, anorm, rcond, work, rwork, info)
	CPBCON
subroutine	cpbequ (uplo, n, kd, ab, ldab, s, scond, amax, info)
	CPBEQU
subroutine	cpbrfs (uplo, n, kd, nrhs, ab, ldab, afb, ldafb, b, ldb, x, ldx, ferr, berr, work, rwork, info)
	CPBRFS
subroutine	cpbstf (uplo, n, kd, ab, ldab, info)
	CPBSTF
subroutine	cpbtf2 (uplo, n, kd, ab, ldab, info)
	CPBTF2 computes the Cholesky factorization of a symmetric/Hermitian positive definite band matrix (unblocked algorithm).
subroutine	cpbtrf (uplo, n, kd, ab, ldab, info)
	CPBTRF
subroutine	cpbtrs (uplo, n, kd, nrhs, ab, ldab, b, ldb, info)
	CPBTRS
subroutine	cpftrf (transr, uplo, n, a, info)
	CPFTRF
subroutine	cpftri (transr, uplo, n, a, info)
	CPFTRI
subroutine	cpftrs (transr, uplo, n, nrhs, a, b, ldb, info)
	CPFTRS
subroutine	cppcon (uplo, n, ap, anorm, rcond, work, rwork, info)
	CPPCON
subroutine	cppequ (uplo, n, ap, s, scond, amax, info)
	CPPEQU
subroutine	cpprfs (uplo, n, nrhs, ap, afp, b, ldb, x, ldx, ferr, berr, work, rwork, info)
	CPPRFS
subroutine	cpptrf (uplo, n, ap, info)
	CPPTRF
subroutine	cpptri (uplo, n, ap, info)
	CPPTRI
subroutine	cpptrs (uplo, n, nrhs, ap, b, ldb, info)
	CPPTRS
subroutine	cpstf2 (uplo, n, a, lda, piv, rank, tol, work, info)
	CPSTF2 computes the Cholesky factorization with complete pivoting of a complex Hermitian positive semidefinite matrix.
subroutine	cpstrf (uplo, n, a, lda, piv, rank, tol, work, info)
	CPSTRF computes the Cholesky factorization with complete pivoting of a complex Hermitian positive semidefinite matrix.
subroutine	cspcon (uplo, n, ap, ipiv, anorm, rcond, work, info)
	CSPCON
subroutine	csprfs (uplo, n, nrhs, ap, afp, ipiv, b, ldb, x, ldx, ferr, berr, work, rwork, info)
	CSPRFS
subroutine	csptrf (uplo, n, ap, ipiv, info)
	CSPTRF
subroutine	csptri (uplo, n, ap, ipiv, work, info)
	CSPTRI
subroutine	csptrs (uplo, n, nrhs, ap, ipiv, b, ldb, info)
	CSPTRS
subroutine	cstedc (compz, n, d, e, z, ldz, work, lwork, rwork, lrwork, iwork, liwork, info)
	CSTEDC
subroutine	cstegr (jobz, range, n, d, e, vl, vu, il, iu, abstol, m, w, z, ldz, isuppz, work, lwork, iwork, liwork, info)
	CSTEGR
subroutine	cstein (n, d, e, m, w, iblock, isplit, z, ldz, work, iwork, ifail, info)
	CSTEIN
subroutine	cstemr (jobz, range, n, d, e, vl, vu, il, iu, m, w, z, ldz, nzc, isuppz, tryrac, work, lwork, iwork, liwork, info)
	CSTEMR
subroutine	csteqr (compz, n, d, e, z, ldz, work, info)
	CSTEQR
subroutine	ctbcon (norm, uplo, diag, n, kd, ab, ldab, rcond, work, rwork, info)
	CTBCON
subroutine	ctbrfs (uplo, trans, diag, n, kd, nrhs, ab, ldab, b, ldb, x, ldx, ferr, berr, work, rwork, info)
	CTBRFS
subroutine	ctbtrs (uplo, trans, diag, n, kd, nrhs, ab, ldab, b, ldb, info)
	CTBTRS
subroutine	ctfsm (transr, side, uplo, trans, diag, m, n, alpha, a, b, ldb)
	CTFSM solves a matrix equation (one operand is a triangular matrix in RFP format).
subroutine	ctftri (transr, uplo, diag, n, a, info)
	CTFTRI
subroutine	ctfttp (transr, uplo, n, arf, ap, info)
	CTFTTP copies a triangular matrix from the rectangular full packed format (TF) to the standard packed format (TP).
subroutine	ctfttr (transr, uplo, n, arf, a, lda, info)
	CTFTTR copies a triangular matrix from the rectangular full packed format (TF) to the standard full format (TR).
subroutine	ctgsen (ijob, wantq, wantz, select, n, a, lda, b, ldb, alpha, beta, q, ldq, z, ldz, m, pl, pr, dif, work, lwork, iwork, liwork, info)
	CTGSEN
subroutine	ctgsja (jobu, jobv, jobq, m, p, n, k, l, a, lda, b, ldb, tola, tolb, alpha, beta, u, ldu, v, ldv, q, ldq, work, ncycle, info)
	CTGSJA
subroutine	ctgsna (job, howmny, select, n, a, lda, b, ldb, vl, ldvl, vr, ldvr, s, dif, mm, m, work, lwork, iwork, info)
	CTGSNA
subroutine	ctpcon (norm, uplo, diag, n, ap, rcond, work, rwork, info)
	CTPCON
subroutine	ctpmqrt (side, trans, m, n, k, l, nb, v, ldv, t, ldt, a, lda, b, ldb, work, info)
	CTPMQRT
subroutine	ctpqrt (m, n, l, nb, a, lda, b, ldb, t, ldt, work, info)
	CTPQRT
subroutine	ctpqrt2 (m, n, l, a, lda, b, ldb, t, ldt, info)
	CTPQRT2 computes a QR factorization of a real or complex "triangular-pentagonal" matrix, which is composed of a triangular block and a pentagonal block, using the compact WY representation for Q.
subroutine	ctprfs (uplo, trans, diag, n, nrhs, ap, b, ldb, x, ldx, ferr, berr, work, rwork, info)
	CTPRFS
subroutine	ctptri (uplo, diag, n, ap, info)
	CTPTRI
subroutine	ctptrs (uplo, trans, diag, n, nrhs, ap, b, ldb, info)
	CTPTRS
subroutine	ctpttf (transr, uplo, n, ap, arf, info)
	CTPTTF copies a triangular matrix from the standard packed format (TP) to the rectangular full packed format (TF).
subroutine	ctpttr (uplo, n, ap, a, lda, info)
	CTPTTR copies a triangular matrix from the standard packed format (TP) to the standard full format (TR).
subroutine	ctrcon (norm, uplo, diag, n, a, lda, rcond, work, rwork, info)
	CTRCON
subroutine	ctrevc (side, howmny, select, n, t, ldt, vl, ldvl, vr, ldvr, mm, m, work, rwork, info)
	CTREVC
subroutine	ctrevc3 (side, howmny, select, n, t, ldt, vl, ldvl, vr, ldvr, mm, m, work, lwork, rwork, lrwork, info)
	CTREVC3
subroutine	ctrexc (compq, n, t, ldt, q, ldq, ifst, ilst, info)
	CTREXC
subroutine	ctrrfs (uplo, trans, diag, n, nrhs, a, lda, b, ldb, x, ldx, ferr, berr, work, rwork, info)
	CTRRFS
subroutine	ctrsen (job, compq, select, n, t, ldt, q, ldq, w, m, s, sep, work, lwork, info)
	CTRSEN
subroutine	ctrsna (job, howmny, select, n, t, ldt, vl, ldvl, vr, ldvr, s, sep, mm, m, work, ldwork, rwork, info)
	CTRSNA
subroutine	ctrti2 (uplo, diag, n, a, lda, info)
	CTRTI2 computes the inverse of a triangular matrix (unblocked algorithm).
subroutine	ctrtri (uplo, diag, n, a, lda, info)
	CTRTRI
subroutine	ctrtrs (uplo, trans, diag, n, nrhs, a, lda, b, ldb, info)
	CTRTRS
subroutine	ctrttf (transr, uplo, n, a, lda, arf, info)
	CTRTTF copies a triangular matrix from the standard full format (TR) to the rectangular full packed format (TF).
subroutine	ctrttp (uplo, n, a, lda, ap, info)
	CTRTTP copies a triangular matrix from the standard full format (TR) to the standard packed format (TP).
subroutine	ctzrzf (m, n, a, lda, tau, work, lwork, info)
	CTZRZF
subroutine	cunbdb (trans, signs, m, p, q, x11, ldx11, x12, ldx12, x21, ldx21, x22, ldx22, theta, phi, taup1, taup2, tauq1, tauq2, work, lwork, info)
	CUNBDB
subroutine	cunbdb1 (m, p, q, x11, ldx11, x21, ldx21, theta, phi, taup1, taup2, tauq1, work, lwork, info)
	CUNBDB1
subroutine	cunbdb2 (m, p, q, x11, ldx11, x21, ldx21, theta, phi, taup1, taup2, tauq1, work, lwork, info)
	CUNBDB2
subroutine	cunbdb3 (m, p, q, x11, ldx11, x21, ldx21, theta, phi, taup1, taup2, tauq1, work, lwork, info)
	CUNBDB3
subroutine	cunbdb4 (m, p, q, x11, ldx11, x21, ldx21, theta, phi, taup1, taup2, tauq1, phantom, work, lwork, info)
	CUNBDB4
subroutine	cunbdb5 (m1, m2, n, x1, incx1, x2, incx2, q1, ldq1, q2, ldq2, work, lwork, info)
	CUNBDB5
subroutine	cunbdb6 (m1, m2, n, x1, incx1, x2, incx2, q1, ldq1, q2, ldq2, work, lwork, info)
	CUNBDB6
recursive subroutine	cuncsd (jobu1, jobu2, jobv1t, jobv2t, trans, signs, m, p, q, x11, ldx11, x12, ldx12, x21, ldx21, x22, ldx22, theta, u1, ldu1, u2, ldu2, v1t, ldv1t, v2t, ldv2t, work, lwork, rwork, lrwork, iwork, info)
	CUNCSD
subroutine	cuncsd2by1 (jobu1, jobu2, jobv1t, m, p, q, x11, ldx11, x21, ldx21, theta, u1, ldu1, u2, ldu2, v1t, ldv1t, work, lwork, rwork, lrwork, iwork, info)
	CUNCSD2BY1
subroutine	cung2l (m, n, k, a, lda, tau, work, info)
	CUNG2L generates all or part of the unitary matrix Q from a QL factorization determined by cgeqlf (unblocked algorithm).
subroutine	cung2r (m, n, k, a, lda, tau, work, info)
	CUNG2R
subroutine	cunghr (n, ilo, ihi, a, lda, tau, work, lwork, info)
	CUNGHR
subroutine	cungl2 (m, n, k, a, lda, tau, work, info)
	CUNGL2 generates all or part of the unitary matrix Q from an LQ factorization determined by cgelqf (unblocked algorithm).
subroutine	cunglq (m, n, k, a, lda, tau, work, lwork, info)
	CUNGLQ
subroutine	cungql (m, n, k, a, lda, tau, work, lwork, info)
	CUNGQL
subroutine	cungqr (m, n, k, a, lda, tau, work, lwork, info)
	CUNGQR
subroutine	cungr2 (m, n, k, a, lda, tau, work, info)
	CUNGR2 generates all or part of the unitary matrix Q from an RQ factorization determined by cgerqf (unblocked algorithm).
subroutine	cungrq (m, n, k, a, lda, tau, work, lwork, info)
	CUNGRQ
subroutine	cungtr (uplo, n, a, lda, tau, work, lwork, info)
	CUNGTR
subroutine	cungtsqr (m, n, mb, nb, a, lda, t, ldt, work, lwork, info)
	CUNGTSQR
subroutine	cungtsqr_row (m, n, mb, nb, a, lda, t, ldt, work, lwork, info)
	CUNGTSQR_ROW
subroutine	cunhr_col (m, n, nb, a, lda, t, ldt, d, info)
	CUNHR_COL
subroutine	cunm22 (side, trans, m, n, n1, n2, q, ldq, c, ldc, work, lwork, info)
	CUNM22 multiplies a general matrix by a banded unitary matrix.
subroutine	cunm2l (side, trans, m, n, k, a, lda, tau, c, ldc, work, info)
	CUNM2L multiplies a general matrix by the unitary matrix from a QL factorization determined by cgeqlf (unblocked algorithm).
subroutine	cunm2r (side, trans, m, n, k, a, lda, tau, c, ldc, work, info)
	CUNM2R multiplies a general matrix by the unitary matrix from a QR factorization determined by cgeqrf (unblocked algorithm).
subroutine	cunmbr (vect, side, trans, m, n, k, a, lda, tau, c, ldc, work, lwork, info)
	CUNMBR
subroutine	cunmhr (side, trans, m, n, ilo, ihi, a, lda, tau, c, ldc, work, lwork, info)
	CUNMHR
subroutine	cunml2 (side, trans, m, n, k, a, lda, tau, c, ldc, work, info)
	CUNML2 multiplies a general matrix by the unitary matrix from an LQ factorization determined by cgelqf (unblocked algorithm).
subroutine	cunmlq (side, trans, m, n, k, a, lda, tau, c, ldc, work, lwork, info)
	CUNMLQ
subroutine	cunmql (side, trans, m, n, k, a, lda, tau, c, ldc, work, lwork, info)
	CUNMQL
subroutine	cunmqr (side, trans, m, n, k, a, lda, tau, c, ldc, work, lwork, info)
	CUNMQR
subroutine	cunmr2 (side, trans, m, n, k, a, lda, tau, c, ldc, work, info)
	CUNMR2 multiplies a general matrix by the unitary matrix from an RQ factorization determined by cgerqf (unblocked algorithm).
subroutine	cunmr3 (side, trans, m, n, k, l, a, lda, tau, c, ldc, work, info)
	CUNMR3 multiplies a general matrix by the unitary matrix from an RZ factorization determined by ctzrzf (unblocked algorithm).
subroutine	cunmrq (side, trans, m, n, k, a, lda, tau, c, ldc, work, lwork, info)
	CUNMRQ
subroutine	cunmrz (side, trans, m, n, k, l, a, lda, tau, c, ldc, work, lwork, info)
	CUNMRZ
subroutine	cunmtr (side, uplo, trans, m, n, a, lda, tau, c, ldc, work, lwork, info)
	CUNMTR
subroutine	cupgtr (uplo, n, ap, tau, q, ldq, work, info)
	CUPGTR
subroutine	cupmtr (side, uplo, trans, m, n, ap, tau, c, ldc, work, info)
	CUPMTR
subroutine	cggsvp (jobu, jobv, jobq, m, p, n, a, lda, b, ldb, tola, tolb, k, l, u, ldu, v, ldv, q, ldq, iwork, rwork, tau, work, info)
	CGGSVP
subroutine	clatzm (side, m, n, v, incv, tau, c1, c2, ldc, work)
	CLATZM
subroutine	ctzrqf (m, n, a, lda, tau, info)
	CTZRQF
subroutine	dorm22 (side, trans, m, n, n1, n2, q, ldq, c, ldc, work, lwork, info)
	DORM22 multiplies a general matrix by a banded orthogonal matrix.
subroutine	sorm22 (side, trans, m, n, n1, n2, q, ldq, c, ldc, work, lwork, info)
	SORM22 multiplies a general matrix by a banded orthogonal matrix.
subroutine	zunm22 (side, trans, m, n, n1, n2, q, ldq, c, ldc, work, lwork, info)
	ZUNM22 multiplies a general matrix by a banded unitary matrix.

Detailed Description

This is the group of other computational routines for complex matrices.

Function Documentation

◆ cbbcsd()

subroutine cbbcsd	(	character	jobu1,
		character	jobu2,
		character	jobv1t,
		character	jobv2t,
		character	trans,
		integer	m,
		integer	p,
		integer	q,
		real, dimension( * )	theta,
		real, dimension( * )	phi,
		complex, dimension( ldu1, * )	u1,
		integer	ldu1,
		complex, dimension( ldu2, * )	u2,
		integer	ldu2,
		complex, dimension( ldv1t, * )	v1t,
		integer	ldv1t,
		complex, dimension( ldv2t, * )	v2t,
		integer	ldv2t,
		real, dimension( * )	b11d,
		real, dimension( * )	b11e,
		real, dimension( * )	b12d,
		real, dimension( * )	b12e,
		real, dimension( * )	b21d,
		real, dimension( * )	b21e,
		real, dimension( * )	b22d,
		real, dimension( * )	b22e,
		real, dimension( * )	rwork,
		integer	lrwork,
		integer	info )

CBBCSD

Download CBBCSD + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CBBCSD computes the CS decomposition of a unitary matrix in
!> bidiagonal-block form,
!>
!>
!>     [ B11 | B12 0  0 ]
!>     [  0  |  0 -I  0 ]
!> X = [----------------]
!>     [ B21 | B22 0  0 ]
!>     [  0  |  0  0  I ]
!>
!>                               [  C | -S  0  0 ]
!>                   [ U1 |    ] [  0 |  0 -I  0 ] [ V1 |    ]**H
!>                 = [---------] [---------------] [---------]   .
!>                   [    | U2 ] [  S |  C  0  0 ] [    | V2 ]
!>                               [  0 |  0  0  I ]
!>
!> X is M-by-M, its top-left block is P-by-Q, and Q must be no larger
!> than P, M-P, or M-Q. (If Q is not the smallest index, then X must be
!> transposed and/or permuted. This can be done in constant time using
!> the TRANS and SIGNS options. See CUNCSD for details.)
!>
!> The bidiagonal matrices B11, B12, B21, and B22 are represented
!> implicitly by angles THETA(1:Q) and PHI(1:Q-1).
!>
!> The unitary matrices U1, U2, V1T, and V2T are input/output.
!> The input matrices are pre- or post-multiplied by the appropriate
!> singular vector matrices.
!>

Parameters

[in]	JOBU1	!> JOBU1 is CHARACTER !> = 'Y': U1 is updated; !> otherwise: U1 is not updated. !>
[in]	JOBU2	!> JOBU2 is CHARACTER !> = 'Y': U2 is updated; !> otherwise: U2 is not updated. !>
[in]	JOBV1T	!> JOBV1T is CHARACTER !> = 'Y': V1T is updated; !> otherwise: V1T is not updated. !>
[in]	JOBV2T	!> JOBV2T is CHARACTER !> = 'Y': V2T is updated; !> otherwise: V2T is not updated. !>
[in]	TRANS	!> TRANS is CHARACTER !> = 'T': X, U1, U2, V1T, and V2T are stored in row-major !> order; !> otherwise: X, U1, U2, V1T, and V2T are stored in column- !> major order. !>
[in]	M	!> M is INTEGER !> The number of rows and columns in X, the unitary matrix in !> bidiagonal-block form. !>
[in]	P	!> P is INTEGER !> The number of rows in the top-left block of X. 0 <= P <= M. !>
[in]	Q	!> Q is INTEGER !> The number of columns in the top-left block of X. !> 0 <= Q <= MIN(P,M-P,M-Q). !>
[in,out]	THETA	!> THETA is REAL array, dimension (Q) !> On entry, the angles THETA(1),...,THETA(Q) that, along with !> PHI(1), ...,PHI(Q-1), define the matrix in bidiagonal-block !> form. On exit, the angles whose cosines and sines define the !> diagonal blocks in the CS decomposition. !>
[in,out]	PHI	!> PHI is REAL array, dimension (Q-1) !> The angles PHI(1),...,PHI(Q-1) that, along with THETA(1),..., !> THETA(Q), define the matrix in bidiagonal-block form. !>
[in,out]	U1	!> U1 is COMPLEX array, dimension (LDU1,P) !> On entry, a P-by-P matrix. On exit, U1 is postmultiplied !> by the left singular vector matrix common to [ B11 ; 0 ] and !> [ B12 0 0 ; 0 -I 0 ]. !>
[in]	LDU1	!> LDU1 is INTEGER !> The leading dimension of the array U1, LDU1 >= MAX(1,P). !>
[in,out]	U2	!> U2 is COMPLEX array, dimension (LDU2,M-P) !> On entry, an (M-P)-by-(M-P) matrix. On exit, U2 is !> postmultiplied by the left singular vector matrix common to !> [ B21 ; 0 ] and [ B22 0 0 ; 0 0 I ]. !>
[in]	LDU2	!> LDU2 is INTEGER !> The leading dimension of the array U2, LDU2 >= MAX(1,M-P). !>
[in,out]	V1T	!> V1T is COMPLEX array, dimension (LDV1T,Q) !> On entry, a Q-by-Q matrix. On exit, V1T is premultiplied !> by the conjugate transpose of the right singular vector !> matrix common to [ B11 ; 0 ] and [ B21 ; 0 ]. !>
[in]	LDV1T	!> LDV1T is INTEGER !> The leading dimension of the array V1T, LDV1T >= MAX(1,Q). !>
[in,out]	V2T	!> V2T is COMPLEX array, dimension (LDV2T,M-Q) !> On entry, an (M-Q)-by-(M-Q) matrix. On exit, V2T is !> premultiplied by the conjugate transpose of the right !> singular vector matrix common to [ B12 0 0 ; 0 -I 0 ] and !> [ B22 0 0 ; 0 0 I ]. !>
[in]	LDV2T	!> LDV2T is INTEGER !> The leading dimension of the array V2T, LDV2T >= MAX(1,M-Q). !>
[out]	B11D	!> B11D is REAL array, dimension (Q) !> When CBBCSD converges, B11D contains the cosines of THETA(1), !> ..., THETA(Q). If CBBCSD fails to converge, then B11D !> contains the diagonal of the partially reduced top-left !> block. !>
[out]	B11E	!> B11E is REAL array, dimension (Q-1) !> When CBBCSD converges, B11E contains zeros. If CBBCSD fails !> to converge, then B11E contains the superdiagonal of the !> partially reduced top-left block. !>
[out]	B12D	!> B12D is REAL array, dimension (Q) !> When CBBCSD converges, B12D contains the negative sines of !> THETA(1), ..., THETA(Q). If CBBCSD fails to converge, then !> B12D contains the diagonal of the partially reduced top-right !> block. !>
[out]	B12E	!> B12E is REAL array, dimension (Q-1) !> When CBBCSD converges, B12E contains zeros. If CBBCSD fails !> to converge, then B12E contains the subdiagonal of the !> partially reduced top-right block. !>
[out]	B21D	!> B21D is REAL array, dimension (Q) !> When CBBCSD converges, B21D contains the negative sines of !> THETA(1), ..., THETA(Q). If CBBCSD fails to converge, then !> B21D contains the diagonal of the partially reduced bottom-left !> block. !>
[out]	B21E	!> B21E is REAL array, dimension (Q-1) !> When CBBCSD converges, B21E contains zeros. If CBBCSD fails !> to converge, then B21E contains the subdiagonal of the !> partially reduced bottom-left block. !>
[out]	B22D	!> B22D is REAL array, dimension (Q) !> When CBBCSD converges, B22D contains the cosines of !> THETA(1), ..., THETA(Q). If CBBCSD fails to converge, then !> B22D contains the diagonal of the partially reduced bottom-right !> block. !>
[out]	B22E	!> B22E is REAL array, dimension (Q-1) !> When CBBCSD converges, B22E contains zeros. If CBBCSD fails !> to converge, then B22E contains the subdiagonal of the !> partially reduced bottom-right block. !>
[out]	RWORK	!> RWORK is REAL array, dimension (MAX(1,LRWORK)) !> On exit, if INFO = 0, RWORK(1) returns the optimal LRWORK. !>
[in]	LRWORK	!> LRWORK is INTEGER !> The dimension of the array RWORK. LRWORK >= MAX(1,8*Q). !> !> If LRWORK = -1, then a workspace query is assumed; the !> routine only calculates the optimal size of the RWORK array, !> returns this value as the first entry of the RWORK array, and !> no error message related to LRWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: if CBBCSD did not converge, INFO specifies the number !> of nonzero entries in PHI, and B11D, B11E, etc., !> contain the partially reduced matrix. !>

Internal Parameters:

!>  TOLMUL  REAL, default = MAX(10,MIN(100,EPS**(-1/8)))
!>          TOLMUL controls the convergence criterion of the QR loop.
!>          Angles THETA(i), PHI(i) are rounded to 0 or PI/2 when they
!>          are within TOLMUL*EPS of either bound.
!>

References: [1] Brian D. Sutton. Computing the complete CS decomposition. Numer. Algorithms, 50(1):33-65, 2009.

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 328 of file cbbcsd.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          JOBU1, JOBU2, JOBV1T, JOBV2T, TRANS
      INTEGER            INFO, LDU1, LDU2, LDV1T, LDV2T, LRWORK, M, P, Q
*     ..
*     .. Array Arguments ..
      REAL               B11D( * ), B11E( * ), B12D( * ), B12E( * ),
     $                   B21D( * ), B21E( * ), B22D( * ), B22E( * ),
     $                   PHI( * ), THETA( * ), RWORK( * )
      COMPLEX            U1( LDU1, * ), U2( LDU2, * ), V1T( LDV1T, * ),
     $                   V2T( LDV2T, * )
*     ..
*
*  ===================================================================
*
*     .. Parameters ..
      INTEGER            MAXITR
      parameter( maxitr = 6 )
      REAL               HUNDRED, MEIGHTH, ONE, TEN, ZERO
      parameter( hundred = 100.0e0, meighth = -0.125e0,
     $                     one = 1.0e0, ten = 10.0e0, zero = 0.0e0 )
      COMPLEX            NEGONECOMPLEX
      parameter( negonecomplex = (-1.0e0,0.0e0) )
      REAL               PIOVER2
      parameter( piover2 = 1.57079632679489661923132169163975144210e0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            COLMAJOR, LQUERY, RESTART11, RESTART12,
     $                   RESTART21, RESTART22, WANTU1, WANTU2, WANTV1T,
     $                   WANTV2T
      INTEGER            I, IMIN, IMAX, ITER, IU1CS, IU1SN, IU2CS,
     $                   IU2SN, IV1TCS, IV1TSN, IV2TCS, IV2TSN, J,
     $                   LRWORKMIN, LRWORKOPT, MAXIT, MINI
      REAL               B11BULGE, B12BULGE, B21BULGE, B22BULGE, DUMMY,
     $                   EPS, MU, NU, R, SIGMA11, SIGMA21,
     $                   TEMP, THETAMAX, THETAMIN, THRESH, TOL, TOLMUL,
     $                   UNFL, X1, X2, Y1, Y2
*
*     .. External Subroutines ..
      EXTERNAL           clasr, cscal, cswap, slartgp, slartgs, slas2,
     $                   xerbla
*     ..
*     .. External Functions ..
      REAL               SLAMCH
      LOGICAL            LSAME
      EXTERNAL           lsame, slamch
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, atan2, cos, max, min, sin, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test input arguments
*
      info = 0
      lquery = lrwork .EQ. -1
      wantu1 = lsame( jobu1, 'Y' )
      wantu2 = lsame( jobu2, 'Y' )
      wantv1t = lsame( jobv1t, 'Y' )
      wantv2t = lsame( jobv2t, 'Y' )
      colmajor = .NOT. lsame( trans, 'T' )
*
      IF( m .LT. 0 ) THEN
         info = -6
      ELSE IF( p .LT. 0 .OR. p .GT. m ) THEN
         info = -7
      ELSE IF( q .LT. 0 .OR. q .GT. m ) THEN
         info = -8
      ELSE IF( q .GT. p .OR. q .GT. m-p .OR. q .GT. m-q ) THEN
         info = -8
      ELSE IF( wantu1 .AND. ldu1 .LT. p ) THEN
         info = -12
      ELSE IF( wantu2 .AND. ldu2 .LT. m-p ) THEN
         info = -14
      ELSE IF( wantv1t .AND. ldv1t .LT. q ) THEN
         info = -16
      ELSE IF( wantv2t .AND. ldv2t .LT. m-q ) THEN
         info = -18
      END IF
*
*     Quick return if Q = 0
*
      IF( info .EQ. 0 .AND. q .EQ. 0 ) THEN
         lrworkmin = 1
         rwork(1) = lrworkmin
         RETURN
      END IF
*
*     Compute workspace
*
      IF( info .EQ. 0 ) THEN
         iu1cs = 1
         iu1sn = iu1cs + q
         iu2cs = iu1sn + q
         iu2sn = iu2cs + q
         iv1tcs = iu2sn + q
         iv1tsn = iv1tcs + q
         iv2tcs = iv1tsn + q
         iv2tsn = iv2tcs + q
         lrworkopt = iv2tsn + q - 1
         lrworkmin = lrworkopt
         rwork(1) = lrworkopt
         IF( lrwork .LT. lrworkmin .AND. .NOT. lquery ) THEN
            info = -28
         END IF
      END IF
*
      IF( info .NE. 0 ) THEN
         CALL xerbla( 'CBBCSD', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Get machine constants
*
      eps = slamch( 'Epsilon' )
      unfl = slamch( 'Safe minimum' )
      tolmul = max( ten, min( hundred, eps**meighth ) )
      tol = tolmul*eps
      thresh = max( tol, maxitr*q*q*unfl )
*
*     Test for negligible sines or cosines
*
      DO i = 1, q
         IF( theta(i) .LT. thresh ) THEN
            theta(i) = zero
         ELSE IF( theta(i) .GT. piover2-thresh ) THEN
            theta(i) = piover2
         END IF
      END DO
      DO i = 1, q-1
         IF( phi(i) .LT. thresh ) THEN
            phi(i) = zero
         ELSE IF( phi(i) .GT. piover2-thresh ) THEN
            phi(i) = piover2
         END IF
      END DO
*
*     Initial deflation
*
      imax = q
      DO WHILE( imax .GT. 1 )
         IF( phi(imax-1) .NE. zero ) THEN
            EXIT
         END IF
         imax = imax - 1
      END DO
      imin = imax - 1
      IF  ( imin .GT. 1 ) THEN
         DO WHILE( phi(imin-1) .NE. zero )
            imin = imin - 1
            IF  ( imin .LE. 1 ) EXIT
         END DO
      END IF
*
*     Initialize iteration counter
*
      maxit = maxitr*q*q
      iter = 0
*
*     Begin main iteration loop
*
      DO WHILE( imax .GT. 1 )
*
*        Compute the matrix entries
*
         b11d(imin) = cos( theta(imin) )
         b21d(imin) = -sin( theta(imin) )
         DO i = imin, imax - 1
            b11e(i) = -sin( theta(i) ) * sin( phi(i) )
            b11d(i+1) = cos( theta(i+1) ) * cos( phi(i) )
            b12d(i) = sin( theta(i) ) * cos( phi(i) )
            b12e(i) = cos( theta(i+1) ) * sin( phi(i) )
            b21e(i) = -cos( theta(i) ) * sin( phi(i) )
            b21d(i+1) = -sin( theta(i+1) ) * cos( phi(i) )
            b22d(i) = cos( theta(i) ) * cos( phi(i) )
            b22e(i) = -sin( theta(i+1) ) * sin( phi(i) )
         END DO
         b12d(imax) = sin( theta(imax) )
         b22d(imax) = cos( theta(imax) )
*
*        Abort if not converging; otherwise, increment ITER
*
         IF( iter .GT. maxit ) THEN
            info = 0
            DO i = 1, q
               IF( phi(i) .NE. zero )
     $            info = info + 1
            END DO
            RETURN
         END IF
*
         iter = iter + imax - imin
*
*        Compute shifts
*
         thetamax = theta(imin)
         thetamin = theta(imin)
         DO i = imin+1, imax
            IF( theta(i) > thetamax )
     $         thetamax = theta(i)
            IF( theta(i) < thetamin )
     $         thetamin = theta(i)
         END DO
*
         IF( thetamax .GT. piover2 - thresh ) THEN
*
*           Zero on diagonals of B11 and B22; induce deflation with a
*           zero shift
*
            mu = zero
            nu = one
*
         ELSE IF( thetamin .LT. thresh ) THEN
*
*           Zero on diagonals of B12 and B22; induce deflation with a
*           zero shift
*
            mu = one
            nu = zero
*
         ELSE
*
*           Compute shifts for B11 and B21 and use the lesser
*
            CALL slas2( b11d(imax-1), b11e(imax-1), b11d(imax), sigma11,
     $                  dummy )
            CALL slas2( b21d(imax-1), b21e(imax-1), b21d(imax), sigma21,
     $                  dummy )
*
            IF( sigma11 .LE. sigma21 ) THEN
               mu = sigma11
               nu = sqrt( one - mu**2 )
               IF( mu .LT. thresh ) THEN
                  mu = zero
                  nu = one
               END IF
            ELSE
               nu = sigma21
               mu = sqrt( 1.0 - nu**2 )
               IF( nu .LT. thresh ) THEN
                  mu = one
                  nu = zero
               END IF
            END IF
         END IF
*
*        Rotate to produce bulges in B11 and B21
*
         IF( mu .LE. nu ) THEN
            CALL slartgs( b11d(imin), b11e(imin), mu,
     $                    rwork(iv1tcs+imin-1), rwork(iv1tsn+imin-1) )
         ELSE
            CALL slartgs( b21d(imin), b21e(imin), nu,
     $                    rwork(iv1tcs+imin-1), rwork(iv1tsn+imin-1) )
         END IF
*
         temp = rwork(iv1tcs+imin-1)*b11d(imin) +
     $          rwork(iv1tsn+imin-1)*b11e(imin)
         b11e(imin) = rwork(iv1tcs+imin-1)*b11e(imin) -
     $                rwork(iv1tsn+imin-1)*b11d(imin)
         b11d(imin) = temp
         b11bulge = rwork(iv1tsn+imin-1)*b11d(imin+1)
         b11d(imin+1) = rwork(iv1tcs+imin-1)*b11d(imin+1)
         temp = rwork(iv1tcs+imin-1)*b21d(imin) +
     $          rwork(iv1tsn+imin-1)*b21e(imin)
         b21e(imin) = rwork(iv1tcs+imin-1)*b21e(imin) -
     $                rwork(iv1tsn+imin-1)*b21d(imin)
         b21d(imin) = temp
         b21bulge = rwork(iv1tsn+imin-1)*b21d(imin+1)
         b21d(imin+1) = rwork(iv1tcs+imin-1)*b21d(imin+1)
*
*        Compute THETA(IMIN)
*
         theta( imin ) = atan2( sqrt( b21d(imin)**2+b21bulge**2 ),
     $                   sqrt( b11d(imin)**2+b11bulge**2 ) )
*
*        Chase the bulges in B11(IMIN+1,IMIN) and B21(IMIN+1,IMIN)
*
         IF( b11d(imin)**2+b11bulge**2 .GT. thresh**2 ) THEN
            CALL slartgp( b11bulge, b11d(imin), rwork(iu1sn+imin-1),
     $                    rwork(iu1cs+imin-1), r )
         ELSE IF( mu .LE. nu ) THEN
            CALL slartgs( b11e( imin ), b11d( imin + 1 ), mu,
     $                    rwork(iu1cs+imin-1), rwork(iu1sn+imin-1) )
         ELSE
            CALL slartgs( b12d( imin ), b12e( imin ), nu,
     $                    rwork(iu1cs+imin-1), rwork(iu1sn+imin-1) )
         END IF
         IF( b21d(imin)**2+b21bulge**2 .GT. thresh**2 ) THEN
            CALL slartgp( b21bulge, b21d(imin), rwork(iu2sn+imin-1),
     $                    rwork(iu2cs+imin-1), r )
         ELSE IF( nu .LT. mu ) THEN
            CALL slartgs( b21e( imin ), b21d( imin + 1 ), nu,
     $                    rwork(iu2cs+imin-1), rwork(iu2sn+imin-1) )
         ELSE
            CALL slartgs( b22d(imin), b22e(imin), mu,
     $                    rwork(iu2cs+imin-1), rwork(iu2sn+imin-1) )
         END IF
         rwork(iu2cs+imin-1) = -rwork(iu2cs+imin-1)
         rwork(iu2sn+imin-1) = -rwork(iu2sn+imin-1)
*
         temp = rwork(iu1cs+imin-1)*b11e(imin) +
     $          rwork(iu1sn+imin-1)*b11d(imin+1)
         b11d(imin+1) = rwork(iu1cs+imin-1)*b11d(imin+1) -
     $                  rwork(iu1sn+imin-1)*b11e(imin)
         b11e(imin) = temp
         IF( imax .GT. imin+1 ) THEN
            b11bulge = rwork(iu1sn+imin-1)*b11e(imin+1)
            b11e(imin+1) = rwork(iu1cs+imin-1)*b11e(imin+1)
         END IF
         temp = rwork(iu1cs+imin-1)*b12d(imin) +
     $          rwork(iu1sn+imin-1)*b12e(imin)
         b12e(imin) = rwork(iu1cs+imin-1)*b12e(imin) -
     $                rwork(iu1sn+imin-1)*b12d(imin)
         b12d(imin) = temp
         b12bulge = rwork(iu1sn+imin-1)*b12d(imin+1)
         b12d(imin+1) = rwork(iu1cs+imin-1)*b12d(imin+1)
         temp = rwork(iu2cs+imin-1)*b21e(imin) +
     $          rwork(iu2sn+imin-1)*b21d(imin+1)
         b21d(imin+1) = rwork(iu2cs+imin-1)*b21d(imin+1) -
     $                  rwork(iu2sn+imin-1)*b21e(imin)
         b21e(imin) = temp
         IF( imax .GT. imin+1 ) THEN
            b21bulge = rwork(iu2sn+imin-1)*b21e(imin+1)
            b21e(imin+1) = rwork(iu2cs+imin-1)*b21e(imin+1)
         END IF
         temp = rwork(iu2cs+imin-1)*b22d(imin) +
     $          rwork(iu2sn+imin-1)*b22e(imin)
         b22e(imin) = rwork(iu2cs+imin-1)*b22e(imin) -
     $                rwork(iu2sn+imin-1)*b22d(imin)
         b22d(imin) = temp
         b22bulge = rwork(iu2sn+imin-1)*b22d(imin+1)
         b22d(imin+1) = rwork(iu2cs+imin-1)*b22d(imin+1)
*
*        Inner loop: chase bulges from B11(IMIN,IMIN+2),
*        B12(IMIN,IMIN+1), B21(IMIN,IMIN+2), and B22(IMIN,IMIN+1) to
*        bottom-right
*
         DO i = imin+1, imax-1
*
*           Compute PHI(I-1)
*
            x1 = sin(theta(i-1))*b11e(i-1) + cos(theta(i-1))*b21e(i-1)
            x2 = sin(theta(i-1))*b11bulge + cos(theta(i-1))*b21bulge
            y1 = sin(theta(i-1))*b12d(i-1) + cos(theta(i-1))*b22d(i-1)
            y2 = sin(theta(i-1))*b12bulge + cos(theta(i-1))*b22bulge
*
            phi(i-1) = atan2( sqrt(x1**2+x2**2), sqrt(y1**2+y2**2) )
*
*           Determine if there are bulges to chase or if a new direct
*           summand has been reached
*
            restart11 = b11e(i-1)**2 + b11bulge**2 .LE. thresh**2
            restart21 = b21e(i-1)**2 + b21bulge**2 .LE. thresh**2
            restart12 = b12d(i-1)**2 + b12bulge**2 .LE. thresh**2
            restart22 = b22d(i-1)**2 + b22bulge**2 .LE. thresh**2
*
*           If possible, chase bulges from B11(I-1,I+1), B12(I-1,I),
*           B21(I-1,I+1), and B22(I-1,I). If necessary, restart bulge-
*           chasing by applying the original shift again.
*
            IF( .NOT. restart11 .AND. .NOT. restart21 ) THEN
               CALL slartgp( x2, x1, rwork(iv1tsn+i-1),
     $                       rwork(iv1tcs+i-1), r )
            ELSE IF( .NOT. restart11 .AND. restart21 ) THEN
               CALL slartgp( b11bulge, b11e(i-1), rwork(iv1tsn+i-1),
     $                       rwork(iv1tcs+i-1), r )
            ELSE IF( restart11 .AND. .NOT. restart21 ) THEN
               CALL slartgp( b21bulge, b21e(i-1), rwork(iv1tsn+i-1),
     $                       rwork(iv1tcs+i-1), r )
            ELSE IF( mu .LE. nu ) THEN
               CALL slartgs( b11d(i), b11e(i), mu, rwork(iv1tcs+i-1),
     $                       rwork(iv1tsn+i-1) )
            ELSE
               CALL slartgs( b21d(i), b21e(i), nu, rwork(iv1tcs+i-1),
     $                       rwork(iv1tsn+i-1) )
            END IF
            rwork(iv1tcs+i-1) = -rwork(iv1tcs+i-1)
            rwork(iv1tsn+i-1) = -rwork(iv1tsn+i-1)
            IF( .NOT. restart12 .AND. .NOT. restart22 ) THEN
               CALL slartgp( y2, y1, rwork(iv2tsn+i-1-1),
     $                       rwork(iv2tcs+i-1-1), r )
            ELSE IF( .NOT. restart12 .AND. restart22 ) THEN
               CALL slartgp( b12bulge, b12d(i-1), rwork(iv2tsn+i-1-1),
     $                       rwork(iv2tcs+i-1-1), r )
            ELSE IF( restart12 .AND. .NOT. restart22 ) THEN
               CALL slartgp( b22bulge, b22d(i-1), rwork(iv2tsn+i-1-1),
     $                       rwork(iv2tcs+i-1-1), r )
            ELSE IF( nu .LT. mu ) THEN
               CALL slartgs( b12e(i-1), b12d(i), nu,
     $                       rwork(iv2tcs+i-1-1), rwork(iv2tsn+i-1-1) )
            ELSE
               CALL slartgs( b22e(i-1), b22d(i), mu,
     $                       rwork(iv2tcs+i-1-1), rwork(iv2tsn+i-1-1) )
            END IF
*
            temp = rwork(iv1tcs+i-1)*b11d(i) + rwork(iv1tsn+i-1)*b11e(i)
            b11e(i) = rwork(iv1tcs+i-1)*b11e(i) -
     $                rwork(iv1tsn+i-1)*b11d(i)
            b11d(i) = temp
            b11bulge = rwork(iv1tsn+i-1)*b11d(i+1)
            b11d(i+1) = rwork(iv1tcs+i-1)*b11d(i+1)
            temp = rwork(iv1tcs+i-1)*b21d(i) + rwork(iv1tsn+i-1)*b21e(i)
            b21e(i) = rwork(iv1tcs+i-1)*b21e(i) -
     $                rwork(iv1tsn+i-1)*b21d(i)
            b21d(i) = temp
            b21bulge = rwork(iv1tsn+i-1)*b21d(i+1)
            b21d(i+1) = rwork(iv1tcs+i-1)*b21d(i+1)
            temp = rwork(iv2tcs+i-1-1)*b12e(i-1) +
     $             rwork(iv2tsn+i-1-1)*b12d(i)
            b12d(i) = rwork(iv2tcs+i-1-1)*b12d(i) -
     $                rwork(iv2tsn+i-1-1)*b12e(i-1)
            b12e(i-1) = temp
            b12bulge = rwork(iv2tsn+i-1-1)*b12e(i)
            b12e(i) = rwork(iv2tcs+i-1-1)*b12e(i)
            temp = rwork(iv2tcs+i-1-1)*b22e(i-1) +
     $             rwork(iv2tsn+i-1-1)*b22d(i)
            b22d(i) = rwork(iv2tcs+i-1-1)*b22d(i) -
     $                rwork(iv2tsn+i-1-1)*b22e(i-1)
            b22e(i-1) = temp
            b22bulge = rwork(iv2tsn+i-1-1)*b22e(i)
            b22e(i) = rwork(iv2tcs+i-1-1)*b22e(i)
*
*           Compute THETA(I)
*
            x1 = cos(phi(i-1))*b11d(i) + sin(phi(i-1))*b12e(i-1)
            x2 = cos(phi(i-1))*b11bulge + sin(phi(i-1))*b12bulge
            y1 = cos(phi(i-1))*b21d(i) + sin(phi(i-1))*b22e(i-1)
            y2 = cos(phi(i-1))*b21bulge + sin(phi(i-1))*b22bulge
*
            theta(i) = atan2( sqrt(y1**2+y2**2), sqrt(x1**2+x2**2) )
*
*           Determine if there are bulges to chase or if a new direct
*           summand has been reached
*
            restart11 =   b11d(i)**2 + b11bulge**2 .LE. thresh**2
            restart12 = b12e(i-1)**2 + b12bulge**2 .LE. thresh**2
            restart21 =   b21d(i)**2 + b21bulge**2 .LE. thresh**2
            restart22 = b22e(i-1)**2 + b22bulge**2 .LE. thresh**2
*
*           If possible, chase bulges from B11(I+1,I), B12(I+1,I-1),
*           B21(I+1,I), and B22(I+1,I-1). If necessary, restart bulge-
*           chasing by applying the original shift again.
*
            IF( .NOT. restart11 .AND. .NOT. restart12 ) THEN
               CALL slartgp( x2, x1, rwork(iu1sn+i-1), rwork(iu1cs+i-1),
     $                       r )
            ELSE IF( .NOT. restart11 .AND. restart12 ) THEN
               CALL slartgp( b11bulge, b11d(i), rwork(iu1sn+i-1),
     $                       rwork(iu1cs+i-1), r )
            ELSE IF( restart11 .AND. .NOT. restart12 ) THEN
               CALL slartgp( b12bulge, b12e(i-1), rwork(iu1sn+i-1),
     $                       rwork(iu1cs+i-1), r )
            ELSE IF( mu .LE. nu ) THEN
               CALL slartgs( b11e(i), b11d(i+1), mu, rwork(iu1cs+i-1),
     $                       rwork(iu1sn+i-1) )
            ELSE
               CALL slartgs( b12d(i), b12e(i), nu, rwork(iu1cs+i-1),
     $                       rwork(iu1sn+i-1) )
            END IF
            IF( .NOT. restart21 .AND. .NOT. restart22 ) THEN
               CALL slartgp( y2, y1, rwork(iu2sn+i-1), rwork(iu2cs+i-1),
     $                       r )
            ELSE IF( .NOT. restart21 .AND. restart22 ) THEN
               CALL slartgp( b21bulge, b21d(i), rwork(iu2sn+i-1),
     $                       rwork(iu2cs+i-1), r )
            ELSE IF( restart21 .AND. .NOT. restart22 ) THEN
               CALL slartgp( b22bulge, b22e(i-1), rwork(iu2sn+i-1),
     $                       rwork(iu2cs+i-1), r )
            ELSE IF( nu .LT. mu ) THEN
               CALL slartgs( b21e(i), b21e(i+1), nu, rwork(iu2cs+i-1),
     $                       rwork(iu2sn+i-1) )
            ELSE
               CALL slartgs( b22d(i), b22e(i), mu, rwork(iu2cs+i-1),
     $                       rwork(iu2sn+i-1) )
            END IF
            rwork(iu2cs+i-1) = -rwork(iu2cs+i-1)
            rwork(iu2sn+i-1) = -rwork(iu2sn+i-1)
*
            temp = rwork(iu1cs+i-1)*b11e(i) + rwork(iu1sn+i-1)*b11d(i+1)
            b11d(i+1) = rwork(iu1cs+i-1)*b11d(i+1) -
     $                  rwork(iu1sn+i-1)*b11e(i)
            b11e(i) = temp
            IF( i .LT. imax - 1 ) THEN
               b11bulge = rwork(iu1sn+i-1)*b11e(i+1)
               b11e(i+1) = rwork(iu1cs+i-1)*b11e(i+1)
            END IF
            temp = rwork(iu2cs+i-1)*b21e(i) + rwork(iu2sn+i-1)*b21d(i+1)
            b21d(i+1) = rwork(iu2cs+i-1)*b21d(i+1) -
     $                  rwork(iu2sn+i-1)*b21e(i)
            b21e(i) = temp
            IF( i .LT. imax - 1 ) THEN
               b21bulge = rwork(iu2sn+i-1)*b21e(i+1)
               b21e(i+1) = rwork(iu2cs+i-1)*b21e(i+1)
            END IF
            temp = rwork(iu1cs+i-1)*b12d(i) + rwork(iu1sn+i-1)*b12e(i)
            b12e(i) = rwork(iu1cs+i-1)*b12e(i) -
     $                rwork(iu1sn+i-1)*b12d(i)
            b12d(i) = temp
            b12bulge = rwork(iu1sn+i-1)*b12d(i+1)
            b12d(i+1) = rwork(iu1cs+i-1)*b12d(i+1)
            temp = rwork(iu2cs+i-1)*b22d(i) + rwork(iu2sn+i-1)*b22e(i)
            b22e(i) = rwork(iu2cs+i-1)*b22e(i) -
     $                rwork(iu2sn+i-1)*b22d(i)
            b22d(i) = temp
            b22bulge = rwork(iu2sn+i-1)*b22d(i+1)
            b22d(i+1) = rwork(iu2cs+i-1)*b22d(i+1)
*
         END DO
*
*        Compute PHI(IMAX-1)
*
         x1 = sin(theta(imax-1))*b11e(imax-1) +
     $        cos(theta(imax-1))*b21e(imax-1)
         y1 = sin(theta(imax-1))*b12d(imax-1) +
     $        cos(theta(imax-1))*b22d(imax-1)
         y2 = sin(theta(imax-1))*b12bulge + cos(theta(imax-1))*b22bulge
*
         phi(imax-1) = atan2( abs(x1), sqrt(y1**2+y2**2) )
*
*        Chase bulges from B12(IMAX-1,IMAX) and B22(IMAX-1,IMAX)
*
         restart12 = b12d(imax-1)**2 + b12bulge**2 .LE. thresh**2
         restart22 = b22d(imax-1)**2 + b22bulge**2 .LE. thresh**2
*
         IF( .NOT. restart12 .AND. .NOT. restart22 ) THEN
            CALL slartgp( y2, y1, rwork(iv2tsn+imax-1-1),
     $                    rwork(iv2tcs+imax-1-1), r )
         ELSE IF( .NOT. restart12 .AND. restart22 ) THEN
            CALL slartgp( b12bulge, b12d(imax-1),
     $                    rwork(iv2tsn+imax-1-1),
     $                    rwork(iv2tcs+imax-1-1), r )
         ELSE IF( restart12 .AND. .NOT. restart22 ) THEN
            CALL slartgp( b22bulge, b22d(imax-1),
     $                    rwork(iv2tsn+imax-1-1),
     $                    rwork(iv2tcs+imax-1-1), r )
         ELSE IF( nu .LT. mu ) THEN
            CALL slartgs( b12e(imax-1), b12d(imax), nu,
     $                    rwork(iv2tcs+imax-1-1),
     $                    rwork(iv2tsn+imax-1-1) )
         ELSE
            CALL slartgs( b22e(imax-1), b22d(imax), mu,
     $                    rwork(iv2tcs+imax-1-1),
     $                    rwork(iv2tsn+imax-1-1) )
         END IF
*
         temp = rwork(iv2tcs+imax-1-1)*b12e(imax-1) +
     $          rwork(iv2tsn+imax-1-1)*b12d(imax)
         b12d(imax) = rwork(iv2tcs+imax-1-1)*b12d(imax) -
     $                rwork(iv2tsn+imax-1-1)*b12e(imax-1)
         b12e(imax-1) = temp
         temp = rwork(iv2tcs+imax-1-1)*b22e(imax-1) +
     $          rwork(iv2tsn+imax-1-1)*b22d(imax)
         b22d(imax) = rwork(iv2tcs+imax-1-1)*b22d(imax) -
     $                rwork(iv2tsn+imax-1-1)*b22e(imax-1)
         b22e(imax-1) = temp
*
*        Update singular vectors
*
         IF( wantu1 ) THEN
            IF( colmajor ) THEN
               CALL clasr( 'R', 'V', 'F', p, imax-imin+1,
     $                     rwork(iu1cs+imin-1), rwork(iu1sn+imin-1),
     $                     u1(1,imin), ldu1 )
            ELSE
               CALL clasr( 'L', 'V', 'F', imax-imin+1, p,
     $                     rwork(iu1cs+imin-1), rwork(iu1sn+imin-1),
     $                     u1(imin,1), ldu1 )
            END IF
         END IF
         IF( wantu2 ) THEN
            IF( colmajor ) THEN
               CALL clasr( 'R', 'V', 'F', m-p, imax-imin+1,
     $                     rwork(iu2cs+imin-1), rwork(iu2sn+imin-1),
     $                     u2(1,imin), ldu2 )
            ELSE
               CALL clasr( 'L', 'V', 'F', imax-imin+1, m-p,
     $                     rwork(iu2cs+imin-1), rwork(iu2sn+imin-1),
     $                     u2(imin,1), ldu2 )
            END IF
         END IF
         IF( wantv1t ) THEN
            IF( colmajor ) THEN
               CALL clasr( 'L', 'V', 'F', imax-imin+1, q,
     $                     rwork(iv1tcs+imin-1), rwork(iv1tsn+imin-1),
     $                     v1t(imin,1), ldv1t )
            ELSE
               CALL clasr( 'R', 'V', 'F', q, imax-imin+1,
     $                     rwork(iv1tcs+imin-1), rwork(iv1tsn+imin-1),
     $                     v1t(1,imin), ldv1t )
            END IF
         END IF
         IF( wantv2t ) THEN
            IF( colmajor ) THEN
               CALL clasr( 'L', 'V', 'F', imax-imin+1, m-q,
     $                     rwork(iv2tcs+imin-1), rwork(iv2tsn+imin-1),
     $                     v2t(imin,1), ldv2t )
            ELSE
               CALL clasr( 'R', 'V', 'F', m-q, imax-imin+1,
     $                     rwork(iv2tcs+imin-1), rwork(iv2tsn+imin-1),
     $                     v2t(1,imin), ldv2t )
            END IF
         END IF
*
*        Fix signs on B11(IMAX-1,IMAX) and B21(IMAX-1,IMAX)
*
         IF( b11e(imax-1)+b21e(imax-1) .GT. 0 ) THEN
            b11d(imax) = -b11d(imax)
            b21d(imax) = -b21d(imax)
            IF( wantv1t ) THEN
               IF( colmajor ) THEN
                  CALL cscal( q, negonecomplex, v1t(imax,1), ldv1t )
               ELSE
                  CALL cscal( q, negonecomplex, v1t(1,imax), 1 )
               END IF
            END IF
         END IF
*
*        Compute THETA(IMAX)
*
         x1 = cos(phi(imax-1))*b11d(imax) +
     $        sin(phi(imax-1))*b12e(imax-1)
         y1 = cos(phi(imax-1))*b21d(imax) +
     $        sin(phi(imax-1))*b22e(imax-1)
*
         theta(imax) = atan2( abs(y1), abs(x1) )
*
*        Fix signs on B11(IMAX,IMAX), B12(IMAX,IMAX-1), B21(IMAX,IMAX),
*        and B22(IMAX,IMAX-1)
*
         IF( b11d(imax)+b12e(imax-1) .LT. 0 ) THEN
            b12d(imax) = -b12d(imax)
            IF( wantu1 ) THEN
               IF( colmajor ) THEN
                  CALL cscal( p, negonecomplex, u1(1,imax), 1 )
               ELSE
                  CALL cscal( p, negonecomplex, u1(imax,1), ldu1 )
               END IF
            END IF
         END IF
         IF( b21d(imax)+b22e(imax-1) .GT. 0 ) THEN
            b22d(imax) = -b22d(imax)
            IF( wantu2 ) THEN
               IF( colmajor ) THEN
                  CALL cscal( m-p, negonecomplex, u2(1,imax), 1 )
               ELSE
                  CALL cscal( m-p, negonecomplex, u2(imax,1), ldu2 )
               END IF
            END IF
         END IF
*
*        Fix signs on B12(IMAX,IMAX) and B22(IMAX,IMAX)
*
         IF( b12d(imax)+b22d(imax) .LT. 0 ) THEN
            IF( wantv2t ) THEN
               IF( colmajor ) THEN
                  CALL cscal( m-q, negonecomplex, v2t(imax,1), ldv2t )
               ELSE
                  CALL cscal( m-q, negonecomplex, v2t(1,imax), 1 )
               END IF
            END IF
         END IF
*
*        Test for negligible sines or cosines
*
         DO i = imin, imax
            IF( theta(i) .LT. thresh ) THEN
               theta(i) = zero
            ELSE IF( theta(i) .GT. piover2-thresh ) THEN
               theta(i) = piover2
            END IF
         END DO
         DO i = imin, imax-1
            IF( phi(i) .LT. thresh ) THEN
               phi(i) = zero
            ELSE IF( phi(i) .GT. piover2-thresh ) THEN
               phi(i) = piover2
            END IF
         END DO
*
*        Deflate
*
         IF (imax .GT. 1) THEN
            DO WHILE( phi(imax-1) .EQ. zero )
               imax = imax - 1
               IF (imax .LE. 1) EXIT
            END DO
         END IF
         IF( imin .GT. imax - 1 )
     $      imin = imax - 1
         IF (imin .GT. 1) THEN
            DO WHILE (phi(imin-1) .NE. zero)
                imin = imin - 1
                IF (imin .LE. 1) EXIT
            END DO
         END IF
*
*        Repeat main iteration loop
*
      END DO
*
*     Postprocessing: order THETA from least to greatest
*
      DO i = 1, q
*
         mini = i
         thetamin = theta(i)
         DO j = i+1, q
            IF( theta(j) .LT. thetamin ) THEN
               mini = j
               thetamin = theta(j)
            END IF
         END DO
*
         IF( mini .NE. i ) THEN
            theta(mini) = theta(i)
            theta(i) = thetamin
            IF( colmajor ) THEN
               IF( wantu1 )
     $            CALL cswap( p, u1(1,i), 1, u1(1,mini), 1 )
               IF( wantu2 )
     $            CALL cswap( m-p, u2(1,i), 1, u2(1,mini), 1 )
               IF( wantv1t )
     $            CALL cswap( q, v1t(i,1), ldv1t, v1t(mini,1), ldv1t )
               IF( wantv2t )
     $            CALL cswap( m-q, v2t(i,1), ldv2t, v2t(mini,1),
     $               ldv2t )
            ELSE
               IF( wantu1 )
     $            CALL cswap( p, u1(i,1), ldu1, u1(mini,1), ldu1 )
               IF( wantu2 )
     $            CALL cswap( m-p, u2(i,1), ldu2, u2(mini,1), ldu2 )
               IF( wantv1t )
     $            CALL cswap( q, v1t(1,i), 1, v1t(1,mini), 1 )
               IF( wantv2t )
     $            CALL cswap( m-q, v2t(1,i), 1, v2t(1,mini), 1 )
            END IF
         END IF
*
      END DO
*
      RETURN
*
*     End of CBBCSD
*

◆ cbdsqr()

subroutine cbdsqr	(	character	uplo,
		integer	n,
		integer	ncvt,
		integer	nru,
		integer	ncc,
		real, dimension( * )	d,
		real, dimension( * )	e,
		complex, dimension( ldvt, * )	vt,
		integer	ldvt,
		complex, dimension( ldu, * )	u,
		integer	ldu,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		real, dimension( * )	rwork,
		integer	info )

CBDSQR

Download CBDSQR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CBDSQR computes the singular values and, optionally, the right and/or
!> left singular vectors from the singular value decomposition (SVD) of
!> a real N-by-N (upper or lower) bidiagonal matrix B using the implicit
!> zero-shift QR algorithm.  The SVD of B has the form
!>
!>    B = Q * S * P**H
!>
!> where S is the diagonal matrix of singular values, Q is an orthogonal
!> matrix of left singular vectors, and P is an orthogonal matrix of
!> right singular vectors.  If left singular vectors are requested, this
!> subroutine actually returns U*Q instead of Q, and, if right singular
!> vectors are requested, this subroutine returns P**H*VT instead of
!> P**H, for given complex input matrices U and VT.  When U and VT are
!> the unitary matrices that reduce a general matrix A to bidiagonal
!> form: A = U*B*VT, as computed by CGEBRD, then
!>
!>    A = (U*Q) * S * (P**H*VT)
!>
!> is the SVD of A.  Optionally, the subroutine may also compute Q**H*C
!> for a given complex input matrix C.
!>
!> See "Computing Small Singular Values of Bidiagonal Matrices With
!> Guaranteed High Relative Accuracy," by J. Demmel and W. Kahan,
!> LAPACK Working Note #3 (or SIAM J. Sci. Statist. Comput. vol. 11,
!> no. 5, pp. 873-912, Sept 1990) and
!> "Accurate singular values and differential qd algorithms," by
!> B. Parlett and V. Fernando, Technical Report CPAM-554, Mathematics
!> Department, University of California at Berkeley, July 1992
!> for a detailed description of the algorithm.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': B is upper bidiagonal; !> = 'L': B is lower bidiagonal. !>
[in]	N	!> N is INTEGER !> The order of the matrix B. N >= 0. !>
[in]	NCVT	!> NCVT is INTEGER !> The number of columns of the matrix VT. NCVT >= 0. !>
[in]	NRU	!> NRU is INTEGER !> The number of rows of the matrix U. NRU >= 0. !>
[in]	NCC	!> NCC is INTEGER !> The number of columns of the matrix C. NCC >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the n diagonal elements of the bidiagonal matrix B. !> On exit, if INFO=0, the singular values of B in decreasing !> order. !>
[in,out]	E	!> E is REAL array, dimension (N-1) !> On entry, the N-1 offdiagonal elements of the bidiagonal !> matrix B. !> On exit, if INFO = 0, E is destroyed; if INFO > 0, D and E !> will contain the diagonal and superdiagonal elements of a !> bidiagonal matrix orthogonally equivalent to the one given !> as input. !>
[in,out]	VT	!> VT is COMPLEX array, dimension (LDVT, NCVT) !> On entry, an N-by-NCVT matrix VT. !> On exit, VT is overwritten by P**H * VT. !> Not referenced if NCVT = 0. !>
[in]	LDVT	!> LDVT is INTEGER !> The leading dimension of the array VT. !> LDVT >= max(1,N) if NCVT > 0; LDVT >= 1 if NCVT = 0. !>
[in,out]	U	!> U is COMPLEX array, dimension (LDU, N) !> On entry, an NRU-by-N matrix U. !> On exit, U is overwritten by U * Q. !> Not referenced if NRU = 0. !>
[in]	LDU	!> LDU is INTEGER !> The leading dimension of the array U. LDU >= max(1,NRU). !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC, NCC) !> On entry, an N-by-NCC matrix C. !> On exit, C is overwritten by Q**H * C. !> Not referenced if NCC = 0. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. !> LDC >= max(1,N) if NCC > 0; LDC >=1 if NCC = 0. !>
[out]	RWORK	!> RWORK is REAL array, dimension (4*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: If INFO = -i, the i-th argument had an illegal value !> > 0: the algorithm did not converge; D and E contain the !> elements of a bidiagonal matrix which is orthogonally !> similar to the input matrix B; if INFO = i, i !> elements of E have not converged to zero. !>

Internal Parameters:

!>  TOLMUL  REAL, default = max(10,min(100,EPS**(-1/8)))
!>          TOLMUL controls the convergence criterion of the QR loop.
!>          If it is positive, TOLMUL*EPS is the desired relative
!>             precision in the computed singular values.
!>          If it is negative, abs(TOLMUL*EPS*sigma_max) is the
!>             desired absolute accuracy in the computed singular
!>             values (corresponds to relative accuracy
!>             abs(TOLMUL*EPS) in the largest singular value).
!>          abs(TOLMUL) should be between 1 and 1/EPS, and preferably
!>             between 10 (for fast convergence) and .1/EPS
!>             (for there to be some accuracy in the results).
!>          Default is to lose either one eighth or 2 of the
!>             available decimal digits in each computed singular value
!>             (whichever is smaller).
!>
!>  MAXITR  INTEGER, default = 6
!>          MAXITR controls the maximum number of passes of the
!>          algorithm through its inner loop. The algorithm stops
!>          (and so fails to converge) if the number of passes
!>          through the inner loop exceeds MAXITR*N**2.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 220 of file cbdsqr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDC, LDU, LDVT, N, NCC, NCVT, NRU
*     ..
*     .. Array Arguments ..
      REAL               D( * ), E( * ), RWORK( * )
      COMPLEX            C( LDC, * ), U( LDU, * ), VT( LDVT, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO
      parameter( zero = 0.0e0 )
      REAL               ONE
      parameter( one = 1.0e0 )
      REAL               NEGONE
      parameter( negone = -1.0e0 )
      REAL               HNDRTH
      parameter( hndrth = 0.01e0 )
      REAL               TEN
      parameter( ten = 10.0e0 )
      REAL               HNDRD
      parameter( hndrd = 100.0e0 )
      REAL               MEIGTH
      parameter( meigth = -0.125e0 )
      INTEGER            MAXITR
      parameter( maxitr = 6 )
*     ..
*     .. Local Scalars ..
      LOGICAL            LOWER, ROTATE
      INTEGER            I, IDIR, ISUB, ITER, J, LL, LLL, M, MAXIT, NM1,
     $                   NM12, NM13, OLDLL, OLDM
      REAL               ABSE, ABSS, COSL, COSR, CS, EPS, F, G, H, MU,
     $                   OLDCS, OLDSN, R, SHIFT, SIGMN, SIGMX, SINL,
     $                   SINR, SLL, SMAX, SMIN, SMINL, SMINOA,
     $                   SN, THRESH, TOL, TOLMUL, UNFL
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SLAMCH
      EXTERNAL           lsame, slamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           clasr, csrot, csscal, cswap, slartg, slas2,
     $                   slasq1, slasv2, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, real, sign, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      lower = lsame( uplo, 'L' )
      IF( .NOT.lsame( uplo, 'U' ) .AND. .NOT.lower ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ncvt.LT.0 ) THEN
         info = -3
      ELSE IF( nru.LT.0 ) THEN
         info = -4
      ELSE IF( ncc.LT.0 ) THEN
         info = -5
      ELSE IF( ( ncvt.EQ.0 .AND. ldvt.LT.1 ) .OR.
     $         ( ncvt.GT.0 .AND. ldvt.LT.max( 1, n ) ) ) THEN
         info = -9
      ELSE IF( ldu.LT.max( 1, nru ) ) THEN
         info = -11
      ELSE IF( ( ncc.EQ.0 .AND. ldc.LT.1 ) .OR.
     $         ( ncc.GT.0 .AND. ldc.LT.max( 1, n ) ) ) THEN
         info = -13
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CBDSQR', -info )
         RETURN
      END IF
      IF( n.EQ.0 )
     $   RETURN
      IF( n.EQ.1 )
     $   GO TO 160
*
*     ROTATE is true if any singular vectors desired, false otherwise
*
      rotate = ( ncvt.GT.0 ) .OR. ( nru.GT.0 ) .OR. ( ncc.GT.0 )
*
*     If no singular vectors desired, use qd algorithm
*
      IF( .NOT.rotate ) THEN
         CALL slasq1( n, d, e, rwork, info )
*
*     If INFO equals 2, dqds didn't finish, try to finish
*
         IF( info .NE. 2 ) RETURN
         info = 0
      END IF
*
      nm1 = n - 1
      nm12 = nm1 + nm1
      nm13 = nm12 + nm1
      idir = 0
*
*     Get machine constants
*
      eps = slamch( 'Epsilon' )
      unfl = slamch( 'Safe minimum' )
*
*     If matrix lower bidiagonal, rotate to be upper bidiagonal
*     by applying Givens rotations on the left
*
      IF( lower ) THEN
         DO 10 i = 1, n - 1
            CALL slartg( d( i ), e( i ), cs, sn, r )
            d( i ) = r
            e( i ) = sn*d( i+1 )
            d( i+1 ) = cs*d( i+1 )
            rwork( i ) = cs
            rwork( nm1+i ) = sn
   10    CONTINUE
*
*        Update singular vectors if desired
*
         IF( nru.GT.0 )
     $      CALL clasr( 'R', 'V', 'F', nru, n, rwork( 1 ), rwork( n ),
     $                  u, ldu )
         IF( ncc.GT.0 )
     $      CALL clasr( 'L', 'V', 'F', n, ncc, rwork( 1 ), rwork( n ),
     $                  c, ldc )
      END IF
*
*     Compute singular values to relative accuracy TOL
*     (By setting TOL to be negative, algorithm will compute
*     singular values to absolute accuracy ABS(TOL)*norm(input matrix))
*
      tolmul = max( ten, min( hndrd, eps**meigth ) )
      tol = tolmul*eps
*
*     Compute approximate maximum, minimum singular values
*
      smax = zero
      DO 20 i = 1, n
         smax = max( smax, abs( d( i ) ) )
   20 CONTINUE
      DO 30 i = 1, n - 1
         smax = max( smax, abs( e( i ) ) )
   30 CONTINUE
      sminl = zero
      IF( tol.GE.zero ) THEN
*
*        Relative accuracy desired
*
         sminoa = abs( d( 1 ) )
         IF( sminoa.EQ.zero )
     $      GO TO 50
         mu = sminoa
         DO 40 i = 2, n
            mu = abs( d( i ) )*( mu / ( mu+abs( e( i-1 ) ) ) )
            sminoa = min( sminoa, mu )
            IF( sminoa.EQ.zero )
     $         GO TO 50
   40    CONTINUE
   50    CONTINUE
         sminoa = sminoa / sqrt( real( n ) )
         thresh = max( tol*sminoa, maxitr*n*n*unfl )
      ELSE
*
*        Absolute accuracy desired
*
         thresh = max( abs( tol )*smax, maxitr*n*n*unfl )
      END IF
*
*     Prepare for main iteration loop for the singular values
*     (MAXIT is the maximum number of passes through the inner
*     loop permitted before nonconvergence signalled.)
*
      maxit = maxitr*n*n
      iter = 0
      oldll = -1
      oldm = -1
*
*     M points to last element of unconverged part of matrix
*
      m = n
*
*     Begin main iteration loop
*
   60 CONTINUE
*
*     Check for convergence or exceeding iteration count
*
      IF( m.LE.1 )
     $   GO TO 160
      IF( iter.GT.maxit )
     $   GO TO 200
*
*     Find diagonal block of matrix to work on
*
      IF( tol.LT.zero .AND. abs( d( m ) ).LE.thresh )
     $   d( m ) = zero
      smax = abs( d( m ) )
      smin = smax
      DO 70 lll = 1, m - 1
         ll = m - lll
         abss = abs( d( ll ) )
         abse = abs( e( ll ) )
         IF( tol.LT.zero .AND. abss.LE.thresh )
     $      d( ll ) = zero
         IF( abse.LE.thresh )
     $      GO TO 80
         smin = min( smin, abss )
         smax = max( smax, abss, abse )
   70 CONTINUE
      ll = 0
      GO TO 90
   80 CONTINUE
      e( ll ) = zero
*
*     Matrix splits since E(LL) = 0
*
      IF( ll.EQ.m-1 ) THEN
*
*        Convergence of bottom singular value, return to top of loop
*
         m = m - 1
         GO TO 60
      END IF
   90 CONTINUE
      ll = ll + 1
*
*     E(LL) through E(M-1) are nonzero, E(LL-1) is zero
*
      IF( ll.EQ.m-1 ) THEN
*
*        2 by 2 block, handle separately
*
         CALL slasv2( d( m-1 ), e( m-1 ), d( m ), sigmn, sigmx, sinr,
     $                cosr, sinl, cosl )
         d( m-1 ) = sigmx
         e( m-1 ) = zero
         d( m ) = sigmn
*
*        Compute singular vectors, if desired
*
         IF( ncvt.GT.0 )
     $      CALL csrot( ncvt, vt( m-1, 1 ), ldvt, vt( m, 1 ), ldvt,
     $                  cosr, sinr )
         IF( nru.GT.0 )
     $      CALL csrot( nru, u( 1, m-1 ), 1, u( 1, m ), 1, cosl, sinl )
         IF( ncc.GT.0 )
     $      CALL csrot( ncc, c( m-1, 1 ), ldc, c( m, 1 ), ldc, cosl,
     $                  sinl )
         m = m - 2
         GO TO 60
      END IF
*
*     If working on new submatrix, choose shift direction
*     (from larger end diagonal element towards smaller)
*
      IF( ll.GT.oldm .OR. m.LT.oldll ) THEN
         IF( abs( d( ll ) ).GE.abs( d( m ) ) ) THEN
*
*           Chase bulge from top (big end) to bottom (small end)
*
            idir = 1
         ELSE
*
*           Chase bulge from bottom (big end) to top (small end)
*
            idir = 2
         END IF
      END IF
*
*     Apply convergence tests
*
      IF( idir.EQ.1 ) THEN
*
*        Run convergence test in forward direction
*        First apply standard test to bottom of matrix
*
         IF( abs( e( m-1 ) ).LE.abs( tol )*abs( d( m ) ) .OR.
     $       ( tol.LT.zero .AND. abs( e( m-1 ) ).LE.thresh ) ) THEN
            e( m-1 ) = zero
            GO TO 60
         END IF
*
         IF( tol.GE.zero ) THEN
*
*           If relative accuracy desired,
*           apply convergence criterion forward
*
            mu = abs( d( ll ) )
            sminl = mu
            DO 100 lll = ll, m - 1
               IF( abs( e( lll ) ).LE.tol*mu ) THEN
                  e( lll ) = zero
                  GO TO 60
               END IF
               mu = abs( d( lll+1 ) )*( mu / ( mu+abs( e( lll ) ) ) )
               sminl = min( sminl, mu )
  100       CONTINUE
         END IF
*
      ELSE
*
*        Run convergence test in backward direction
*        First apply standard test to top of matrix
*
         IF( abs( e( ll ) ).LE.abs( tol )*abs( d( ll ) ) .OR.
     $       ( tol.LT.zero .AND. abs( e( ll ) ).LE.thresh ) ) THEN
            e( ll ) = zero
            GO TO 60
         END IF
*
         IF( tol.GE.zero ) THEN
*
*           If relative accuracy desired,
*           apply convergence criterion backward
*
            mu = abs( d( m ) )
            sminl = mu
            DO 110 lll = m - 1, ll, -1
               IF( abs( e( lll ) ).LE.tol*mu ) THEN
                  e( lll ) = zero
                  GO TO 60
               END IF
               mu = abs( d( lll ) )*( mu / ( mu+abs( e( lll ) ) ) )
               sminl = min( sminl, mu )
  110       CONTINUE
         END IF
      END IF
      oldll = ll
      oldm = m
*
*     Compute shift.  First, test if shifting would ruin relative
*     accuracy, and if so set the shift to zero.
*
      IF( tol.GE.zero .AND. n*tol*( sminl / smax ).LE.
     $    max( eps, hndrth*tol ) ) THEN
*
*        Use a zero shift to avoid loss of relative accuracy
*
         shift = zero
      ELSE
*
*        Compute the shift from 2-by-2 block at end of matrix
*
         IF( idir.EQ.1 ) THEN
            sll = abs( d( ll ) )
            CALL slas2( d( m-1 ), e( m-1 ), d( m ), shift, r )
         ELSE
            sll = abs( d( m ) )
            CALL slas2( d( ll ), e( ll ), d( ll+1 ), shift, r )
         END IF
*
*        Test if shift negligible, and if so set to zero
*
         IF( sll.GT.zero ) THEN
            IF( ( shift / sll )**2.LT.eps )
     $         shift = zero
         END IF
      END IF
*
*     Increment iteration count
*
      iter = iter + m - ll
*
*     If SHIFT = 0, do simplified QR iteration
*
      IF( shift.EQ.zero ) THEN
         IF( idir.EQ.1 ) THEN
*
*           Chase bulge from top to bottom
*           Save cosines and sines for later singular vector updates
*
            cs = one
            oldcs = one
            DO 120 i = ll, m - 1
               CALL slartg( d( i )*cs, e( i ), cs, sn, r )
               IF( i.GT.ll )
     $            e( i-1 ) = oldsn*r
               CALL slartg( oldcs*r, d( i+1 )*sn, oldcs, oldsn, d( i ) )
               rwork( i-ll+1 ) = cs
               rwork( i-ll+1+nm1 ) = sn
               rwork( i-ll+1+nm12 ) = oldcs
               rwork( i-ll+1+nm13 ) = oldsn
  120       CONTINUE
            h = d( m )*cs
            d( m ) = h*oldcs
            e( m-1 ) = h*oldsn
*
*           Update singular vectors
*
            IF( ncvt.GT.0 )
     $         CALL clasr( 'L', 'V', 'F', m-ll+1, ncvt, rwork( 1 ),
     $                     rwork( n ), vt( ll, 1 ), ldvt )
            IF( nru.GT.0 )
     $         CALL clasr( 'R', 'V', 'F', nru, m-ll+1, rwork( nm12+1 ),
     $                     rwork( nm13+1 ), u( 1, ll ), ldu )
            IF( ncc.GT.0 )
     $         CALL clasr( 'L', 'V', 'F', m-ll+1, ncc, rwork( nm12+1 ),
     $                     rwork( nm13+1 ), c( ll, 1 ), ldc )
*
*           Test convergence
*
            IF( abs( e( m-1 ) ).LE.thresh )
     $         e( m-1 ) = zero
*
         ELSE
*
*           Chase bulge from bottom to top
*           Save cosines and sines for later singular vector updates
*
            cs = one
            oldcs = one
            DO 130 i = m, ll + 1, -1
               CALL slartg( d( i )*cs, e( i-1 ), cs, sn, r )
               IF( i.LT.m )
     $            e( i ) = oldsn*r
               CALL slartg( oldcs*r, d( i-1 )*sn, oldcs, oldsn, d( i ) )
               rwork( i-ll ) = cs
               rwork( i-ll+nm1 ) = -sn
               rwork( i-ll+nm12 ) = oldcs
               rwork( i-ll+nm13 ) = -oldsn
  130       CONTINUE
            h = d( ll )*cs
            d( ll ) = h*oldcs
            e( ll ) = h*oldsn
*
*           Update singular vectors
*
            IF( ncvt.GT.0 )
     $         CALL clasr( 'L', 'V', 'B', m-ll+1, ncvt, rwork( nm12+1 ),
     $                     rwork( nm13+1 ), vt( ll, 1 ), ldvt )
            IF( nru.GT.0 )
     $         CALL clasr( 'R', 'V', 'B', nru, m-ll+1, rwork( 1 ),
     $                     rwork( n ), u( 1, ll ), ldu )
            IF( ncc.GT.0 )
     $         CALL clasr( 'L', 'V', 'B', m-ll+1, ncc, rwork( 1 ),
     $                     rwork( n ), c( ll, 1 ), ldc )
*
*           Test convergence
*
            IF( abs( e( ll ) ).LE.thresh )
     $         e( ll ) = zero
         END IF
      ELSE
*
*        Use nonzero shift
*
         IF( idir.EQ.1 ) THEN
*
*           Chase bulge from top to bottom
*           Save cosines and sines for later singular vector updates
*
            f = ( abs( d( ll ) )-shift )*
     $          ( sign( one, d( ll ) )+shift / d( ll ) )
            g = e( ll )
            DO 140 i = ll, m - 1
               CALL slartg( f, g, cosr, sinr, r )
               IF( i.GT.ll )
     $            e( i-1 ) = r
               f = cosr*d( i ) + sinr*e( i )
               e( i ) = cosr*e( i ) - sinr*d( i )
               g = sinr*d( i+1 )
               d( i+1 ) = cosr*d( i+1 )
               CALL slartg( f, g, cosl, sinl, r )
               d( i ) = r
               f = cosl*e( i ) + sinl*d( i+1 )
               d( i+1 ) = cosl*d( i+1 ) - sinl*e( i )
               IF( i.LT.m-1 ) THEN
                  g = sinl*e( i+1 )
                  e( i+1 ) = cosl*e( i+1 )
               END IF
               rwork( i-ll+1 ) = cosr
               rwork( i-ll+1+nm1 ) = sinr
               rwork( i-ll+1+nm12 ) = cosl
               rwork( i-ll+1+nm13 ) = sinl
  140       CONTINUE
            e( m-1 ) = f
*
*           Update singular vectors
*
            IF( ncvt.GT.0 )
     $         CALL clasr( 'L', 'V', 'F', m-ll+1, ncvt, rwork( 1 ),
     $                     rwork( n ), vt( ll, 1 ), ldvt )
            IF( nru.GT.0 )
     $         CALL clasr( 'R', 'V', 'F', nru, m-ll+1, rwork( nm12+1 ),
     $                     rwork( nm13+1 ), u( 1, ll ), ldu )
            IF( ncc.GT.0 )
     $         CALL clasr( 'L', 'V', 'F', m-ll+1, ncc, rwork( nm12+1 ),
     $                     rwork( nm13+1 ), c( ll, 1 ), ldc )
*
*           Test convergence
*
            IF( abs( e( m-1 ) ).LE.thresh )
     $         e( m-1 ) = zero
*
         ELSE
*
*           Chase bulge from bottom to top
*           Save cosines and sines for later singular vector updates
*
            f = ( abs( d( m ) )-shift )*( sign( one, d( m ) )+shift /
     $          d( m ) )
            g = e( m-1 )
            DO 150 i = m, ll + 1, -1
               CALL slartg( f, g, cosr, sinr, r )
               IF( i.LT.m )
     $            e( i ) = r
               f = cosr*d( i ) + sinr*e( i-1 )
               e( i-1 ) = cosr*e( i-1 ) - sinr*d( i )
               g = sinr*d( i-1 )
               d( i-1 ) = cosr*d( i-1 )
               CALL slartg( f, g, cosl, sinl, r )
               d( i ) = r
               f = cosl*e( i-1 ) + sinl*d( i-1 )
               d( i-1 ) = cosl*d( i-1 ) - sinl*e( i-1 )
               IF( i.GT.ll+1 ) THEN
                  g = sinl*e( i-2 )
                  e( i-2 ) = cosl*e( i-2 )
               END IF
               rwork( i-ll ) = cosr
               rwork( i-ll+nm1 ) = -sinr
               rwork( i-ll+nm12 ) = cosl
               rwork( i-ll+nm13 ) = -sinl
  150       CONTINUE
            e( ll ) = f
*
*           Test convergence
*
            IF( abs( e( ll ) ).LE.thresh )
     $         e( ll ) = zero
*
*           Update singular vectors if desired
*
            IF( ncvt.GT.0 )
     $         CALL clasr( 'L', 'V', 'B', m-ll+1, ncvt, rwork( nm12+1 ),
     $                     rwork( nm13+1 ), vt( ll, 1 ), ldvt )
            IF( nru.GT.0 )
     $         CALL clasr( 'R', 'V', 'B', nru, m-ll+1, rwork( 1 ),
     $                     rwork( n ), u( 1, ll ), ldu )
            IF( ncc.GT.0 )
     $         CALL clasr( 'L', 'V', 'B', m-ll+1, ncc, rwork( 1 ),
     $                     rwork( n ), c( ll, 1 ), ldc )
         END IF
      END IF
*
*     QR iteration finished, go back and check convergence
*
      GO TO 60
*
*     All singular values converged, so make them positive
*
  160 CONTINUE
      DO 170 i = 1, n
         IF( d( i ).LT.zero ) THEN
            d( i ) = -d( i )
*
*           Change sign of singular vectors, if desired
*
            IF( ncvt.GT.0 )
     $         CALL csscal( ncvt, negone, vt( i, 1 ), ldvt )
         END IF
  170 CONTINUE
*
*     Sort the singular values into decreasing order (insertion sort on
*     singular values, but only one transposition per singular vector)
*
      DO 190 i = 1, n - 1
*
*        Scan for smallest D(I)
*
         isub = 1
         smin = d( 1 )
         DO 180 j = 2, n + 1 - i
            IF( d( j ).LE.smin ) THEN
               isub = j
               smin = d( j )
            END IF
  180    CONTINUE
         IF( isub.NE.n+1-i ) THEN
*
*           Swap singular values and vectors
*
            d( isub ) = d( n+1-i )
            d( n+1-i ) = smin
            IF( ncvt.GT.0 )
     $         CALL cswap( ncvt, vt( isub, 1 ), ldvt, vt( n+1-i, 1 ),
     $                     ldvt )
            IF( nru.GT.0 )
     $         CALL cswap( nru, u( 1, isub ), 1, u( 1, n+1-i ), 1 )
            IF( ncc.GT.0 )
     $         CALL cswap( ncc, c( isub, 1 ), ldc, c( n+1-i, 1 ), ldc )
         END IF
  190 CONTINUE
      GO TO 220
*
*     Maximum number of iterations exceeded, failure to converge
*
  200 CONTINUE
      info = 0
      DO 210 i = 1, n - 1
         IF( e( i ).NE.zero )
     $      info = info + 1
  210 CONTINUE
  220 CONTINUE
      RETURN
*
*     End of CBDSQR
*

◆ cgghd3()

subroutine cgghd3	(	character	compq,
		character	compz,
		integer	n,
		integer	ilo,
		integer	ihi,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		complex, dimension( ldz, * )	z,
		integer	ldz,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CGGHD3

Download CGGHD3 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!>
!> CGGHD3 reduces a pair of complex matrices (A,B) to generalized upper
!> Hessenberg form using unitary transformations, where A is a
!> general matrix and B is upper triangular.  The form of the
!> generalized eigenvalue problem is
!>    A*x = lambda*B*x,
!> and B is typically made upper triangular by computing its QR
!> factorization and moving the unitary matrix Q to the left side
!> of the equation.
!>
!> This subroutine simultaneously reduces A to a Hessenberg matrix H:
!>    Q**H*A*Z = H
!> and transforms B to another upper triangular matrix T:
!>    Q**H*B*Z = T
!> in order to reduce the problem to its standard form
!>    H*y = lambda*T*y
!> where y = Z**H*x.
!>
!> The unitary matrices Q and Z are determined as products of Givens
!> rotations.  They may either be formed explicitly, or they may be
!> postmultiplied into input matrices Q1 and Z1, so that
!>
!>      Q1 * A * Z1**H = (Q1*Q) * H * (Z1*Z)**H
!>
!>      Q1 * B * Z1**H = (Q1*Q) * T * (Z1*Z)**H
!>
!> If Q1 is the unitary matrix from the QR factorization of B in the
!> original equation A*x = lambda*B*x, then CGGHD3 reduces the original
!> problem to generalized Hessenberg form.
!>
!> This is a blocked variant of CGGHRD, using matrix-matrix
!> multiplications for parts of the computation to enhance performance.
!>

Parameters

[in]	COMPQ	!> COMPQ is CHARACTER*1 !> = 'N': do not compute Q; !> = 'I': Q is initialized to the unit matrix, and the !> unitary matrix Q is returned; !> = 'V': Q must contain a unitary matrix Q1 on entry, !> and the product Q1*Q is returned. !>
[in]	COMPZ	!> COMPZ is CHARACTER*1 !> = 'N': do not compute Z; !> = 'I': Z is initialized to the unit matrix, and the !> unitary matrix Z is returned; !> = 'V': Z must contain a unitary matrix Z1 on entry, !> and the product Z1*Z is returned. !>
[in]	N	!> N is INTEGER !> The order of the matrices A and B. N >= 0. !>
[in]	ILO	!> ILO is INTEGER !>
[in]	IHI	!> IHI is INTEGER !> !> ILO and IHI mark the rows and columns of A which are to be !> reduced. It is assumed that A is already upper triangular !> in rows and columns 1:ILO-1 and IHI+1:N. ILO and IHI are !> normally set by a previous call to CGGBAL; otherwise they !> should be set to 1 and N respectively. !> 1 <= ILO <= IHI <= N, if N > 0; ILO=1 and IHI=0, if N=0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA, N) !> On entry, the N-by-N general matrix to be reduced. !> On exit, the upper triangle and the first subdiagonal of A !> are overwritten with the upper Hessenberg matrix H, and the !> rest is set to zero. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB, N) !> On entry, the N-by-N upper triangular matrix B. !> On exit, the upper triangular matrix T = Q**H B Z. The !> elements below the diagonal are set to zero. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[in,out]	Q	!> Q is COMPLEX array, dimension (LDQ, N) !> On entry, if COMPQ = 'V', the unitary matrix Q1, typically !> from the QR factorization of B. !> On exit, if COMPQ='I', the unitary matrix Q, and if !> COMPQ = 'V', the product Q1*Q. !> Not referenced if COMPQ='N'. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. !> LDQ >= N if COMPQ='V' or 'I'; LDQ >= 1 otherwise. !>
[in,out]	Z	!> Z is COMPLEX array, dimension (LDZ, N) !> On entry, if COMPZ = 'V', the unitary matrix Z1. !> On exit, if COMPZ='I', the unitary matrix Z, and if !> COMPZ = 'V', the product Z1*Z. !> Not referenced if COMPZ='N'. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. !> LDZ >= N if COMPZ='V' or 'I'; LDZ >= 1 otherwise. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (LWORK) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The length of the array WORK. LWORK >= 1. !> For optimum performance LWORK >= 6*N*NB, where NB is the !> optimal blocksize. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  This routine reduces A to Hessenberg form and maintains B in triangular form
!>  using a blocked variant of Moler and Stewart's original algorithm,
!>  as described by Kagstrom, Kressner, Quintana-Orti, and Quintana-Orti
!>  (BIT 2008).
!>

Definition at line 229 of file cgghd3.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*
      IMPLICIT NONE
*
*     .. Scalar Arguments ..
      CHARACTER          COMPQ, COMPZ
      INTEGER            IHI, ILO, INFO, LDA, LDB, LDQ, LDZ, N, LWORK
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), B( LDB, * ), Q( LDQ, * ),
     $                   Z( LDZ, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CONE, CZERO
      parameter( cone = ( 1.0e+0, 0.0e+0 ),
     $                     czero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            BLK22, INITQ, INITZ, LQUERY, WANTQ, WANTZ
      CHARACTER*1        COMPQ2, COMPZ2
      INTEGER            COLA, I, IERR, J, J0, JCOL, JJ, JROW, K,
     $                   KACC22, LEN, LWKOPT, N2NB, NB, NBLST, NBMIN,
     $                   NH, NNB, NX, PPW, PPWO, PW, TOP, TOPQ
      REAL               C
      COMPLEX            C1, C2, CTEMP, S, S1, S2, TEMP, TEMP1, TEMP2,
     $                   TEMP3
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      EXTERNAL           ilaenv, lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgghrd, clartg, claset, cunm22, crot, cgemm,
     $                   cgemv, ctrmv, clacpy, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          real, cmplx, conjg, max
*     ..
*     .. Executable Statements ..
*
*     Decode and test the input parameters.
*
      info = 0
      nb = ilaenv( 1, 'CGGHD3', ' ', n, ilo, ihi, -1 )
      lwkopt = max( 6*n*nb, 1 )
      work( 1 ) = cmplx( lwkopt )
      initq = lsame( compq, 'I' )
      wantq = initq .OR. lsame( compq, 'V' )
      initz = lsame( compz, 'I' )
      wantz = initz .OR. lsame( compz, 'V' )
      lquery = ( lwork.EQ.-1 )
*
      IF( .NOT.lsame( compq, 'N' ) .AND. .NOT.wantq ) THEN
         info = -1
      ELSE IF( .NOT.lsame( compz, 'N' ) .AND. .NOT.wantz ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( ilo.LT.1 ) THEN
         info = -4
      ELSE IF( ihi.GT.n .OR. ihi.LT.ilo-1 ) THEN
         info = -5
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -7
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -9
      ELSE IF( ( wantq .AND. ldq.LT.n ) .OR. ldq.LT.1 ) THEN
         info = -11
      ELSE IF( ( wantz .AND. ldz.LT.n ) .OR. ldz.LT.1 ) THEN
         info = -13
      ELSE IF( lwork.LT.1 .AND. .NOT.lquery ) THEN
         info = -15
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CGGHD3', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Initialize Q and Z if desired.
*
      IF( initq )
     $   CALL claset( 'All', n, n, czero, cone, q, ldq )
      IF( initz )
     $   CALL claset( 'All', n, n, czero, cone, z, ldz )
*
*     Zero out lower triangle of B.
*
      IF( n.GT.1 )
     $   CALL claset( 'Lower', n-1, n-1, czero, czero, b(2, 1), ldb )
*
*     Quick return if possible
*
      nh = ihi - ilo + 1
      IF( nh.LE.1 ) THEN
         work( 1 ) = cone
         RETURN
      END IF
*
*     Determine the blocksize.
*
      nbmin = ilaenv( 2, 'CGGHD3', ' ', n, ilo, ihi, -1 )
      IF( nb.GT.1 .AND. nb.LT.nh ) THEN
*
*        Determine when to use unblocked instead of blocked code.
*
         nx = max( nb, ilaenv( 3, 'CGGHD3', ' ', n, ilo, ihi, -1 ) )
         IF( nx.LT.nh ) THEN
*
*           Determine if workspace is large enough for blocked code.
*
            IF( lwork.LT.lwkopt ) THEN
*
*              Not enough workspace to use optimal NB:  determine the
*              minimum value of NB, and reduce NB or force use of
*              unblocked code.
*
               nbmin = max( 2, ilaenv( 2, 'CGGHD3', ' ', n, ilo, ihi,
     $                      -1 ) )
               IF( lwork.GE.6*n*nbmin ) THEN
                  nb = lwork / ( 6*n )
               ELSE
                  nb = 1
               END IF
            END IF
         END IF
      END IF
*
      IF( nb.LT.nbmin .OR. nb.GE.nh ) THEN
*
*        Use unblocked code below
*
         jcol = ilo
*
      ELSE
*
*        Use blocked code
*
         kacc22 = ilaenv( 16, 'CGGHD3', ' ', n, ilo, ihi, -1 )
         blk22 = kacc22.EQ.2
         DO jcol = ilo, ihi-2, nb
            nnb = min( nb, ihi-jcol-1 )
*
*           Initialize small unitary factors that will hold the
*           accumulated Givens rotations in workspace.
*           N2NB   denotes the number of 2*NNB-by-2*NNB factors
*           NBLST  denotes the (possibly smaller) order of the last
*                  factor.
*
            n2nb = ( ihi-jcol-1 ) / nnb - 1
            nblst = ihi - jcol - n2nb*nnb
            CALL claset( 'All', nblst, nblst, czero, cone, work, nblst )
            pw = nblst * nblst + 1
            DO i = 1, n2nb
               CALL claset( 'All', 2*nnb, 2*nnb, czero, cone,
     $                      work( pw ), 2*nnb )
               pw = pw + 4*nnb*nnb
            END DO
*
*           Reduce columns JCOL:JCOL+NNB-1 of A to Hessenberg form.
*
            DO j = jcol, jcol+nnb-1
*
*              Reduce Jth column of A. Store cosines and sines in Jth
*              column of A and B, respectively.
*
               DO i = ihi, j+2, -1
                  temp = a( i-1, j )
                  CALL clartg( temp, a( i, j ), c, s, a( i-1, j ) )
                  a( i, j ) = cmplx( c )
                  b( i, j ) = s
               END DO
*
*              Accumulate Givens rotations into workspace array.
*
               ppw  = ( nblst + 1 )*( nblst - 2 ) - j + jcol + 1
               len  = 2 + j - jcol
               jrow = j + n2nb*nnb + 2
               DO i = ihi, jrow, -1
                  ctemp = a( i, j )
                  s = b( i, j )
                  DO jj = ppw, ppw+len-1
                     temp = work( jj + nblst )
                     work( jj + nblst ) = ctemp*temp - s*work( jj )
                     work( jj ) = conjg( s )*temp + ctemp*work( jj )
                  END DO
                  len = len + 1
                  ppw = ppw - nblst - 1
               END DO
*
               ppwo = nblst*nblst + ( nnb+j-jcol-1 )*2*nnb + nnb
               j0 = jrow - nnb
               DO jrow = j0, j+2, -nnb
                  ppw = ppwo
                  len  = 2 + j - jcol
                  DO i = jrow+nnb-1, jrow, -1
                     ctemp = a( i, j )
                     s = b( i, j )
                     DO jj = ppw, ppw+len-1
                        temp = work( jj + 2*nnb )
                        work( jj + 2*nnb ) = ctemp*temp - s*work( jj )
                        work( jj ) = conjg( s )*temp + ctemp*work( jj )
                     END DO
                     len = len + 1
                     ppw = ppw - 2*nnb - 1
                  END DO
                  ppwo = ppwo + 4*nnb*nnb
               END DO
*
*              TOP denotes the number of top rows in A and B that will
*              not be updated during the next steps.
*
               IF( jcol.LE.2 ) THEN
                  top = 0
               ELSE
                  top = jcol
               END IF
*
*              Propagate transformations through B and replace stored
*              left sines/cosines by right sines/cosines.
*
               DO jj = n, j+1, -1
*
*                 Update JJth column of B.
*
                  DO i = min( jj+1, ihi ), j+2, -1
                     ctemp = a( i, j )
                     s = b( i, j )
                     temp = b( i, jj )
                     b( i, jj ) = ctemp*temp - conjg( s )*b( i-1, jj )
                     b( i-1, jj ) = s*temp + ctemp*b( i-1, jj )
                  END DO
*
*                 Annihilate B( JJ+1, JJ ).
*
                  IF( jj.LT.ihi ) THEN
                     temp = b( jj+1, jj+1 )
                     CALL clartg( temp, b( jj+1, jj ), c, s,
     $                            b( jj+1, jj+1 ) )
                     b( jj+1, jj ) = czero
                     CALL crot( jj-top, b( top+1, jj+1 ), 1,
     $                          b( top+1, jj ), 1, c, s )
                     a( jj+1, j ) = cmplx( c )
                     b( jj+1, j ) = -conjg( s )
                  END IF
               END DO
*
*              Update A by transformations from right.
*
               jj = mod( ihi-j-1, 3 )
               DO i = ihi-j-3, jj+1, -3
                  ctemp = a( j+1+i, j )
                  s = -b( j+1+i, j )
                  c1 = a( j+2+i, j )
                  s1 = -b( j+2+i, j )
                  c2 = a( j+3+i, j )
                  s2 = -b( j+3+i, j )
*
                  DO k = top+1, ihi
                     temp = a( k, j+i  )
                     temp1 = a( k, j+i+1 )
                     temp2 = a( k, j+i+2 )
                     temp3 = a( k, j+i+3 )
                     a( k, j+i+3 ) = c2*temp3 + conjg( s2 )*temp2
                     temp2 = -s2*temp3 + c2*temp2
                     a( k, j+i+2 ) = c1*temp2 + conjg( s1 )*temp1
                     temp1 = -s1*temp2 + c1*temp1
                     a( k, j+i+1 ) = ctemp*temp1 + conjg( s )*temp
                     a( k, j+i ) = -s*temp1 + ctemp*temp
                  END DO
               END DO
*
               IF( jj.GT.0 ) THEN
                  DO i = jj, 1, -1
                     c = dble( a( j+1+i, j ) )
                     CALL crot( ihi-top, a( top+1, j+i+1 ), 1,
     $                          a( top+1, j+i ), 1, c,
     $                          -conjg( b( j+1+i, j ) ) )
                  END DO
               END IF
*
*              Update (J+1)th column of A by transformations from left.
*
               IF ( j .LT. jcol + nnb - 1 ) THEN
                  len  = 1 + j - jcol
*
*                 Multiply with the trailing accumulated unitary
*                 matrix, which takes the form
*
*                        [  U11  U12  ]
*                    U = [            ],
*                        [  U21  U22  ]
*
*                 where U21 is a LEN-by-LEN matrix and U12 is lower
*                 triangular.
*
                  jrow = ihi - nblst + 1
                  CALL cgemv( 'Conjugate', nblst, len, cone, work,
     $                        nblst, a( jrow, j+1 ), 1, czero,
     $                        work( pw ), 1 )
                  ppw = pw + len
                  DO i = jrow, jrow+nblst-len-1
                     work( ppw ) = a( i, j+1 )
                     ppw = ppw + 1
                  END DO
                  CALL ctrmv( 'Lower', 'Conjugate', 'Non-unit',
     $                        nblst-len, work( len*nblst + 1 ), nblst,
     $                        work( pw+len ), 1 )
                  CALL cgemv( 'Conjugate', len, nblst-len, cone,
     $                        work( (len+1)*nblst - len + 1 ), nblst,
     $                        a( jrow+nblst-len, j+1 ), 1, cone,
     $                        work( pw+len ), 1 )
                  ppw = pw
                  DO i = jrow, jrow+nblst-1
                     a( i, j+1 ) = work( ppw )
                     ppw = ppw + 1
                  END DO
*
*                 Multiply with the other accumulated unitary
*                 matrices, which take the form
*
*                        [  U11  U12   0  ]
*                        [                ]
*                    U = [  U21  U22   0  ],
*                        [                ]
*                        [   0    0    I  ]
*
*                 where I denotes the (NNB-LEN)-by-(NNB-LEN) identity
*                 matrix, U21 is a LEN-by-LEN upper triangular matrix
*                 and U12 is an NNB-by-NNB lower triangular matrix.
*
                  ppwo = 1 + nblst*nblst
                  j0 = jrow - nnb
                  DO jrow = j0, jcol+1, -nnb
                     ppw = pw + len
                     DO i = jrow, jrow+nnb-1
                        work( ppw ) = a( i, j+1 )
                        ppw = ppw + 1
                     END DO
                     ppw = pw
                     DO i = jrow+nnb, jrow+nnb+len-1
                        work( ppw ) = a( i, j+1 )
                        ppw = ppw + 1
                     END DO
                     CALL ctrmv( 'Upper', 'Conjugate', 'Non-unit', len,
     $                           work( ppwo + nnb ), 2*nnb, work( pw ),
     $                           1 )
                     CALL ctrmv( 'Lower', 'Conjugate', 'Non-unit', nnb,
     $                           work( ppwo + 2*len*nnb ),
     $                           2*nnb, work( pw + len ), 1 )
                     CALL cgemv( 'Conjugate', nnb, len, cone,
     $                           work( ppwo ), 2*nnb, a( jrow, j+1 ), 1,
     $                           cone, work( pw ), 1 )
                     CALL cgemv( 'Conjugate', len, nnb, cone,
     $                           work( ppwo + 2*len*nnb + nnb ), 2*nnb,
     $                           a( jrow+nnb, j+1 ), 1, cone,
     $                           work( pw+len ), 1 )
                     ppw = pw
                     DO i = jrow, jrow+len+nnb-1
                        a( i, j+1 ) = work( ppw )
                        ppw = ppw + 1
                     END DO
                     ppwo = ppwo + 4*nnb*nnb
                  END DO
               END IF
            END DO
*
*           Apply accumulated unitary matrices to A.
*
            cola = n - jcol - nnb + 1
            j = ihi - nblst + 1
            CALL cgemm( 'Conjugate', 'No Transpose', nblst,
     $                  cola, nblst, cone, work, nblst,
     $                  a( j, jcol+nnb ), lda, czero, work( pw ),
     $                  nblst )
            CALL clacpy( 'All', nblst, cola, work( pw ), nblst,
     $                   a( j, jcol+nnb ), lda )
            ppwo = nblst*nblst + 1
            j0 = j - nnb
            DO j = j0, jcol+1, -nnb
               IF ( blk22 ) THEN
*
*                 Exploit the structure of
*
*                        [  U11  U12  ]
*                    U = [            ]
*                        [  U21  U22  ],
*
*                 where all blocks are NNB-by-NNB, U21 is upper
*                 triangular and U12 is lower triangular.
*
                  CALL cunm22( 'Left', 'Conjugate', 2*nnb, cola, nnb,
     $                         nnb, work( ppwo ), 2*nnb,
     $                         a( j, jcol+nnb ), lda, work( pw ),
     $                         lwork-pw+1, ierr )
               ELSE
*
*                 Ignore the structure of U.
*
                  CALL cgemm( 'Conjugate', 'No Transpose', 2*nnb,
     $                        cola, 2*nnb, cone, work( ppwo ), 2*nnb,
     $                        a( j, jcol+nnb ), lda, czero, work( pw ),
     $                        2*nnb )
                  CALL clacpy( 'All', 2*nnb, cola, work( pw ), 2*nnb,
     $                         a( j, jcol+nnb ), lda )
               END IF
               ppwo = ppwo + 4*nnb*nnb
            END DO
*
*           Apply accumulated unitary matrices to Q.
*
            IF( wantq ) THEN
               j = ihi - nblst + 1
               IF ( initq ) THEN
                  topq = max( 2, j - jcol + 1 )
                  nh  = ihi - topq + 1
               ELSE
                  topq = 1
                  nh = n
               END IF
               CALL cgemm( 'No Transpose', 'No Transpose', nh,
     $                     nblst, nblst, cone, q( topq, j ), ldq,
     $                     work, nblst, czero, work( pw ), nh )
               CALL clacpy( 'All', nh, nblst, work( pw ), nh,
     $                      q( topq, j ), ldq )
               ppwo = nblst*nblst + 1
               j0 = j - nnb
               DO j = j0, jcol+1, -nnb
                  IF ( initq ) THEN
                     topq = max( 2, j - jcol + 1 )
                     nh  = ihi - topq + 1
                  END IF
                  IF ( blk22 ) THEN
*
*                    Exploit the structure of U.
*
                     CALL cunm22( 'Right', 'No Transpose', nh, 2*nnb,
     $                            nnb, nnb, work( ppwo ), 2*nnb,
     $                            q( topq, j ), ldq, work( pw ),
     $                            lwork-pw+1, ierr )
                  ELSE
*
*                    Ignore the structure of U.
*
                     CALL cgemm( 'No Transpose', 'No Transpose', nh,
     $                           2*nnb, 2*nnb, cone, q( topq, j ), ldq,
     $                           work( ppwo ), 2*nnb, czero, work( pw ),
     $                           nh )
                     CALL clacpy( 'All', nh, 2*nnb, work( pw ), nh,
     $                            q( topq, j ), ldq )
                  END IF
                  ppwo = ppwo + 4*nnb*nnb
               END DO
            END IF
*
*           Accumulate right Givens rotations if required.
*
            IF ( wantz .OR. top.GT.0 ) THEN
*
*              Initialize small unitary factors that will hold the
*              accumulated Givens rotations in workspace.
*
               CALL claset( 'All', nblst, nblst, czero, cone, work,
     $                      nblst )
               pw = nblst * nblst + 1
               DO i = 1, n2nb
                  CALL claset( 'All', 2*nnb, 2*nnb, czero, cone,
     $                         work( pw ), 2*nnb )
                  pw = pw + 4*nnb*nnb
               END DO
*
*              Accumulate Givens rotations into workspace array.
*
               DO j = jcol, jcol+nnb-1
                  ppw  = ( nblst + 1 )*( nblst - 2 ) - j + jcol + 1
                  len  = 2 + j - jcol
                  jrow = j + n2nb*nnb + 2
                  DO i = ihi, jrow, -1
                     ctemp = a( i, j )
                     a( i, j ) = czero
                     s = b( i, j )
                     b( i, j ) = czero
                     DO jj = ppw, ppw+len-1
                        temp = work( jj + nblst )
                        work( jj + nblst ) = ctemp*temp -
     $                                       conjg( s )*work( jj )
                        work( jj ) = s*temp + ctemp*work( jj )
                     END DO
                     len = len + 1
                     ppw = ppw - nblst - 1
                  END DO
*
                  ppwo = nblst*nblst + ( nnb+j-jcol-1 )*2*nnb + nnb
                  j0 = jrow - nnb
                  DO jrow = j0, j+2, -nnb
                     ppw = ppwo
                     len  = 2 + j - jcol
                     DO i = jrow+nnb-1, jrow, -1
                        ctemp = a( i, j )
                        a( i, j ) = czero
                        s = b( i, j )
                        b( i, j ) = czero
                        DO jj = ppw, ppw+len-1
                           temp = work( jj + 2*nnb )
                           work( jj + 2*nnb ) = ctemp*temp -
     $                                          conjg( s )*work( jj )
                           work( jj ) = s*temp + ctemp*work( jj )
                        END DO
                        len = len + 1
                        ppw = ppw - 2*nnb - 1
                     END DO
                     ppwo = ppwo + 4*nnb*nnb
                  END DO
               END DO
            ELSE
*
               CALL claset( 'Lower', ihi - jcol - 1, nnb, czero, czero,
     $                      a( jcol + 2, jcol ), lda )
               CALL claset( 'Lower', ihi - jcol - 1, nnb, czero, czero,
     $                      b( jcol + 2, jcol ), ldb )
            END IF
*
*           Apply accumulated unitary matrices to A and B.
*
            IF ( top.GT.0 ) THEN
               j = ihi - nblst + 1
               CALL cgemm( 'No Transpose', 'No Transpose', top,
     $                     nblst, nblst, cone, a( 1, j ), lda,
     $                     work, nblst, czero, work( pw ), top )
               CALL clacpy( 'All', top, nblst, work( pw ), top,
     $                      a( 1, j ), lda )
               ppwo = nblst*nblst + 1
               j0 = j - nnb
               DO j = j0, jcol+1, -nnb
                  IF ( blk22 ) THEN
*
*                    Exploit the structure of U.
*
                     CALL cunm22( 'Right', 'No Transpose', top, 2*nnb,
     $                            nnb, nnb, work( ppwo ), 2*nnb,
     $                            a( 1, j ), lda, work( pw ),
     $                            lwork-pw+1, ierr )
                  ELSE
*
*                    Ignore the structure of U.
*
                     CALL cgemm( 'No Transpose', 'No Transpose', top,
     $                           2*nnb, 2*nnb, cone, a( 1, j ), lda,
     $                           work( ppwo ), 2*nnb, czero,
     $                           work( pw ), top )
                     CALL clacpy( 'All', top, 2*nnb, work( pw ), top,
     $                            a( 1, j ), lda )
                  END IF
                  ppwo = ppwo + 4*nnb*nnb
               END DO
*
               j = ihi - nblst + 1
               CALL cgemm( 'No Transpose', 'No Transpose', top,
     $                     nblst, nblst, cone, b( 1, j ), ldb,
     $                     work, nblst, czero, work( pw ), top )
               CALL clacpy( 'All', top, nblst, work( pw ), top,
     $                      b( 1, j ), ldb )
               ppwo = nblst*nblst + 1
               j0 = j - nnb
               DO j = j0, jcol+1, -nnb
                  IF ( blk22 ) THEN
*
*                    Exploit the structure of U.
*
                     CALL cunm22( 'Right', 'No Transpose', top, 2*nnb,
     $                            nnb, nnb, work( ppwo ), 2*nnb,
     $                            b( 1, j ), ldb, work( pw ),
     $                            lwork-pw+1, ierr )
                  ELSE
*
*                    Ignore the structure of U.
*
                     CALL cgemm( 'No Transpose', 'No Transpose', top,
     $                           2*nnb, 2*nnb, cone, b( 1, j ), ldb,
     $                           work( ppwo ), 2*nnb, czero,
     $                           work( pw ), top )
                     CALL clacpy( 'All', top, 2*nnb, work( pw ), top,
     $                            b( 1, j ), ldb )
                  END IF
                  ppwo = ppwo + 4*nnb*nnb
               END DO
            END IF
*
*           Apply accumulated unitary matrices to Z.
*
            IF( wantz ) THEN
               j = ihi - nblst + 1
               IF ( initq ) THEN
                  topq = max( 2, j - jcol + 1 )
                  nh  = ihi - topq + 1
               ELSE
                  topq = 1
                  nh = n
               END IF
               CALL cgemm( 'No Transpose', 'No Transpose', nh,
     $                     nblst, nblst, cone, z( topq, j ), ldz,
     $                     work, nblst, czero, work( pw ), nh )
               CALL clacpy( 'All', nh, nblst, work( pw ), nh,
     $                      z( topq, j ), ldz )
               ppwo = nblst*nblst + 1
               j0 = j - nnb
               DO j = j0, jcol+1, -nnb
                     IF ( initq ) THEN
                     topq = max( 2, j - jcol + 1 )
                     nh  = ihi - topq + 1
                  END IF
                  IF ( blk22 ) THEN
*
*                    Exploit the structure of U.
*
                     CALL cunm22( 'Right', 'No Transpose', nh, 2*nnb,
     $                            nnb, nnb, work( ppwo ), 2*nnb,
     $                            z( topq, j ), ldz, work( pw ),
     $                            lwork-pw+1, ierr )
                  ELSE
*
*                    Ignore the structure of U.
*
                     CALL cgemm( 'No Transpose', 'No Transpose', nh,
     $                           2*nnb, 2*nnb, cone, z( topq, j ), ldz,
     $                           work( ppwo ), 2*nnb, czero, work( pw ),
     $                           nh )
                     CALL clacpy( 'All', nh, 2*nnb, work( pw ), nh,
     $                            z( topq, j ), ldz )
                  END IF
                  ppwo = ppwo + 4*nnb*nnb
               END DO
            END IF
         END DO
      END IF
*
*     Use unblocked code to reduce the rest of the matrix
*     Avoid re-initialization of modified Q and Z.
*
      compq2 = compq
      compz2 = compz
      IF ( jcol.NE.ilo ) THEN
         IF ( wantq )
     $      compq2 = 'V'
         IF ( wantz )
     $      compz2 = 'V'
      END IF
*
      IF ( jcol.LT.ihi )
     $   CALL cgghrd( compq2, compz2, n, jcol, ihi, a, lda, b, ldb, q,
     $                ldq, z, ldz, ierr )
      work( 1 ) = cmplx( lwkopt )
*
      RETURN
*
*     End of CGGHD3
*

◆ cgghrd()

subroutine cgghrd	(	character	compq,
		character	compz,
		integer	n,
		integer	ilo,
		integer	ihi,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		complex, dimension( ldz, * )	z,
		integer	ldz,
		integer	info )

CGGHRD

Download CGGHRD + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CGGHRD reduces a pair of complex matrices (A,B) to generalized upper
!> Hessenberg form using unitary transformations, where A is a
!> general matrix and B is upper triangular.  The form of the generalized
!> eigenvalue problem is
!>    A*x = lambda*B*x,
!> and B is typically made upper triangular by computing its QR
!> factorization and moving the unitary matrix Q to the left side
!> of the equation.
!>
!> This subroutine simultaneously reduces A to a Hessenberg matrix H:
!>    Q**H*A*Z = H
!> and transforms B to another upper triangular matrix T:
!>    Q**H*B*Z = T
!> in order to reduce the problem to its standard form
!>    H*y = lambda*T*y
!> where y = Z**H*x.
!>
!> The unitary matrices Q and Z are determined as products of Givens
!> rotations.  They may either be formed explicitly, or they may be
!> postmultiplied into input matrices Q1 and Z1, so that
!>      Q1 * A * Z1**H = (Q1*Q) * H * (Z1*Z)**H
!>      Q1 * B * Z1**H = (Q1*Q) * T * (Z1*Z)**H
!> If Q1 is the unitary matrix from the QR factorization of B in the
!> original equation A*x = lambda*B*x, then CGGHRD reduces the original
!> problem to generalized Hessenberg form.
!>

Parameters

[in]	COMPQ	!> COMPQ is CHARACTER*1 !> = 'N': do not compute Q; !> = 'I': Q is initialized to the unit matrix, and the !> unitary matrix Q is returned; !> = 'V': Q must contain a unitary matrix Q1 on entry, !> and the product Q1*Q is returned. !>
[in]	COMPZ	!> COMPZ is CHARACTER*1 !> = 'N': do not compute Z; !> = 'I': Z is initialized to the unit matrix, and the !> unitary matrix Z is returned; !> = 'V': Z must contain a unitary matrix Z1 on entry, !> and the product Z1*Z is returned. !>
[in]	N	!> N is INTEGER !> The order of the matrices A and B. N >= 0. !>
[in]	ILO	!> ILO is INTEGER !>
[in]	IHI	!> IHI is INTEGER !> !> ILO and IHI mark the rows and columns of A which are to be !> reduced. It is assumed that A is already upper triangular !> in rows and columns 1:ILO-1 and IHI+1:N. ILO and IHI are !> normally set by a previous call to CGGBAL; otherwise they !> should be set to 1 and N respectively. !> 1 <= ILO <= IHI <= N, if N > 0; ILO=1 and IHI=0, if N=0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA, N) !> On entry, the N-by-N general matrix to be reduced. !> On exit, the upper triangle and the first subdiagonal of A !> are overwritten with the upper Hessenberg matrix H, and the !> rest is set to zero. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB, N) !> On entry, the N-by-N upper triangular matrix B. !> On exit, the upper triangular matrix T = Q**H B Z. The !> elements below the diagonal are set to zero. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[in,out]	Q	!> Q is COMPLEX array, dimension (LDQ, N) !> On entry, if COMPQ = 'V', the unitary matrix Q1, typically !> from the QR factorization of B. !> On exit, if COMPQ='I', the unitary matrix Q, and if !> COMPQ = 'V', the product Q1*Q. !> Not referenced if COMPQ='N'. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. !> LDQ >= N if COMPQ='V' or 'I'; LDQ >= 1 otherwise. !>
[in,out]	Z	!> Z is COMPLEX array, dimension (LDZ, N) !> On entry, if COMPZ = 'V', the unitary matrix Z1. !> On exit, if COMPZ='I', the unitary matrix Z, and if !> COMPZ = 'V', the product Z1*Z. !> Not referenced if COMPZ='N'. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. !> LDZ >= N if COMPZ='V' or 'I'; LDZ >= 1 otherwise. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  This routine reduces A to Hessenberg and B to triangular form by
!>  an unblocked reduction, as described in _Matrix_Computations_,
!>  by Golub and van Loan (Johns Hopkins Press).
!>

Definition at line 202 of file cgghrd.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Unblocked reduction of the pencil (A,B) to generalized upper
*     Hessenberg form.  Each column of the active window ILO:IHI is
*     processed from the bottom up: a row rotation annihilates one
*     entry of A, then a column rotation removes the subdiagonal
*     entry this created in B.  The rotations are also applied to
*     Q and Z when the caller asked for them.
*
*     .. Scalar Arguments ..
      CHARACTER          COMPQ, COMPZ
      INTEGER            IHI, ILO, INFO, LDA, LDB, LDQ, LDZ, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), B( LDB, * ), Q( LDQ, * ),
     $                   Z( LDZ, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CZERO, CONE
      parameter( czero = ( 0.0e+0, 0.0e+0 ),
     $                   cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            WANTQ, WANTZ
      INTEGER            ICOL, IROW, IUP, MODEQ, MODEZ
      REAL               CS
      COMPLEX            PIVOT, SN
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           clartg, claset, crot, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max
*     ..
*     .. Executable Statements ..
*
*     Translate COMPQ: MODEQ is 1, 2 or 3 for 'N', 'V' or 'I' and
*     stays 0 for any other character.  WANTQ records whether Q is
*     updated at all.
*
      modeq = 0
      IF( lsame( compq, 'N' ) ) THEN
         modeq = 1
         wantq = .false.
      ELSE IF( lsame( compq, 'V' ) ) THEN
         modeq = 2
         wantq = .true.
      ELSE IF( lsame( compq, 'I' ) ) THEN
         modeq = 3
         wantq = .true.
      END IF
*
*     Translate COMPZ in the same way.
*
      modez = 0
      IF( lsame( compz, 'N' ) ) THEN
         modez = 1
         wantz = .false.
      ELSE IF( lsame( compz, 'V' ) ) THEN
         modez = 2
         wantz = .true.
      ELSE IF( lsame( compz, 'I' ) ) THEN
         modez = 3
         wantz = .true.
      END IF
*
*     Validate the arguments; INFO = -i flags the i-th argument.
*
      info = 0
      IF( modeq.LE.0 ) THEN
         info = -1
      ELSE IF( modez.LE.0 ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( ilo.LT.1 ) THEN
         info = -4
      ELSE IF( ihi.GT.n .OR. ihi.LT.ilo-1 ) THEN
         info = -5
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -7
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -9
      ELSE IF( ( wantq .AND. ldq.LT.n ) .OR. ldq.LT.1 ) THEN
         info = -11
      ELSE IF( ( wantz .AND. ldz.LT.n ) .OR. ldz.LT.1 ) THEN
         info = -13
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CGGHRD', -info )
         RETURN
      END IF
*
*     Mode 3 ('I'): start Q and/or Z from the identity.
*
      IF( modeq.EQ.3 ) THEN
         CALL claset( 'Full', n, n, czero, cone, q, ldq )
      END IF
      IF( modez.EQ.3 ) THEN
         CALL claset( 'Full', n, n, czero, cone, z, ldz )
      END IF
*
*     Nothing left to do for matrices of order 0 or 1.
*
      IF( n.LE.1 ) THEN
         RETURN
      END IF
*
*     Clear the strictly lower triangle of B.
*
      DO icol = 1, n - 1
         DO irow = icol + 1, n
            b( irow, icol ) = czero
         END DO
      END DO
*
*     Main reduction.  IUP is the row (and column) paired with IROW
*     in each rotation.
*
      DO icol = ilo, ihi - 2
         DO irow = ihi, icol + 2, -1
            iup = irow - 1
*
*           Row rotation in the (IUP,IROW) plane chosen so that
*           A(IROW,ICOL) becomes zero; apply it to the remaining
*           columns of A, to B and (conjugated) to the columns of Q.
*
            pivot = a( iup, icol )
            CALL clartg( pivot, a( irow, icol ), cs, sn,
     $                   a( iup, icol ) )
            a( irow, icol ) = czero
            CALL crot( n-icol, a( iup, icol+1 ), lda,
     $                 a( irow, icol+1 ), lda, cs, sn )
            CALL crot( n+2-irow, b( iup, iup ), ldb, b( irow, iup ),
     $                 ldb, cs, sn )
            IF( wantq ) THEN
               CALL crot( n, q( 1, iup ), 1, q( 1, irow ), 1, cs,
     $                    conjg( sn ) )
            END IF
*
*           Column rotation in the (IROW,IUP) plane chosen so that
*           B(IROW,IUP) becomes zero; apply it to A, to the rows of
*           B above IROW and to Z.
*
            pivot = b( irow, irow )
            CALL clartg( pivot, b( irow, iup ), cs, sn,
     $                   b( irow, irow ) )
            b( irow, iup ) = czero
            CALL crot( ihi, a( 1, irow ), 1, a( 1, iup ), 1, cs,
     $                 sn )
            CALL crot( iup, b( 1, irow ), 1, b( 1, iup ), 1, cs,
     $                 sn )
            IF( wantz ) THEN
               CALL crot( n, z( 1, irow ), 1, z( 1, iup ), 1, cs,
     $                    sn )
            END IF
         END DO
      END DO
*
      RETURN
*
*     End of CGGHRD
*

◆ cggqrf()

subroutine cggqrf	(	integer	n,
		integer	m,
		integer	p,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	taua,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( * )	taub,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CGGQRF

Download CGGQRF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CGGQRF computes a generalized QR factorization of an N-by-M matrix A
!> and an N-by-P matrix B:
!>
!>             A = Q*R,        B = Q*T*Z,
!>
!> where Q is an N-by-N unitary matrix, Z is a P-by-P unitary matrix,
!> and R and T assume one of the forms:
!>
!> if N >= M,  R = ( R11 ) M  ,   or if N < M,  R = ( R11  R12 ) N,
!>                 (  0  ) N-M                         N   M-N
!>                    M
!>
!> where R11 is upper triangular, and
!>
!> if N <= P,  T = ( 0  T12 ) N,   or if N > P,  T = ( T11 ) N-P,
!>                  P-N  N                           ( T21 ) P
!>                                                      P
!>
!> where T12 or T21 is upper triangular.
!>
!> In particular, if B is square and nonsingular, the GQR factorization
!> of A and B implicitly gives the QR factorization of inv(B)*A:
!>
!>              inv(B)*A = Z**H * (inv(T)*R)
!>
!> where inv(B) denotes the inverse of the matrix B, and Z**H denotes the
!> conjugate transpose of the matrix Z.
!>

Parameters

[in]	N	!> N is INTEGER !> The number of rows of the matrices A and B. N >= 0. !>
[in]	M	!> M is INTEGER !> The number of columns of the matrix A. M >= 0. !>
[in]	P	!> P is INTEGER !> The number of columns of the matrix B. P >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,M) !> On entry, the N-by-M matrix A. !> On exit, the elements on and above the diagonal of the array !> contain the min(N,M)-by-M upper trapezoidal matrix R (R is !> upper triangular if N >= M); the elements below the diagonal, !> with the array TAUA, represent the unitary matrix Q as a !> product of min(N,M) elementary reflectors (see Further !> Details). !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	TAUA	!> TAUA is COMPLEX array, dimension (min(N,M)) !> The scalar factors of the elementary reflectors which !> represent the unitary matrix Q (see Further Details). !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,P) !> On entry, the N-by-P matrix B. !> On exit, if N <= P, the upper triangle of the subarray !> B(1:N,P-N+1:P) contains the N-by-N upper triangular matrix T; !> if N > P, the elements on and above the (N-P)-th subdiagonal !> contain the N-by-P upper trapezoidal matrix T; the remaining !> elements, with the array TAUB, represent the unitary !> matrix Z as a product of elementary reflectors (see Further !> Details). !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[out]	TAUB	!> TAUB is COMPLEX array, dimension (min(N,P)) !> The scalar factors of the elementary reflectors which !> represent the unitary matrix Z (see Further Details). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,N,M,P). !> For optimum performance LWORK >= max(N,M,P)*max(NB1,NB2,NB3), !> where NB1 is the optimal blocksize for the QR factorization !> of an N-by-M matrix, NB2 is the optimal blocksize for the !> RQ factorization of an N-by-P matrix, and NB3 is the optimal !> blocksize for a call of CUNMQR. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The matrix Q is represented as a product of elementary reflectors
!>
!>     Q = H(1) H(2) . . . H(k), where k = min(n,m).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - taua * v * v**H
!>
!>  where taua is a complex scalar, and v is a complex vector with
!>  v(1:i-1) = 0 and v(i) = 1; v(i+1:n) is stored on exit in A(i+1:n,i),
!>  and taua in TAUA(i).
!>  To form Q explicitly, use LAPACK subroutine CUNGQR.
!>  To use Q to update another matrix, use LAPACK subroutine CUNMQR.
!>
!>  The matrix Z is represented as a product of elementary reflectors
!>
!>     Z = H(1) H(2) . . . H(k), where k = min(n,p).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - taub * v * v**H
!>
!>  where taub is a complex scalar, and v is a complex vector with
!>  v(p-k+i+1:p) = 0 and v(p-k+i) = 1; v(1:p-k+i-1) is stored on exit in
!>  B(n-k+i,1:p-k+i-1), and taub in TAUB(i).
!>  To form Z explicitly, use LAPACK subroutine CUNGRQ.
!>  To use Z to update another matrix, use LAPACK subroutine CUNMRQ.
!>

Definition at line 213 of file cggqrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Generalized QR factorization driver.  After argument checking
*     it performs three steps, all sharing the caller's WORK array:
*       1. CGEQRF factors the N-by-M matrix A,
*       2. CUNMQR applies Q**H from that factorization to B,
*       3. CGERQF factors the updated N-by-P matrix B.
*     WORK(1) is set on entry to the block-size based estimate
*     LWKOPT and, on a full run, to the largest workspace size
*     reported by the three callees.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, LDB, LWORK, M, N, P
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), B( LDB, * ), TAUA( * ), TAUB( * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      LOGICAL            LQUERY
      INTEGER            LOPT, LWKOPT, NB, NB1, NB2, NB3
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgeqrf, cgerqf, cunmqr, xerbla
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          int, max, min
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters
*
      info = 0
*
*     NB is the largest block size ILAENV reports for the three
*     routines called below.
*
      nb1 = ilaenv( 1, 'CGEQRF', ' ', n, m, -1, -1 )
      nb2 = ilaenv( 1, 'CGERQF', ' ', n, p, -1, -1 )
      nb3 = ilaenv( 1, 'CUNMQR', ' ', n, m, p, -1 )
      nb = max( nb1, nb2, nb3 )
*
*     Never report a workspace size below 1: with N = M = P = 0 the
*     product is 0, which the LWORK test below would reject if the
*     caller passed the queried value straight back in.
*
      lwkopt = max( 1, max( n, m, p )*nb )
      work( 1 ) = lwkopt
      lquery = ( lwork.EQ.-1 )
      IF( n.LT.0 ) THEN
         info = -1
      ELSE IF( m.LT.0 ) THEN
         info = -2
      ELSE IF( p.LT.0 ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -5
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -8
      ELSE IF( lwork.LT.max( 1, n, m, p ) .AND. .NOT.lquery ) THEN
         info = -11
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CGGQRF', -info )
         RETURN
      ELSE IF( lquery ) THEN
*
*        Workspace query: WORK(1) already holds LWKOPT.
*
         RETURN
      END IF
*
*     QR factorization of N-by-M matrix A: A = Q*R
*
      CALL cgeqrf( n, m, a, lda, taua, work, lwork, info )
*
*     INT of a complex value converts its real part, the same
*     conversion used for the other two callees below.
*
      lopt = int( work( 1 ) )
*
*     Update B := Q**H*B.
*
      CALL cunmqr( 'Left', 'Conjugate Transpose', n, p, min( n, m ), a,
     $             lda, taua, b, ldb, work, lwork, info )
      lopt = max( lopt, int( work( 1 ) ) )
*
*     RQ factorization of N-by-P matrix B: B = T*Z.
*
      CALL cgerqf( n, p, b, ldb, taub, work, lwork, info )
*
*     Return the largest workspace size any of the three steps
*     reported.
*
      work( 1 ) = max( lopt, int( work( 1 ) ) )
*
      RETURN
*
*     End of CGGQRF
*

◆ cggrqf()

subroutine cggrqf	(	integer	m,
		integer	p,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	taua,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( * )	taub,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CGGRQF

Download CGGRQF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CGGRQF computes a generalized RQ factorization of an M-by-N matrix A
!> and a P-by-N matrix B:
!>
!>             A = R*Q,        B = Z*T*Q,
!>
!> where Q is an N-by-N unitary matrix, Z is a P-by-P unitary
!> matrix, and R and T assume one of the forms:
!>
!> if M <= N,  R = ( 0  R12 ) M,   or if M > N,  R = ( R11 ) M-N,
!>                  N-M  M                           ( R21 ) N
!>                                                      N
!>
!> where R12 or R21 is upper triangular, and
!>
!> if P >= N,  T = ( T11 ) N  ,   or if P < N,  T = ( T11  T12 ) P,
!>                 (  0  ) P-N                         P   N-P
!>                    N
!>
!> where T11 is upper triangular.
!>
!> In particular, if B is square and nonsingular, the GRQ factorization
!> of A and B implicitly gives the RQ factorization of A*inv(B):
!>
!>              A*inv(B) = (R*inv(T))*Z**H
!>
!> where inv(B) denotes the inverse of the matrix B, and Z**H denotes the
!> conjugate transpose of the matrix Z.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	P	!> P is INTEGER !> The number of rows of the matrix B. P >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrices A and B. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the M-by-N matrix A. !> On exit, if M <= N, the upper triangle of the subarray !> A(1:M,N-M+1:N) contains the M-by-M upper triangular matrix R; !> if M > N, the elements on and above the (M-N)-th subdiagonal !> contain the M-by-N upper trapezoidal matrix R; the remaining !> elements, with the array TAUA, represent the unitary !> matrix Q as a product of elementary reflectors (see Further !> Details). !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	TAUA	!> TAUA is COMPLEX array, dimension (min(M,N)) !> The scalar factors of the elementary reflectors which !> represent the unitary matrix Q (see Further Details). !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,N) !> On entry, the P-by-N matrix B. !> On exit, the elements on and above the diagonal of the array !> contain the min(P,N)-by-N upper trapezoidal matrix T (T is !> upper triangular if P >= N); the elements below the diagonal, !> with the array TAUB, represent the unitary matrix Z as a !> product of elementary reflectors (see Further Details). !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,P). !>
[out]	TAUB	!> TAUB is COMPLEX array, dimension (min(P,N)) !> The scalar factors of the elementary reflectors which !> represent the unitary matrix Z (see Further Details). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,N,M,P). !> For optimum performance LWORK >= max(N,M,P)*max(NB1,NB2,NB3), !> where NB1 is the optimal blocksize for the RQ factorization !> of an M-by-N matrix, NB2 is the optimal blocksize for the !> QR factorization of a P-by-N matrix, and NB3 is the optimal !> blocksize for a call of CUNMRQ. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO=-i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The matrix Q is represented as a product of elementary reflectors
!>
!>     Q = H(1) H(2) . . . H(k), where k = min(m,n).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - taua * v * v**H
!>
!>  where taua is a complex scalar, and v is a complex vector with
!>  v(n-k+i+1:n) = 0 and v(n-k+i) = 1; v(1:n-k+i-1) is stored on exit in
!>  A(m-k+i,1:n-k+i-1), and taua in TAUA(i).
!>  To form Q explicitly, use LAPACK subroutine CUNGRQ.
!>  To use Q to update another matrix, use LAPACK subroutine CUNMRQ.
!>
!>  The matrix Z is represented as a product of elementary reflectors
!>
!>     Z = H(1) H(2) . . . H(k), where k = min(p,n).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - taub * v * v**H
!>
!>  where taub is a complex scalar, and v is a complex vector with
!>  v(1:i-1) = 0 and v(i) = 1; v(i+1:p) is stored on exit in B(i+1:p,i),
!>  and taub in TAUB(i).
!>  To form Z explicitly, use LAPACK subroutine CUNGQR.
!>  To use Z to update another matrix, use LAPACK subroutine CUNMQR.
!>

Definition at line 212 of file cggrqf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Generalized RQ factorization driver.  After argument checking
*     it performs three steps, all sharing the caller's WORK array:
*       1. CGERQF factors the M-by-N matrix A,
*       2. CUNMRQ applies Q**H from that factorization to B from
*          the right,
*       3. CGEQRF factors the updated P-by-N matrix B.
*     WORK(1) is set on entry to the block-size based estimate
*     LWKOPT and, on a full run, to the largest workspace size
*     reported by the three callees.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, LDB, LWORK, M, N, P
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), B( LDB, * ), TAUA( * ), TAUB( * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      LOGICAL            LQUERY
      INTEGER            LOPT, LWKOPT, NB, NB1, NB2, NB3
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgeqrf, cgerqf, cunmrq, xerbla
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          int, max, min
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters
*
      info = 0
*
*     NB is the largest block size ILAENV reports for the three
*     routines called below.
*
      nb1 = ilaenv( 1, 'CGERQF', ' ', m, n, -1, -1 )
      nb2 = ilaenv( 1, 'CGEQRF', ' ', p, n, -1, -1 )
      nb3 = ilaenv( 1, 'CUNMRQ', ' ', m, n, p, -1 )
      nb = max( nb1, nb2, nb3 )
*
*     Never report a workspace size below 1: with M = P = N = 0 the
*     product is 0, which the LWORK test below would reject if the
*     caller passed the queried value straight back in.
*
      lwkopt = max( 1, max( n, m, p )*nb )
      work( 1 ) = lwkopt
      lquery = ( lwork.EQ.-1 )
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( p.LT.0 ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -5
      ELSE IF( ldb.LT.max( 1, p ) ) THEN
         info = -8
      ELSE IF( lwork.LT.max( 1, m, p, n ) .AND. .NOT.lquery ) THEN
         info = -11
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CGGRQF', -info )
         RETURN
      ELSE IF( lquery ) THEN
*
*        Workspace query: WORK(1) already holds LWKOPT.
*
         RETURN
      END IF
*
*     RQ factorization of M-by-N matrix A: A = R*Q
*
      CALL cgerqf( m, n, a, lda, taua, work, lwork, info )
*
*     INT of a complex value converts its real part, the same
*     conversion used for the other two callees below.
*
      lopt = int( work( 1 ) )
*
*     Update B := B*Q**H.  The reflectors are read starting at row
*     max(1,M-N+1) of A.
*
      CALL cunmrq( 'Right', 'Conjugate Transpose', p, n, min( m, n ),
     $             a( max( 1, m-n+1 ), 1 ), lda, taua, b, ldb, work,
     $             lwork, info )
      lopt = max( lopt, int( work( 1 ) ) )
*
*     QR factorization of P-by-N matrix B: B = Z*T
*
      CALL cgeqrf( p, n, b, ldb, taub, work, lwork, info )
*
*     Return the largest workspace size any of the three steps
*     reported.
*
      work( 1 ) = max( lopt, int( work( 1 ) ) )
*
      RETURN
*
*     End of CGGRQF
*

◆ cggsvp()

subroutine cggsvp	(	character	jobu,
		character	jobv,
		character	jobq,
		integer	m,
		integer	p,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		real	tola,
		real	tolb,
		integer	k,
		integer	l,
		complex, dimension( ldu, * )	u,
		integer	ldu,
		complex, dimension( ldv, * )	v,
		integer	ldv,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		integer, dimension( * )	iwork,
		real, dimension( * )	rwork,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	info )

CGGSVP

Download CGGSVP + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> This routine is deprecated and has been replaced by routine CGGSVP3.
!>
!> CGGSVP computes unitary matrices U, V and Q such that
!>
!>                    N-K-L  K    L
!>  U**H*A*Q =     K ( 0    A12  A13 )  if M-K-L >= 0;
!>                 L ( 0     0   A23 )
!>             M-K-L ( 0     0    0  )
!>
!>                  N-K-L  K    L
!>         =     K ( 0    A12  A13 )  if M-K-L < 0;
!>             M-K ( 0     0   A23 )
!>
!>                  N-K-L  K    L
!>  V**H*B*Q =   L ( 0     0   B13 )
!>             P-L ( 0     0    0  )
!>
!> where the K-by-K matrix A12 and L-by-L matrix B13 are nonsingular
!> upper triangular; A23 is L-by-L upper triangular if M-K-L >= 0,
!> otherwise A23 is (M-K)-by-L upper trapezoidal.  K+L = the effective
!> numerical rank of the (M+P)-by-N matrix (A**H,B**H)**H.
!>
!> This decomposition is the preprocessing step for computing the
!> Generalized Singular Value Decomposition (GSVD), see subroutine
!> CGGSVD.
!>

Parameters

[in]	JOBU	!> JOBU is CHARACTER*1 !> = 'U': Unitary matrix U is computed; !> = 'N': U is not computed. !>
[in]	JOBV	!> JOBV is CHARACTER*1 !> = 'V': Unitary matrix V is computed; !> = 'N': V is not computed. !>
[in]	JOBQ	!> JOBQ is CHARACTER*1 !> = 'Q': Unitary matrix Q is computed; !> = 'N': Q is not computed. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	P	!> P is INTEGER !> The number of rows of the matrix B. P >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrices A and B. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the M-by-N matrix A. !> On exit, A contains the triangular (or trapezoidal) matrix !> described in the Purpose section. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,N) !> On entry, the P-by-N matrix B. !> On exit, B contains the triangular matrix described in !> the Purpose section. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,P). !>
[in]	TOLA	!> TOLA is REAL !>
[in]	TOLB	!> TOLB is REAL !> !> TOLA and TOLB are the thresholds to determine the effective !> numerical rank of matrix B and a subblock of A. Generally, !> they are set to !> TOLA = MAX(M,N)*norm(A)*MACHEPS, !> TOLB = MAX(P,N)*norm(B)*MACHEPS. !> The size of TOLA and TOLB may affect the size of backward !> errors of the decomposition. !>
[out]	K	!> K is INTEGER !>
[out]	L	!> L is INTEGER !> !> On exit, K and L specify the dimension of the subblocks !> described in Purpose section. !> K + L = effective numerical rank of (A**H,B**H)**H. !>
[out]	U	!> U is COMPLEX array, dimension (LDU,M) !> If JOBU = 'U', U contains the unitary matrix U. !> If JOBU = 'N', U is not referenced. !>
[in]	LDU	!> LDU is INTEGER !> The leading dimension of the array U. LDU >= max(1,M) if !> JOBU = 'U'; LDU >= 1 otherwise. !>
[out]	V	!> V is COMPLEX array, dimension (LDV,P) !> If JOBV = 'V', V contains the unitary matrix V. !> If JOBV = 'N', V is not referenced. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of the array V. LDV >= max(1,P) if !> JOBV = 'V'; LDV >= 1 otherwise. !>
[out]	Q	!> Q is COMPLEX array, dimension (LDQ,N) !> If JOBQ = 'Q', Q contains the unitary matrix Q. !> If JOBQ = 'N', Q is not referenced. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N) if !> JOBQ = 'Q'; LDQ >= 1 otherwise. !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (2*N) !>
[out]	TAU	!> TAU is COMPLEX array, dimension (N) !>
[out]	WORK	!> WORK is COMPLEX array, dimension (max(3*N,M,P)) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:: The subroutine uses LAPACK subroutine CGEQPF for the QR factorization with column pivoting to detect the effective numerical rank of a matrix. It may be replaced by a better rank determination strategy.

Definition at line 259 of file cggsvp.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CGGSVP (deprecated in favour of CGGSVP3).  It reduces the
*     pair (A, B) in place to the block triangular/trapezoidal forms
*     U**H*A*Q and V**H*B*Q, and returns the block sizes K and L.
*     U, V and Q are formed only when JOBU = 'U', JOBV = 'V' and
*     JOBQ = 'Q' respectively.
*
*     INFO is also passed as the status argument of every helper call
*     below and is not examined after those calls.
*
*     .. Scalar Arguments ..
      CHARACTER          JOBQ, JOBU, JOBV
      INTEGER            INFO, K, L, LDA, LDB, LDQ, LDU, LDV, M, N, P
      REAL               TOLA, TOLB
*     ..
*     .. Array Arguments ..
      INTEGER            IWORK( * )
      REAL               RWORK( * )
      COMPLEX            A( LDA, * ), B( LDB, * ), Q( LDQ, * ),
     $                   TAU( * ), U( LDU, * ), V( LDV, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CZERO, CONE
      parameter( czero = ( 0.0e+0, 0.0e+0 ),
     $                   cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            FORWRD, WANTQ, WANTU, WANTV
      INTEGER            I, J
      COMPLEX            T
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgeqpf, cgeqr2, cgerq2, clacpy, clapmt, claset,
     $                   cung2r, cunm2r, cunmr2, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, min, real
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
*
*     CABS1( T ) = |Re( T )| + |Im( T )|; it is the magnitude used for
*     both rank tests below.
*
      cabs1( t ) = abs( real( t ) ) + abs( aimag( t ) )
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters
*
      wantu = lsame( jobu, 'U' )
      wantv = lsame( jobv, 'V' )
      wantq = lsame( jobq, 'Q' )
*
*     FORWRD is the direction flag handed to every CLAPMT call.
*
      forwrd = .true.
*
*     INFO = -i identifies the position of the first illegal argument
*     in the calling sequence.
*
      info = 0
      IF( .NOT.( wantu .OR. lsame( jobu, 'N' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( wantv .OR. lsame( jobv, 'N' ) ) ) THEN
         info = -2
      ELSE IF( .NOT.( wantq .OR. lsame( jobq, 'N' ) ) ) THEN
         info = -3
      ELSE IF( m.LT.0 ) THEN
         info = -4
      ELSE IF( p.LT.0 ) THEN
         info = -5
      ELSE IF( n.LT.0 ) THEN
         info = -6
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -8
      ELSE IF( ldb.LT.max( 1, p ) ) THEN
         info = -10
      ELSE IF( ldu.LT.1 .OR. ( wantu .AND. ldu.LT.m ) ) THEN
         info = -16
      ELSE IF( ldv.LT.1 .OR. ( wantv .AND. ldv.LT.p ) ) THEN
         info = -18
      ELSE IF( ldq.LT.1 .OR. ( wantq .AND. ldq.LT.n ) ) THEN
         info = -20
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CGGSVP', -info )
         RETURN
      END IF
*
*     QR with column pivoting of B: B*P = V*( S11 S12 )
*                                           (  0   0  )
*
*     IWORK is cleared before being passed as the pivot array.
*     NOTE(review): presumably a zero entry marks a column as free to
*     be pivoted -- confirm against the CGEQPF documentation.
*
      DO 10 i = 1, n
         iwork( i ) = 0
   10 CONTINUE
      CALL cgeqpf( p, n, b, ldb, iwork, tau, work, rwork, info )
*
*     Update A := A*P
*
      CALL clapmt( forwrd, m, n, a, lda, iwork )
*
*     Determine the effective rank of matrix B.
*
*     L counts the diagonal entries B(i,i), i = 1..min(P,N), whose
*     CABS1 value exceeds TOLB.
*
      l = 0
      DO 20 i = 1, min( p, n )
         IF( cabs1( b( i, i ) ).GT.tolb )
     $      l = l + 1
   20 CONTINUE
*
      IF( wantv ) THEN
*
*        Copy the details of V, and form V.
*
*        V is zeroed, the part of B below the diagonal is copied into
*        it, and CUNG2R is then called on V with TAU.
*
         CALL claset( 'Full', p, p, czero, czero, v, ldv )
         IF( p.GT.1 )
     $      CALL clacpy( 'Lower', p-1, n, b( 2, 1 ), ldb, v( 2, 1 ),
     $                   ldv )
         CALL cung2r( p, p, min( p, n ), v, ldv, tau, work, info )
      END IF
*
*     Clean up B
*
*     Zero the strictly lower triangle of B(1:L,1:L) and all of
*     rows L+1:P.
*
      DO 40 j = 1, l - 1
         DO 30 i = j + 1, l
            b( i, j ) = czero
   30    CONTINUE
   40 CONTINUE
      IF( p.GT.l )
     $   CALL claset( 'Full', p-l, n, czero, czero, b( l+1, 1 ), ldb )
*
      IF( wantq ) THEN
*
*        Set Q = I and Update Q := Q*P
*
         CALL claset( 'Full', n, n, czero, cone, q, ldq )
         CALL clapmt( forwrd, n, n, q, ldq, iwork )
      END IF
*
*     The RQ step is skipped when N = L.
*
      IF( p.GE.l .AND. n.NE.l ) THEN
*
*        RQ factorization of ( S11 S12 ) = ( 0 S12 )*Z
*
         CALL cgerq2( l, n, b, ldb, tau, work, info )
*
*        Update A := A*Z**H
*
         CALL cunmr2( 'Right', 'Conjugate transpose', m, n, l, b, ldb,
     $                tau, a, lda, work, info )
         IF( wantq ) THEN
*
*           Update Q := Q*Z**H
*
            CALL cunmr2( 'Right', 'Conjugate transpose', n, n, l, b,
     $                   ldb, tau, q, ldq, work, info )
         END IF
*
*        Clean up B
*
*        Zero B(1:L,1:N-L) and the strictly lower triangle of the
*        trailing block B(1:L,N-L+1:N).
*
         CALL claset( 'Full', l, n-l, czero, czero, b, ldb )
         DO 60 j = n - l + 1, n
            DO 50 i = j - n + l + 1, l
               b( i, j ) = czero
   50       CONTINUE
   60    CONTINUE
*
      END IF
*
*     Let              N-L     L
*                A = ( A11    A12 ) M,
*
*     then the following does the complete QR decomposition of A11:
*
*              A11 = U*(  0  T12 )*P1**H
*                      (  0   0  )
*
      DO 70 i = 1, n - l
         iwork( i ) = 0
   70 CONTINUE
      CALL cgeqpf( m, n-l, a, lda, iwork, tau, work, rwork, info )
*
*     Determine the effective rank of A11
*
*     K counts the diagonal entries A(i,i), i = 1..min(M,N-L), whose
*     CABS1 value exceeds TOLA.
*
      k = 0
      DO 80 i = 1, min( m, n-l )
         IF( cabs1( a( i, i ) ).GT.tola )
     $      k = k + 1
   80 CONTINUE
*
*     Update A12 := U**H*A12, where A12 = A( 1:M, N-L+1:N )
*
      CALL cunm2r( 'Left', 'Conjugate transpose', m, l, min( m, n-l ),
     $             a, lda, tau, a( 1, n-l+1 ), lda, work, info )
*
      IF( wantu ) THEN
*
*        Copy the details of U, and form U
*
         CALL claset( 'Full', m, m, czero, czero, u, ldu )
         IF( m.GT.1 )
     $      CALL clacpy( 'Lower', m-1, n-l, a( 2, 1 ), lda, u( 2, 1 ),
     $                   ldu )
         CALL cung2r( m, m, min( m, n-l ), u, ldu, tau, work, info )
      END IF
*
      IF( wantq ) THEN
*
*        Update Q( 1:N, 1:N-L )  = Q( 1:N, 1:N-L )*P1
*
         CALL clapmt( forwrd, n, n-l, q, ldq, iwork )
      END IF
*
*     Clean up A: set the strictly lower triangular part of
*     A(1:K, 1:K) = 0, and A( K+1:M, 1:N-L ) = 0.
*
      DO 100 j = 1, k - 1
         DO 90 i = j + 1, k
            a( i, j ) = czero
   90    CONTINUE
  100 CONTINUE
      IF( m.GT.k )
     $   CALL claset( 'Full', m-k, n-l, czero, czero, a( k+1, 1 ), lda )
*
      IF( n-l.GT.k ) THEN
*
*        RQ factorization of ( T11 T12 ) = ( 0 T12 )*Z1
*
         CALL cgerq2( k, n-l, a, lda, tau, work, info )
*
         IF( wantq ) THEN
*
*           Update Q( 1:N,1:N-L ) = Q( 1:N,1:N-L )*Z1**H
*
            CALL cunmr2( 'Right', 'Conjugate transpose', n, n-l, k, a,
     $                   lda, tau, q, ldq, work, info )
         END IF
*
*        Clean up A
*
*        Zero A(1:K,1:N-L-K) and the strictly lower triangle of
*        A(1:K,N-L-K+1:N-L).
*
         CALL claset( 'Full', k, n-l-k, czero, czero, a, lda )
         DO 120 j = n - l - k + 1, n - l
            DO 110 i = j - n + l + k + 1, k
               a( i, j ) = czero
  110       CONTINUE
  120    CONTINUE
*
      END IF
*
      IF( m.GT.k ) THEN
*
*        QR factorization of A( K+1:M,N-L+1:N )
*
         CALL cgeqr2( m-k, l, a( k+1, n-l+1 ), lda, tau, work, info )
*
         IF( wantu ) THEN
*
*           Update U(:,K+1:M) := U(:,K+1:M)*U1
*
            CALL cunm2r( 'Right', 'No transpose', m, m-k, min( m-k, l ),
     $                   a( k+1, n-l+1 ), lda, tau, u( 1, k+1 ), ldu,
     $                   work, info )
         END IF
*
*        Clean up
*
*        Zero the entries below the diagonal of the block
*        A(K+1:M,N-L+1:N).
*
         DO 140 j = n - l + 1, n
            DO 130 i = j - n + k + l + 1, m
               a( i, j ) = czero
  130       CONTINUE
  140    CONTINUE
*
      END IF
*
      RETURN
*
*     End of CGGSVP
*

◆ cggsvp3()

subroutine cggsvp3	(	character	jobu,
		character	jobv,
		character	jobq,
		integer	m,
		integer	p,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		real	tola,
		real	tolb,
		integer	k,
		integer	l,
		complex, dimension( ldu, * )	u,
		integer	ldu,
		complex, dimension( ldv, * )	v,
		integer	ldv,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		integer, dimension( * )	iwork,
		real, dimension( * )	rwork,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CGGSVP3

Download CGGSVP3 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CGGSVP3 computes unitary matrices U, V and Q such that
!>
!>                    N-K-L  K    L
!>  U**H*A*Q =     K ( 0    A12  A13 )  if M-K-L >= 0;
!>                 L ( 0     0   A23 )
!>             M-K-L ( 0     0    0  )
!>
!>                  N-K-L  K    L
!>         =     K ( 0    A12  A13 )  if M-K-L < 0;
!>             M-K ( 0     0   A23 )
!>
!>                  N-K-L  K    L
!>  V**H*B*Q =   L ( 0     0   B13 )
!>             P-L ( 0     0    0  )
!>
!> where the K-by-K matrix A12 and L-by-L matrix B13 are nonsingular
!> upper triangular; A23 is L-by-L upper triangular if M-K-L >= 0,
!> otherwise A23 is (M-K)-by-L upper trapezoidal.  K+L = the effective
!> numerical rank of the (M+P)-by-N matrix (A**H,B**H)**H.
!>
!> This decomposition is the preprocessing step for computing the
!> Generalized Singular Value Decomposition (GSVD), see subroutine
!> CGGSVD3.
!>

Parameters

[in]	JOBU	!> JOBU is CHARACTER*1 !> = 'U': Unitary matrix U is computed; !> = 'N': U is not computed. !>
[in]	JOBV	!> JOBV is CHARACTER*1 !> = 'V': Unitary matrix V is computed; !> = 'N': V is not computed. !>
[in]	JOBQ	!> JOBQ is CHARACTER*1 !> = 'Q': Unitary matrix Q is computed; !> = 'N': Q is not computed. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	P	!> P is INTEGER !> The number of rows of the matrix B. P >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrices A and B. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the M-by-N matrix A. !> On exit, A contains the triangular (or trapezoidal) matrix !> described in the Purpose section. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,N) !> On entry, the P-by-N matrix B. !> On exit, B contains the triangular matrix described in !> the Purpose section. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,P). !>
[in]	TOLA	!> TOLA is REAL !>
[in]	TOLB	!> TOLB is REAL !> !> TOLA and TOLB are the thresholds to determine the effective !> numerical rank of matrix B and a subblock of A. Generally, !> they are set to !> TOLA = MAX(M,N)*norm(A)*MACHEPS, !> TOLB = MAX(P,N)*norm(B)*MACHEPS. !> The size of TOLA and TOLB may affect the size of backward !> errors of the decomposition. !>
[out]	K	!> K is INTEGER !>
[out]	L	!> L is INTEGER !> !> On exit, K and L specify the dimension of the subblocks !> described in Purpose section. !> K + L = effective numerical rank of (A**H,B**H)**H. !>
[out]	U	!> U is COMPLEX array, dimension (LDU,M) !> If JOBU = 'U', U contains the unitary matrix U. !> If JOBU = 'N', U is not referenced. !>
[in]	LDU	!> LDU is INTEGER !> The leading dimension of the array U. LDU >= max(1,M) if !> JOBU = 'U'; LDU >= 1 otherwise. !>
[out]	V	!> V is COMPLEX array, dimension (LDV,P) !> If JOBV = 'V', V contains the unitary matrix V. !> If JOBV = 'N', V is not referenced. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of the array V. LDV >= max(1,P) if !> JOBV = 'V'; LDV >= 1 otherwise. !>
[out]	Q	!> Q is COMPLEX array, dimension (LDQ,N) !> If JOBQ = 'Q', Q contains the unitary matrix Q. !> If JOBQ = 'N', Q is not referenced. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N) if !> JOBQ = 'Q'; LDQ >= 1 otherwise. !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (2*N) !>
[out]	TAU	!> TAU is COMPLEX array, dimension (N) !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The subroutine uses LAPACK subroutine CGEQP3 for the QR factorization
!>  with column pivoting to detect the effective numerical rank of a
!>  matrix. It may be replaced by a better rank determination strategy.
!>
!>  CGGSVP3 replaces the deprecated subroutine CGGSVP.
!>
!>

Definition at line 275 of file cggsvp3.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CGGSVP3.  It reduces the pair (A, B) in place to the
*     block triangular/trapezoidal forms U**H*A*Q and V**H*B*Q, and
*     returns the block sizes K and L.  U, V and Q are formed only
*     when JOBU = 'U', JOBV = 'V' and JOBQ = 'Q' respectively.
*     With LWORK = -1 only the workspace size is computed and
*     returned in WORK(1).
*
*     INFO is also passed as the status argument of every helper call
*     below and is not examined after the factorization calls.
*
      IMPLICIT NONE
*
*     .. Scalar Arguments ..
      CHARACTER          JOBQ, JOBU, JOBV
      INTEGER            INFO, K, L, LDA, LDB, LDQ, LDU, LDV, M, N, P,
     $                   LWORK
      REAL               TOLA, TOLB
*     ..
*     .. Array Arguments ..
      INTEGER            IWORK( * )
      REAL               RWORK( * )
      COMPLEX            A( LDA, * ), B( LDB, * ), Q( LDQ, * ),
     $                   TAU( * ), U( LDU, * ), V( LDV, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CZERO, CONE
      parameter( czero = ( 0.0e+0, 0.0e+0 ),
     $                   cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            FORWRD, WANTQ, WANTU, WANTV, LQUERY
      INTEGER            I, J, LWKOPT
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgeqp3, cgeqr2, cgerq2, clacpy, clapmt,
     $                   claset, cung2r, cunm2r, cunmr2, xerbla
*     ..
*     .. Intrinsic Functions ..
*
*     NOTE(review): AIMAG and REAL are listed here but not referenced
*     in this body, while INT and CMPLX are used without being listed.
*
      INTRINSIC          abs, aimag, max, min, real
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters
*
      wantu = lsame( jobu, 'U' )
      wantv = lsame( jobv, 'V' )
      wantq = lsame( jobq, 'Q' )
*
*     FORWRD is the direction flag handed to every CLAPMT call.
*
      forwrd = .true.
      lquery = ( lwork.EQ.-1 )
      lwkopt = 1
*
*     Test the input arguments
*
*     INFO = -i identifies the position of the first illegal argument
*     in the calling sequence.  LWORK is rejected only when it is
*     below 1 and is not the query value -1.
*
      info = 0
      IF( .NOT.( wantu .OR. lsame( jobu, 'N' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( wantv .OR. lsame( jobv, 'N' ) ) ) THEN
         info = -2
      ELSE IF( .NOT.( wantq .OR. lsame( jobq, 'N' ) ) ) THEN
         info = -3
      ELSE IF( m.LT.0 ) THEN
         info = -4
      ELSE IF( p.LT.0 ) THEN
         info = -5
      ELSE IF( n.LT.0 ) THEN
         info = -6
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -8
      ELSE IF( ldb.LT.max( 1, p ) ) THEN
         info = -10
      ELSE IF( ldu.LT.1 .OR. ( wantu .AND. ldu.LT.m ) ) THEN
         info = -16
      ELSE IF( ldv.LT.1 .OR. ( wantv .AND. ldv.LT.p ) ) THEN
         info = -18
      ELSE IF( ldq.LT.1 .OR. ( wantq .AND. ldq.LT.n ) ) THEN
         info = -20
      ELSE IF( lwork.LT.1 .AND. .NOT.lquery ) THEN
         info = -24
      END IF
*
*     Compute workspace
*
*     LWKOPT is the largest of: the WORK(1) values returned by the two
*     CGEQP3 calls made with LWORK = -1, P (if V is wanted),
*     min(N,P), M, N (if Q is wanted), and 1.
*
      IF( info.EQ.0 ) THEN
         CALL cgeqp3( p, n, b, ldb, iwork, tau, work, -1, rwork, info )
         lwkopt = int( work( 1 ) )
         IF( wantv ) THEN
            lwkopt = max( lwkopt, p )
         END IF
         lwkopt = max( lwkopt, min( n, p ) )
         lwkopt = max( lwkopt, m )
         IF( wantq ) THEN
            lwkopt = max( lwkopt, n )
         END IF
         CALL cgeqp3( m, n, a, lda, iwork, tau, work, -1, rwork, info )
         lwkopt = max( lwkopt, int( work( 1 ) ) )
         lwkopt = max( 1, lwkopt )
         work( 1 ) = cmplx( lwkopt )
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CGGSVP3', -info )
         RETURN
      END IF
*
*     Workspace query: WORK(1) already holds LWKOPT.
*
      IF( lquery ) THEN
         RETURN
      ENDIF
*
*     QR with column pivoting of B: B*P = V*( S11 S12 )
*                                           (  0   0  )
*
*     IWORK is cleared before being passed as the pivot array.
*     NOTE(review): presumably a zero entry marks a column as free to
*     be pivoted -- confirm against the CGEQP3 documentation.
*
      DO 10 i = 1, n
         iwork( i ) = 0
   10 CONTINUE
      CALL cgeqp3( p, n, b, ldb, iwork, tau, work, lwork, rwork, info )
*
*     Update A := A*P
*
      CALL clapmt( forwrd, m, n, a, lda, iwork )
*
*     Determine the effective rank of matrix B.
*
*     L counts the diagonal entries B(i,i), i = 1..min(P,N), whose
*     ABS value exceeds TOLB.
*
      l = 0
      DO 20 i = 1, min( p, n )
         IF( abs( b( i, i ) ).GT.tolb )
     $      l = l + 1
   20 CONTINUE
*
      IF( wantv ) THEN
*
*        Copy the details of V, and form V.
*
*        V is zeroed, the part of B below the diagonal is copied into
*        it, and CUNG2R is then called on V with TAU.
*
         CALL claset( 'Full', p, p, czero, czero, v, ldv )
         IF( p.GT.1 )
     $      CALL clacpy( 'Lower', p-1, n, b( 2, 1 ), ldb, v( 2, 1 ),
     $                   ldv )
         CALL cung2r( p, p, min( p, n ), v, ldv, tau, work, info )
      END IF
*
*     Clean up B
*
*     Zero the strictly lower triangle of B(1:L,1:L) and all of
*     rows L+1:P.
*
      DO 40 j = 1, l - 1
         DO 30 i = j + 1, l
            b( i, j ) = czero
   30    CONTINUE
   40 CONTINUE
      IF( p.GT.l )
     $   CALL claset( 'Full', p-l, n, czero, czero, b( l+1, 1 ), ldb )
*
      IF( wantq ) THEN
*
*        Set Q = I and Update Q := Q*P
*
         CALL claset( 'Full', n, n, czero, cone, q, ldq )
         CALL clapmt( forwrd, n, n, q, ldq, iwork )
      END IF
*
*     The RQ step is skipped when N = L.
*
      IF( p.GE.l .AND. n.NE.l ) THEN
*
*        RQ factorization of ( S11 S12 ) = ( 0 S12 )*Z
*
         CALL cgerq2( l, n, b, ldb, tau, work, info )
*
*        Update A := A*Z**H
*
         CALL cunmr2( 'Right', 'Conjugate transpose', m, n, l, b, ldb,
     $                tau, a, lda, work, info )
         IF( wantq ) THEN
*
*           Update Q := Q*Z**H
*
            CALL cunmr2( 'Right', 'Conjugate transpose', n, n, l, b,
     $                   ldb, tau, q, ldq, work, info )
         END IF
*
*        Clean up B
*
*        Zero B(1:L,1:N-L) and the strictly lower triangle of the
*        trailing block B(1:L,N-L+1:N).
*
         CALL claset( 'Full', l, n-l, czero, czero, b, ldb )
         DO 60 j = n - l + 1, n
            DO 50 i = j - n + l + 1, l
               b( i, j ) = czero
   50       CONTINUE
   60    CONTINUE
*
      END IF
*
*     Let              N-L     L
*                A = ( A11    A12 ) M,
*
*     then the following does the complete QR decomposition of A11:
*
*              A11 = U*(  0  T12 )*P1**H
*                      (  0   0  )
*
      DO 70 i = 1, n - l
         iwork( i ) = 0
   70 CONTINUE
      CALL cgeqp3( m, n-l, a, lda, iwork, tau, work, lwork, rwork,
     $             info )
*
*     Determine the effective rank of A11
*
*     K counts the diagonal entries A(i,i), i = 1..min(M,N-L), whose
*     ABS value exceeds TOLA.
*
      k = 0
      DO 80 i = 1, min( m, n-l )
         IF( abs( a( i, i ) ).GT.tola )
     $      k = k + 1
   80 CONTINUE
*
*     Update A12 := U**H*A12, where A12 = A( 1:M, N-L+1:N )
*
      CALL cunm2r( 'Left', 'Conjugate transpose', m, l, min( m, n-l ),
     $             a, lda, tau, a( 1, n-l+1 ), lda, work, info )
*
      IF( wantu ) THEN
*
*        Copy the details of U, and form U
*
         CALL claset( 'Full', m, m, czero, czero, u, ldu )
         IF( m.GT.1 )
     $      CALL clacpy( 'Lower', m-1, n-l, a( 2, 1 ), lda, u( 2, 1 ),
     $                   ldu )
         CALL cung2r( m, m, min( m, n-l ), u, ldu, tau, work, info )
      END IF
*
      IF( wantq ) THEN
*
*        Update Q( 1:N, 1:N-L )  = Q( 1:N, 1:N-L )*P1
*
         CALL clapmt( forwrd, n, n-l, q, ldq, iwork )
      END IF
*
*     Clean up A: set the strictly lower triangular part of
*     A(1:K, 1:K) = 0, and A( K+1:M, 1:N-L ) = 0.
*
      DO 100 j = 1, k - 1
         DO 90 i = j + 1, k
            a( i, j ) = czero
   90    CONTINUE
  100 CONTINUE
      IF( m.GT.k )
     $   CALL claset( 'Full', m-k, n-l, czero, czero, a( k+1, 1 ), lda )
*
      IF( n-l.GT.k ) THEN
*
*        RQ factorization of ( T11 T12 ) = ( 0 T12 )*Z1
*
         CALL cgerq2( k, n-l, a, lda, tau, work, info )
*
         IF( wantq ) THEN
*
*           Update Q( 1:N,1:N-L ) = Q( 1:N,1:N-L )*Z1**H
*
            CALL cunmr2( 'Right', 'Conjugate transpose', n, n-l, k, a,
     $                   lda, tau, q, ldq, work, info )
         END IF
*
*        Clean up A
*
*        Zero A(1:K,1:N-L-K) and the strictly lower triangle of
*        A(1:K,N-L-K+1:N-L).
*
         CALL claset( 'Full', k, n-l-k, czero, czero, a, lda )
         DO 120 j = n - l - k + 1, n - l
            DO 110 i = j - n + l + k + 1, k
               a( i, j ) = czero
  110       CONTINUE
  120    CONTINUE
*
      END IF
*
      IF( m.GT.k ) THEN
*
*        QR factorization of A( K+1:M,N-L+1:N )
*
         CALL cgeqr2( m-k, l, a( k+1, n-l+1 ), lda, tau, work, info )
*
         IF( wantu ) THEN
*
*           Update U(:,K+1:M) := U(:,K+1:M)*U1
*
            CALL cunm2r( 'Right', 'No transpose', m, m-k, min( m-k, l ),
     $                   a( k+1, n-l+1 ), lda, tau, u( 1, k+1 ), ldu,
     $                   work, info )
         END IF
*
*        Clean up
*
*        Zero the entries below the diagonal of the block
*        A(K+1:M,N-L+1:N).
*
         DO 140 j = n - l + 1, n
            DO 130 i = j - n + k + l + 1, m
               a( i, j ) = czero
  130       CONTINUE
  140    CONTINUE
*
      END IF
*
*     WORK was used as scratch above, so the workspace size is
*     stored in WORK(1) again before returning.
*
      work( 1 ) = cmplx( lwkopt )
      RETURN
*
*     End of CGGSVP3
*

◆ cgsvj0()

subroutine cgsvj0	(	character*1	jobv,
		integer	m,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( n )	d,
		real, dimension( n )	sva,
		integer	mv,
		complex, dimension( ldv, * )	v,
		integer	ldv,
		real	eps,
		real	sfmin,
		real	tol,
		integer	nsweep,
		complex, dimension( lwork )	work,
		integer	lwork,
		integer	info )

CGSVJ0 pre-processor for the routine cgesvj.

Download CGSVJ0 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CGSVJ0 is called from CGESVJ as a pre-processor and that is its main
!> purpose. It applies Jacobi rotations in the same way as CGESVJ does, but
!> it does not check convergence (stopping criterion). Few tuning
!> parameters (marked by [TP]) are available for the implementer.
!>

Parameters

[in]	JOBV	!> JOBV is CHARACTER*1 !> Specifies whether the output from this procedure is used !> to compute the matrix V: !> = 'V': the product of the Jacobi rotations is accumulated !> by postmultiplying the N-by-N array V. !> (See the description of V.) !> = 'A': the product of the Jacobi rotations is accumulated !> by postmultiplying the MV-by-N array V. !> (See the descriptions of MV and V.) !> = 'N': the Jacobi rotations are not accumulated. !>
[in]	M	!> M is INTEGER !> The number of rows of the input matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the input matrix A. !> M >= N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, M-by-N matrix A, such that A*diag(D) represents !> the input matrix. !> On exit, !> A_onexit * diag(D_onexit) represents the input matrix A*diag(D) !> post-multiplied by a sequence of Jacobi rotations, where the !> rotation threshold and the total number of sweeps are given in !> TOL and NSWEEP, respectively. !> (See the descriptions of D, TOL and NSWEEP.) !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[in,out]	D	!> D is COMPLEX array, dimension (N) !> The array D accumulates the scaling factors from the complex scaled !> Jacobi rotations. !> On entry, A*diag(D) represents the input matrix. !> On exit, A_onexit*diag(D_onexit) represents the input matrix !> post-multiplied by a sequence of Jacobi rotations, where the !> rotation threshold and the total number of sweeps are given in !> TOL and NSWEEP, respectively. !> (See the descriptions of A, TOL and NSWEEP.) !>
[in,out]	SVA	!> SVA is REAL array, dimension (N) !> On entry, SVA contains the Euclidean norms of the columns of !> the matrix A*diag(D). !> On exit, SVA contains the Euclidean norms of the columns of !> the matrix A_onexit*diag(D_onexit). !>
[in]	MV	!> MV is INTEGER !> If JOBV = 'A', then MV rows of V are post-multiplied by a !> sequence of Jacobi rotations. !> If JOBV = 'N', then MV is not referenced. !>
[in,out]	V	!> V is COMPLEX array, dimension (LDV,N) !> If JOBV = 'V' then N rows of V are post-multiplied by a !> sequence of Jacobi rotations. !> If JOBV = 'A' then MV rows of V are post-multiplied by a !> sequence of Jacobi rotations. !> If JOBV = 'N', then V is not referenced. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of the array V, LDV >= 1. !> If JOBV = 'V', LDV >= N. !> If JOBV = 'A', LDV >= MV. !>
[in]	EPS	!> EPS is REAL !> EPS = SLAMCH('Epsilon') !>
[in]	SFMIN	!> SFMIN is REAL !> SFMIN = SLAMCH('Safe Minimum') !>
[in]	TOL	!> TOL is REAL !> TOL is the threshold for Jacobi rotations. For a pair !> A(:,p), A(:,q) of pivot columns, the Jacobi rotation is !> applied only if ABS(COS(angle(A(:,p),A(:,q)))) > TOL. !>
[in]	NSWEEP	!> NSWEEP is INTEGER !> NSWEEP is the number of sweeps of Jacobi rotations to be !> performed. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (LWORK) !>
[in]	LWORK	!> LWORK is INTEGER !> LWORK is the dimension of WORK. LWORK >= M. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, then the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:: CGSVJ0 is used just to enable CGESVJ to call a simplified version of itself to work on a submatrix of the original matrix.

Contributor:: Zlatko Drmac (Zagreb, Croatia)

Bugs, Examples and Comments:: Please report all bugs and send interesting test examples and comments to drmac.nosp@m.@mat.nosp@m.h.hr. Thank you.

Definition at line 216 of file cgsvj0.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
      IMPLICIT NONE
*
*     Summary of the routine body
*     ===========================
*     CGSVJ0 performs up to NSWEEP sweeps of Jacobi plane rotations on
*     pairs of columns ( p, q ) of the M-by-N array A. Before a column
*     p is used as pivot it is swapped with the column of largest
*     SVA in p..N (de Rijk's pivoting). A pair is rotated only when the
*     modulus of its normalized inner product exceeds TOL.
*
*     JOBV   'V': rotations are also applied to the first N rows of V;
*            'A': rotations are also applied to the first MV rows of V;
*            'N': V is not touched.
*     SVA    column norms; read on entry and kept up to date here.
*     D      swapped together with the columns and updated after each
*            rotation.
*     WORK   scratch column of length M used for scaled copies.
*     INFO   = 0   on convergence (and on the quick return for N = 0);
*            = -i  if argument i failed the checks below;
*            = NSWEEP - 1 if the sweep loop ran to completion without
*              meeting either stopping test.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, LDV, LWORK, M, MV, N, NSWEEP
      REAL               EPS, SFMIN, TOL
      CHARACTER*1        JOBV
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), D( N ), V( LDV, * ), WORK( LWORK )
      REAL               SVA( N )
*     ..
*
*  =====================================================================
*
*     .. Local Parameters ..
      REAL               ZERO, HALF, ONE
      parameter( zero = 0.0e0, half = 0.5e0, one = 1.0e0)
      COMPLEX      CZERO,                  CONE
      parameter( czero = (0.0e0, 0.0e0), cone = (1.0e0, 0.0e0) )
*     ..
*     .. Local Scalars ..
      COMPLEX            AAPQ, OMPQ
      REAL               AAPP, AAPP0, AAPQ1, AAQQ, APOAQ, AQOAP, BIG,
     $                   BIGTHETA, CS, MXAAPQ, MXSINJ, ROOTBIG, ROOTEPS,
     $                   ROOTSFMIN, ROOTTOL, SMALL, SN, T, TEMP1, THETA,
     $                   THSIGN
      INTEGER            BLSKIP, EMPTSW, i, ibr, IERR, igl, IJBLSK, ir1,
     $                   ISWROT, jbc, jgl, KBL, LKAHEAD, MVL, NBL,
     $                   NOTROT, p, PSKIPPED, q, ROWSKIP, SWBAND
      LOGICAL            APPLV, ROTOK, RSVEC
*     ..
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC abs, max, conjg, real, min, sign, sqrt
*     ..
*     .. External Functions ..
      REAL               SCNRM2
      COMPLEX            CDOTC
      INTEGER            ISAMAX
      LOGICAL            LSAME
      EXTERNAL           isamax, lsame, cdotc, scnrm2
*     ..
*     ..
*     .. External Subroutines ..
*     ..
*     from BLAS
      EXTERNAL           ccopy, crot, cswap, caxpy
*     from LAPACK
      EXTERNAL           clascl, classq, xerbla
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      applv = lsame( jobv, 'A' )
      rsvec = lsame( jobv, 'V' )
      IF( .NOT.( rsvec .OR. applv .OR. lsame( jobv, 'N' ) ) ) THEN
         info = -1
      ELSE IF( m.LT.0 ) THEN
         info = -2
      ELSE IF( ( n.LT.0 ) .OR. ( n.GT.m ) ) THEN
         info = -3
      ELSE IF( lda.LT.m ) THEN
         info = -5
      ELSE IF( ( rsvec.OR.applv ) .AND. ( mv.LT.0 ) ) THEN
         info = -8
      ELSE IF( ( rsvec.AND.( ldv.LT.n ) ).OR.
     $         ( applv.AND.( ldv.LT.mv ) ) ) THEN
         info = -10
      ELSE IF( tol.LE.eps ) THEN
         info = -13
      ELSE IF( nsweep.LT.0 ) THEN
         info = -14
      ELSE IF( lwork.LT.m ) THEN
         info = -16
      ELSE
         info = 0
      END IF
*
*     #:(
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CGSVJ0', -info )
         RETURN
      END IF
*
*     Quick return for an empty problem (INFO is already 0 here).
*     N = 0 passes the checks above, but it would make
*     KBL = MIN( 8, N ) = 0, so that NBL = N / KBL below divides by
*     zero, and SVA( N ) after the sweep would be out of bounds.
*
      IF( n.EQ.0 ) RETURN
*
*     MVL is the number of rows of V that take part in the rotations.
*     It is only referenced when RSVEC is true, so it is left unset
*     for JOBV = 'N'. From here on RSVEC means "V is updated".
*
      IF( rsvec ) THEN
         mvl = n
      ELSE IF( applv ) THEN
         mvl = mv
      END IF
      rsvec = rsvec .OR. applv
 
*     Thresholds derived from EPS, SFMIN and TOL. They guard the
*     scaling of inner products and the choice of rotation formula.
      rooteps = sqrt( eps )
      rootsfmin = sqrt( sfmin )
      small = sfmin / eps
      big = one / sfmin
      rootbig = one / rootsfmin
      bigtheta = one / rooteps
      roottol = sqrt( tol )
*
*     .. Row-cyclic Jacobi SVD algorithm with column pivoting ..
*
*     EMPTSW is the number of pivot pairs 1 <= p < q <= N; NOTROT
*     reaching it is one of the stopping tests at the end of a sweep.
      emptsw = ( n*( n-1 ) ) / 2
      notrot = 0
*
*     .. Row-cyclic pivot strategy with de Rijk's pivoting ..
*
 
      swband = 0
*[TP] SWBAND is a tuning parameter [TP]. It is meaningful and effective
*     if CGESVJ is used as a computational routine in the preconditioned
*     Jacobi SVD algorithm CGEJSV. For sweeps i=1:SWBAND the procedure
*     works on pivots inside a band-like region around the diagonal.
*     The boundaries are determined dynamically, based on the number of
*     pivots above a threshold.
*
      kbl = min( 8, n )
*[TP] KBL is a tuning parameter that defines the tile size in the
*     tiling of the p-q loops of pivot pairs. In general, an optimal
*     value of KBL depends on the matrix dimensions and on the
*     parameters of the computer's memory.
*
*     NBL = number of tiles per dimension, i.e. N / KBL rounded up.
      nbl = n / kbl
      IF( ( nbl*kbl ).NE.n )nbl = nbl + 1
*
      blskip = kbl**2
*[TP] BLSKIP is a tuning parameter that depends on SWBAND and KBL.
*
      rowskip = min( 5, kbl )
*[TP] ROWSKIP is a tuning parameter.
*
      lkahead = 1
*[TP] LKAHEAD is a tuning parameter.
*
*     Quasi block transformations, using the lower (upper) triangular
*     structure of the input matrix. The quasi-block-cycling usually
*     invokes cubic convergence. Big part of this cycle is done inside
*     canonical subspaces of dimensions less than M.
*
*
*     .. Row-cyclic pivot strategy with de Rijk's pivoting ..
*
      DO 1993 i = 1, nsweep
*
*     .. go go go ...
*
*     Per-sweep statistics: MXAAPQ is the largest normalized inner
*     product modulus seen, MXSINJ the largest rotation sine (or
*     tangent), ISWROT the number of rotated pairs.
         mxaapq = zero
         mxsinj = zero
         iswrot = 0
*
         notrot = 0
         pskipped = 0
*
*     Each sweep is unrolled using KBL-by-KBL tiles over the pivot pairs
*     1 <= p < q <= N. This is the first step toward a blocked implementation
*     of the rotations. New implementation, based on block transformations,
*     is under development.
*
         DO 2000 ibr = 1, nbl
*
            igl = ( ibr-1 )*kbl + 1
*
*     Diagonal tile ibr, followed by up to LKAHEAD further diagonal
*     tiles (ir1 > 0).
            DO 1002 ir1 = 0, min( lkahead, nbl-ibr )
*
               igl = igl + ir1*kbl
*
               DO 2001 p = igl, min( igl+kbl-1, n-1 )
*
*     .. de Rijk's pivoting
*
*     Bring the column with the largest SVA among p..N to position p,
*     keeping V (if updated), SVA and D consistent with A.
                  q = isamax( n-p+1, sva( p ), 1 ) + p - 1
                  IF( p.NE.q ) THEN
                     CALL cswap( m, a( 1, p ), 1, a( 1, q ), 1 )
                     IF( rsvec )CALL cswap( mvl, v( 1, p ), 1,
     $                                           v( 1, q ), 1 )
                     temp1 = sva( p )
                     sva( p ) = sva( q )
                     sva( q ) = temp1
                     aapq = d(p)
                     d(p) = d(q)
                     d(q) = aapq
                  END IF
*
                  IF( ir1.EQ.0 ) THEN
*
*        Column norms are periodically updated by explicit
*        norm computation.
*        Caveat:
*        Unfortunately, some BLAS implementations compute SCNRM2(M,A(1,p),1)
*        as SQRT(S=CDOTC(M,A(1,p),1,A(1,p),1)), which may cause the result to
*        overflow for ||A(:,p)||_2 > SQRT(overflow_threshold), and to
*        underflow for ||A(:,p)||_2 < SQRT(underflow_threshold).
*        Hence, SCNRM2 cannot be trusted, not even in the case when
*        the true norm is far from the under(over)flow boundaries.
*        If properly implemented SCNRM2 is available, the IF-THEN-ELSE-END IF
*        below should be replaced with "AAPP = SCNRM2( M, A(1,p), 1 )".
*
                     IF( ( sva( p ).LT.rootbig ) .AND.
     $                    ( sva( p ).GT.rootsfmin ) ) THEN
                        sva( p ) = scnrm2( m, a( 1, p ), 1 )
                     ELSE
                        temp1 = zero
                        aapp = one
                        CALL classq( m, a( 1, p ), 1, temp1, aapp )
                        sva( p ) = temp1*sqrt( aapp )
                     END IF
                     aapp = sva( p )
                  ELSE
                     aapp = sva( p )
                  END IF
*
                  IF( aapp.GT.zero ) THEN
*
                     pskipped = 0
*
                     DO 2002 q = p + 1, min( igl+kbl-1, n )
*
                        aaqq = sva( q )
*
                        IF( aaqq.GT.zero ) THEN
*
*        AAPQ = ( A(:,p)^H * A(:,q) ) / ( AAPP*AAQQ ), evaluated in
*        an order (or through a scaled copy in WORK) chosen from
*        the sizes of AAPP and AAQQ relative to BIG and SMALL.
*        ROTOK records whether the two norms are close enough in
*        magnitude for the rotation branch.
                           aapp0 = aapp
                           IF( aaqq.GE.one ) THEN
                              rotok = ( small*aapp ).LE.aaqq
                              IF( aapp.LT.( big / aaqq ) ) THEN
                                 aapq = ( cdotc( m, a( 1, p ), 1,
     $                                   a( 1, q ), 1 ) / aaqq ) / aapp
                              ELSE
                                 CALL ccopy( m, a( 1, p ), 1,
     $                                        work, 1 )
                                 CALL clascl( 'G', 0, 0, aapp, one,
     $                                m, 1, work, lda, ierr )
                                 aapq = cdotc( m, work, 1,
     $                                   a( 1, q ), 1 ) / aaqq
                              END IF
                           ELSE
                              rotok = aapp.LE.( aaqq / small )
                              IF( aapp.GT.( small / aaqq ) ) THEN
                                 aapq = ( cdotc( m, a( 1, p ), 1,
     $                                    a( 1, q ), 1 ) / aapp ) / aaqq
                              ELSE
                                 CALL ccopy( m, a( 1, q ), 1,
     $                                        work, 1 )
                                 CALL clascl( 'G', 0, 0, aaqq,
     $                                         one, m, 1,
     $                                         work, lda, ierr )
                                 aapq = cdotc( m, a( 1, p ), 1,
     $                                   work, 1 ) / aapp
                              END IF
                           END IF
*
*                           AAPQ = AAPQ * CONJG( CWORK(p) ) * CWORK(q)
                           aapq1  = -abs(aapq)
                           mxaapq = max( mxaapq, -aapq1 )
*
*        TO rotate or NOT to rotate, THAT is the question ...
*
                           IF( abs( aapq1 ).GT.tol ) THEN
*        OMPQ is the unit-modulus phase of AAPQ. ABS(AAPQ) > TOL > 0
*        here, so the division is safe.
                              ompq = aapq / abs(aapq)
*
*           .. rotate
*[RTD]      ROTATED = ROTATED + ONE
*
                              IF( ir1.EQ.0 ) THEN
                                 notrot = 0
                                 pskipped = 0
                                 iswrot = iswrot + 1
                              END IF
*
                              IF( rotok ) THEN
*
                                 aqoap = aaqq / aapp
                                 apoaq = aapp / aaqq
                                 theta = -half*abs( aqoap-apoaq )/aapq1
*
                                 IF( abs( theta ).GT.bigtheta ) THEN
*
*                 .. very large |THETA|: take CS = 1 and use
*                    T = 1 / ( 2*THETA ) as the rotation parameter
                                    t  = half / theta
                                    cs = one
 
                                    CALL crot( m, a(1,p), 1, a(1,q), 1,
     $                                          cs, conjg(ompq)*t )
                                    IF ( rsvec ) THEN
                                        CALL crot( mvl, v(1,p), 1,
     $                                  v(1,q), 1, cs, conjg(ompq)*t )
                                    END IF
 
                                    sva( q ) = aaqq*sqrt( max( zero,
     $                                          one+t*apoaq*aapq1 ) )
                                    aapp = aapp*sqrt( max( zero,
     $                                          one-t*aqoap*aapq1 ) )
                                    mxsinj = max( mxsinj, abs( t ) )
*
                                 ELSE
*
*                 .. choose correct signum for THETA and rotate
*
                                    thsign = -sign( one, aapq1 )
                                    t = one / ( theta+thsign*
     $                                   sqrt( one+theta*theta ) )
                                    cs = sqrt( one / ( one+t*t ) )
                                    sn = t*cs
*
                                    mxsinj = max( mxsinj, abs( sn ) )
                                    sva( q ) = aaqq*sqrt( max( zero,
     $                                          one+t*apoaq*aapq1 ) )
                                    aapp = aapp*sqrt( max( zero,
     $                                      one-t*aqoap*aapq1 ) )
*
                                    CALL crot( m, a(1,p), 1, a(1,q), 1,
     $                                          cs, conjg(ompq)*sn )
                                    IF ( rsvec ) THEN
                                        CALL crot( mvl, v(1,p), 1,
     $                                  v(1,q), 1, cs, conjg(ompq)*sn )
                                    END IF
                                 END IF
                                 d(p) = -d(q) * ompq
*
                                 ELSE
*              .. have to use modified Gram-Schmidt like transformation
*                 (A(:,q) is replaced by A(:,q) minus AAPQ times the
*                 normalized A(:,p), computed on scaled columns;
*                 V is not touched in this branch)
                                 CALL ccopy( m, a( 1, p ), 1,
     $                                       work, 1 )
                                 CALL clascl( 'G', 0, 0, aapp, one, m,
     $                                        1, work, lda,
     $                                        ierr )
                                 CALL clascl( 'G', 0, 0, aaqq, one, m,
     $                                        1, a( 1, q ), lda, ierr )
                                 CALL caxpy( m, -aapq, work, 1,
     $                                       a( 1, q ), 1 )
                                 CALL clascl( 'G', 0, 0, one, aaqq, m,
     $                                        1, a( 1, q ), lda, ierr )
                                 sva( q ) = aaqq*sqrt( max( zero,
     $                                      one-aapq1*aapq1 ) )
                                 mxsinj = max( mxsinj, sfmin )
                              END IF
*           END IF ROTOK THEN ... ELSE
*
*           In the case of cancellation in updating SVA(q), SVA(p)
*           recompute SVA(q), SVA(p).
*
                              IF( ( sva( q ) / aaqq )**2.LE.rooteps )
     $                            THEN
                                 IF( ( aaqq.LT.rootbig ) .AND.
     $                               ( aaqq.GT.rootsfmin ) ) THEN
                                    sva( q ) = scnrm2( m, a( 1, q ), 1 )
                                 ELSE
                                    t = zero
                                    aaqq = one
                                    CALL classq( m, a( 1, q ), 1, t,
     $                                           aaqq )
                                    sva( q ) = t*sqrt( aaqq )
                                 END IF
                              END IF
*           NOTE(review): this test uses AAPP/AAPP0 unsquared, while
*           the corresponding test in the off-diagonal blocks below
*           squares the ratio. Kept as is.
                              IF( ( aapp / aapp0 ).LE.rooteps ) THEN
                                 IF( ( aapp.LT.rootbig ) .AND.
     $                               ( aapp.GT.rootsfmin ) ) THEN
                                    aapp = scnrm2( m, a( 1, p ), 1 )
                                 ELSE
                                    t = zero
                                    aapp = one
                                    CALL classq( m, a( 1, p ), 1, t,
     $                                           aapp )
                                    aapp = t*sqrt( aapp )
                                 END IF
                                 sva( p ) = aapp
                              END IF
*
                           ELSE
*        A(:,p) and A(:,q) already numerically orthogonal
                              IF( ir1.EQ.0 )notrot = notrot + 1
*[RTD]      SKIPPED  = SKIPPED  + 1
                              pskipped = pskipped + 1
                           END IF
                        ELSE
*        A(:,q) is zero column
                           IF( ir1.EQ.0 )notrot = notrot + 1
                           pskipped = pskipped + 1
                        END IF
*
*        Early exit from the q-loop; only possible while
*        i <= SWBAND (SWBAND is initialized to 0 above).
                        IF( ( i.LE.swband ) .AND.
     $                      ( pskipped.GT.rowskip ) ) THEN
                           IF( ir1.EQ.0 )aapp = -aapp
                           notrot = 0
                           GO TO 2103
                        END IF
*
 2002                CONTINUE
*     END q-LOOP
*
 2103                CONTINUE
*     bailed out of q-loop
*
                     sva( p ) = aapp
*
                  ELSE
*     Zero pivot column: count every pair of this row as not rotated.
                     sva( p ) = aapp
                     IF( ( ir1.EQ.0 ) .AND. ( aapp.EQ.zero ) )
     $                   notrot = notrot + min( igl+kbl-1, n ) - p
                  END IF
*
 2001          CONTINUE
*     end of the p-loop
*     end of doing the block ( ibr, ibr )
 1002       CONTINUE
*     end of ir1-loop
*
* ... go to the off diagonal blocks
*
            igl = ( ibr-1 )*kbl + 1
*
            DO 2010 jbc = ibr + 1, nbl
*
               jgl = ( jbc-1 )*kbl + 1
*
*        doing the block at ( ibr, jbc )
*
               ijblsk = 0
               DO 2100 p = igl, min( igl+kbl-1, n )
*
                  aapp = sva( p )
                  IF( aapp.GT.zero ) THEN
*
                     pskipped = 0
*
                     DO 2200 q = jgl, min( jgl+kbl-1, n )
*
                        aaqq = sva( q )
                        IF( aaqq.GT.zero ) THEN
                           aapp0 = aapp
*
*     .. M x 2 Jacobi SVD ..
*
*        Safe Gram matrix computation
*
*        Unlike in the diagonal tile, AAPP >= AAQQ is not assumed
*        here, so ROTOK is evaluated for either ordering.
                           IF( aaqq.GE.one ) THEN
                              IF( aapp.GE.aaqq ) THEN
                                 rotok = ( small*aapp ).LE.aaqq
                              ELSE
                                 rotok = ( small*aaqq ).LE.aapp
                              END IF
                              IF( aapp.LT.( big / aaqq ) ) THEN
                                 aapq = ( cdotc( m, a( 1, p ), 1,
     $                                  a( 1, q ), 1 ) / aaqq ) / aapp
                              ELSE
                                 CALL ccopy( m, a( 1, p ), 1,
     $                                       work, 1 )
                                 CALL clascl( 'G', 0, 0, aapp,
     $                                        one, m, 1,
     $                                        work, lda, ierr )
                                 aapq = cdotc( m, work, 1,
     $                                  a( 1, q ), 1 ) / aaqq
                              END IF
                           ELSE
                              IF( aapp.GE.aaqq ) THEN
                                 rotok = aapp.LE.( aaqq / small )
                              ELSE
                                 rotok = aaqq.LE.( aapp / small )
                              END IF
                              IF( aapp.GT.( small / aaqq ) ) THEN
                                 aapq = ( cdotc( m, a( 1, p ), 1,
     $                                 a( 1, q ), 1 ) / max(aaqq,aapp) )
     $                                               / min(aaqq,aapp)
                              ELSE
                                 CALL ccopy( m, a( 1, q ), 1,
     $                                       work, 1 )
                                 CALL clascl( 'G', 0, 0, aaqq,
     $                                        one, m, 1,
     $                                        work, lda, ierr )
                                 aapq = cdotc( m, a( 1, p ), 1,
     $                                  work, 1 ) / aapp
                              END IF
                           END IF
*
*                           AAPQ = AAPQ * CONJG(CWORK(p))*CWORK(q)
                           aapq1  = -abs(aapq)
                           mxaapq = max( mxaapq, -aapq1 )
*
*        TO rotate or NOT to rotate, THAT is the question ...
*
                           IF( abs( aapq1 ).GT.tol ) THEN
                              ompq = aapq / abs(aapq)
                              notrot = 0
*[RTD]      ROTATED  = ROTATED + 1
                              pskipped = 0
                              iswrot = iswrot + 1
*
                              IF( rotok ) THEN
*
                                 aqoap = aaqq / aapp
                                 apoaq = aapp / aaqq
                                 theta = -half*abs( aqoap-apoaq )/ aapq1
                                 IF( aaqq.GT.aapp0 )theta = -theta
*
                                 IF( abs( theta ).GT.bigtheta ) THEN
                                    t  = half / theta
                                    cs = one
                                    CALL crot( m, a(1,p), 1, a(1,q), 1,
     $                                          cs, conjg(ompq)*t )
                                    IF( rsvec ) THEN
                                        CALL crot( mvl, v(1,p), 1,
     $                                  v(1,q), 1, cs, conjg(ompq)*t )
                                    END IF
                                    sva( q ) = aaqq*sqrt( max( zero,
     $                                         one+t*apoaq*aapq1 ) )
                                    aapp = aapp*sqrt( max( zero,
     $                                     one-t*aqoap*aapq1 ) )
                                    mxsinj = max( mxsinj, abs( t ) )
                                 ELSE
*
*                 .. choose correct signum for THETA and rotate
*
                                    thsign = -sign( one, aapq1 )
                                    IF( aaqq.GT.aapp0 )thsign = -thsign
                                    t = one / ( theta+thsign*
     $                                  sqrt( one+theta*theta ) )
                                    cs = sqrt( one / ( one+t*t ) )
                                    sn = t*cs
                                    mxsinj = max( mxsinj, abs( sn ) )
                                    sva( q ) = aaqq*sqrt( max( zero,
     $                                         one+t*apoaq*aapq1 ) )
                                    aapp = aapp*sqrt( max( zero,
     $                                         one-t*aqoap*aapq1 ) )
*
                                    CALL crot( m, a(1,p), 1, a(1,q), 1,
     $                                          cs, conjg(ompq)*sn )
                                    IF( rsvec ) THEN
                                        CALL crot( mvl, v(1,p), 1,
     $                                  v(1,q), 1, cs, conjg(ompq)*sn )
                                    END IF
                                 END IF
                                 d(p) = -d(q) * ompq
*
                              ELSE
*              .. have to use modified Gram-Schmidt like transformation
*                 (the column with the smaller norm is the one that
*                 gets modified)
                               IF( aapp.GT.aaqq ) THEN
                                    CALL ccopy( m, a( 1, p ), 1,
     $                                          work, 1 )
                                    CALL clascl( 'G', 0, 0, aapp, one,
     $                                           m, 1, work,lda,
     $                                           ierr )
                                    CALL clascl( 'G', 0, 0, aaqq, one,
     $                                           m, 1, a( 1, q ), lda,
     $                                           ierr )
                                    CALL caxpy( m, -aapq, work,
     $                                          1, a( 1, q ), 1 )
                                    CALL clascl( 'G', 0, 0, one, aaqq,
     $                                           m, 1, a( 1, q ), lda,
     $                                           ierr )
                                    sva( q ) = aaqq*sqrt( max( zero,
     $                                         one-aapq1*aapq1 ) )
                                    mxsinj = max( mxsinj, sfmin )
                               ELSE
                                   CALL ccopy( m, a( 1, q ), 1,
     $                                          work, 1 )
                                    CALL clascl( 'G', 0, 0, aaqq, one,
     $                                           m, 1, work,lda,
     $                                           ierr )
                                    CALL clascl( 'G', 0, 0, aapp, one,
     $                                           m, 1, a( 1, p ), lda,
     $                                           ierr )
                                    CALL caxpy( m, -conjg(aapq),
     $                                   work, 1, a( 1, p ), 1 )
                                    CALL clascl( 'G', 0, 0, one, aapp,
     $                                           m, 1, a( 1, p ), lda,
     $                                           ierr )
                                    sva( p ) = aapp*sqrt( max( zero,
     $                                         one-aapq1*aapq1 ) )
                                    mxsinj = max( mxsinj, sfmin )
                               END IF
                              END IF
*           END IF ROTOK THEN ... ELSE
*
*           In the case of cancellation in updating SVA(q), SVA(p)
*           .. recompute SVA(q), SVA(p)
                              IF( ( sva( q ) / aaqq )**2.LE.rooteps )
     $                            THEN
                                 IF( ( aaqq.LT.rootbig ) .AND.
     $                               ( aaqq.GT.rootsfmin ) ) THEN
                                    sva( q ) = scnrm2( m, a( 1, q ), 1)
                                  ELSE
                                    t = zero
                                    aaqq = one
                                    CALL classq( m, a( 1, q ), 1, t,
     $                                           aaqq )
                                    sva( q ) = t*sqrt( aaqq )
                                 END IF
                              END IF
                              IF( ( aapp / aapp0 )**2.LE.rooteps ) THEN
                                 IF( ( aapp.LT.rootbig ) .AND.
     $                               ( aapp.GT.rootsfmin ) ) THEN
                                    aapp = scnrm2( m, a( 1, p ), 1 )
                                 ELSE
                                    t = zero
                                    aapp = one
                                    CALL classq( m, a( 1, p ), 1, t,
     $                                           aapp )
                                    aapp = t*sqrt( aapp )
                                 END IF
                                 sva( p ) = aapp
                              END IF
*              end of OK rotation
                           ELSE
                              notrot = notrot + 1
*[RTD]      SKIPPED  = SKIPPED  + 1
                              pskipped = pskipped + 1
                              ijblsk = ijblsk + 1
                           END IF
                        ELSE
                           notrot = notrot + 1
                           pskipped = pskipped + 1
                           ijblsk = ijblsk + 1
                        END IF
*
*        Early exits: leave the whole jbc-loop once BLSKIP pairs of
*        this block were skipped, or leave the q-loop once more than
*        ROWSKIP consecutive pairs were skipped. Both are only
*        possible while i <= SWBAND.
                        IF( ( i.LE.swband ) .AND. ( ijblsk.GE.blskip ) )
     $                      THEN
                           sva( p ) = aapp
                           notrot = 0
                           GO TO 2011
                        END IF
                        IF( ( i.LE.swband ) .AND.
     $                      ( pskipped.GT.rowskip ) ) THEN
                           aapp = -aapp
                           notrot = 0
                           GO TO 2203
                        END IF
*
 2200                CONTINUE
*        end of the q-loop
 2203                CONTINUE
*
                     sva( p ) = aapp
*
                  ELSE
*
                     IF( aapp.EQ.zero )notrot = notrot +
     $                   min( jgl+kbl-1, n ) - jgl + 1
                     IF( aapp.LT.zero )notrot = 0
*
                  END IF
*
 2100          CONTINUE
*     end of the p-loop
 2010       CONTINUE
*     end of the jbc-loop
 2011       CONTINUE
*2011 bailed out of the jbc-loop
*     Undo the sign flips that the early exits above use as markers.
            DO 2012 p = igl, min( igl+kbl-1, n )
               sva( p ) = abs( sva( p ) )
 2012       CONTINUE
***
 2000    CONTINUE
*2000 :: end of the ibr-loop
*
*     .. update SVA(N)
*     (the diagonal-tile p-loop stops at N-1, so the last column norm
*     is refreshed here)
         IF( ( sva( n ).LT.rootbig ) .AND. ( sva( n ).GT.rootsfmin ) )
     $       THEN
            sva( n ) = scnrm2( m, a( 1, n ), 1 )
         ELSE
            t = zero
            aapp = one
            CALL classq( m, a( 1, n ), 1, t, aapp )
            sva( n ) = t*sqrt( aapp )
         END IF
*
*     Additional steering devices
*
         IF( ( i.LT.swband ) .AND. ( ( mxaapq.LE.roottol ) .OR.
     $       ( iswrot.LE.n ) ) )swband = i
*
*     Stopping test 1: all normalized inner products and rotation
*     sizes of this sweep are small relative to TOL.
         IF( ( i.GT.swband+1 ) .AND. ( mxaapq.LT.sqrt( real( n ) )*
     $       tol ) .AND. ( real( n )*mxaapq*mxsinj.LT.tol ) ) THEN
            GO TO 1994
         END IF
*
*     Stopping test 2: NOTROT has reached the number of pivot pairs.
         IF( notrot.GE.emptsw )GO TO 1994
*
 1993 CONTINUE
*     end i=1:NSWEEP loop
*
* #:( Reaching this point means that the procedure has not converged.
*     Note that this yields INFO = 0 for NSWEEP = 1 and INFO = -1 for
*     NSWEEP = 0; kept unchanged for compatibility with callers.
      info = nsweep - 1
      GO TO 1995
*
 1994 CONTINUE
* #:) Reaching this point means numerical convergence after the i-th
*     sweep.
*
      info = 0
* #:) INFO = 0 confirms successful iterations.
 1995 CONTINUE
*
*     Sort the vector SVA() of column norms.
*     (selection by largest remaining entry, i.e. nonincreasing
*     order; D and the columns of A and V are permuted the same way)
      DO 5991 p = 1, n - 1
         q = isamax( n-p+1, sva( p ), 1 ) + p - 1
         IF( p.NE.q ) THEN
            temp1 = sva( p )
            sva( p ) = sva( q )
            sva( q ) = temp1
            aapq = d( p )
            d( p ) = d( q )
            d( q ) = aapq
            CALL cswap( m, a( 1, p ), 1, a( 1, q ), 1 )
            IF( rsvec )CALL cswap( mvl, v( 1, p ), 1, v( 1, q ), 1 )
         END IF
 5991 CONTINUE
*
      RETURN
*     ..
*     .. END OF CGSVJ0
*     ..

◆ cgsvj1()

subroutine cgsvj1	(	character*1	jobv,
		integer	m,
		integer	n,
		integer	n1,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( n )	d,
		real, dimension( n )	sva,
		integer	mv,
		complex, dimension( ldv, * )	v,
		integer	ldv,
		real	eps,
		real	sfmin,
		real	tol,
		integer	nsweep,
		complex, dimension( lwork )	work,
		integer	lwork,
		integer	info )

CGSVJ1 pre-processor for the routine cgesvj, applies Jacobi rotations targeting only particular pivots.

Download CGSVJ1 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CGSVJ1 is called from CGESVJ as a pre-processor and that is its main
!> purpose. It applies Jacobi rotations in the same way as CGESVJ does, but
!> it targets only particular pivots and it does not check convergence
!> (stopping criterion). A few tuning parameters (marked by [TP]) are
!> available for the implementer.
!>
!> Further Details
!> ~~~~~~~~~~~~~~~
!> CGSVJ1 applies a few sweeps of Jacobi rotations in the column space of
!> the input M-by-N matrix A. The pivot pairs are taken from the (1,2)
!> off-diagonal block in the corresponding N-by-N Gram matrix A^H * A. The
!> block-entries (tiles) of the (1,2) off-diagonal block are marked by the
!> [x]'s in the following scheme:
!>
!>    | *  *  * [x] [x] [x]|
!>    | *  *  * [x] [x] [x]|    Row-cycling in the nblr-by-nblc [x] blocks.
!>    | *  *  * [x] [x] [x]|    Row-cyclic pivoting inside each [x] block.
!>    |[x] [x] [x] *  *  * |
!>    |[x] [x] [x] *  *  * |
!>    |[x] [x] [x] *  *  * |
!>
!> In terms of the columns of A, the first N1 columns are rotated 'against'
!> the remaining N-N1 columns, trying to increase the angle between the
!> corresponding subspaces. The off-diagonal block is N1-by-(N-N1) and it is
!> tiled using quadratic tiles of side KBL. Here, KBL is a tuning parameter.
!> The number of sweeps is given in NSWEEP and the orthogonality threshold
!> is given in TOL.
!>

Parameters

[in]	JOBV	!> JOBV is CHARACTER*1 !> Specifies whether the output from this procedure is used !> to compute the matrix V: !> = 'V': the product of the Jacobi rotations is accumulated !> by postmultiplying the N-by-N array V. !> (See the description of V.) !> = 'A': the product of the Jacobi rotations is accumulated !> by postmultiplying the MV-by-N array V. !> (See the descriptions of MV and V.) !> = 'N': the Jacobi rotations are not accumulated. !>
[in]	M	!> M is INTEGER !> The number of rows of the input matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the input matrix A. !> M >= N >= 0. !>
[in]	N1	!> N1 is INTEGER !> N1 specifies the 2 x 2 block partition, the first N1 columns are !> rotated 'against' the remaining N-N1 columns of A. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, M-by-N matrix A, such that A*diag(D) represents !> the input matrix. !> On exit, !> A_onexit*diag(D_onexit) represents the input matrix A*diag(D) !> post-multiplied by a sequence of Jacobi rotations, where the !> rotation threshold and the total number of sweeps are given in !> TOL and NSWEEP, respectively. !> (See the descriptions of N1, D, TOL and NSWEEP.) !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[in,out]	D	!> D is COMPLEX array, dimension (N) !> The array D accumulates the scaling factors from the fast scaled !> Jacobi rotations. !> On entry, A*diag(D) represents the input matrix. !> On exit, A_onexit*diag(D_onexit) represents the input matrix !> post-multiplied by a sequence of Jacobi rotations, where the !> rotation threshold and the total number of sweeps are given in !> TOL and NSWEEP, respectively. !> (See the descriptions of N1, A, TOL and NSWEEP.) !>
[in,out]	SVA	!> SVA is REAL array, dimension (N) !> On entry, SVA contains the Euclidean norms of the columns of !> the matrix A*diag(D). !> On exit, SVA contains the Euclidean norms of the columns of !> the matrix A_onexit*diag(D_onexit). !>
[in]	MV	!> MV is INTEGER !> If JOBV = 'A', then MV rows of V are post-multiplied by a !> sequence of Jacobi rotations. !> If JOBV = 'N', then MV is not referenced. !>
[in,out]	V	!> V is COMPLEX array, dimension (LDV,N) !> If JOBV = 'V' then N rows of V are post-multiplied by a !> sequence of Jacobi rotations. !> If JOBV = 'A' then MV rows of V are post-multiplied by a !> sequence of Jacobi rotations. !> If JOBV = 'N', then V is not referenced. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of the array V, LDV >= 1. !> If JOBV = 'V', LDV >= N. !> If JOBV = 'A', LDV >= MV. !>
[in]	EPS	!> EPS is REAL !> EPS = SLAMCH('Epsilon') !>
[in]	SFMIN	!> SFMIN is REAL !> SFMIN = SLAMCH('Safe Minimum') !>
[in]	TOL	!> TOL is REAL !> TOL is the threshold for Jacobi rotations. For a pair !> A(:,p), A(:,q) of pivot columns, the Jacobi rotation is !> applied only if ABS(COS(angle(A(:,p),A(:,q)))) > TOL. !>
[in]	NSWEEP	!> NSWEEP is INTEGER !> NSWEEP is the number of sweeps of Jacobi rotations to be !> performed. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (LWORK) !>
[in]	LWORK	!> LWORK is INTEGER !> LWORK is the dimension of WORK. LWORK >= M. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, then the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributor:: Zlatko Drmac (Zagreb, Croatia)

Definition at line 234 of file cgsvj1.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Summary of the body below:
*    1. validate the arguments and report the first bad one via XERBLA;
*    2. run at most NSWEEP sweeps of Jacobi rotations over the pivot
*       pairs (p,q) with 1 <= p <= N1 < q <= N, updating the columns
*       of A, the column norms SVA and, when JOBV = 'V' or 'A', the
*       columns of V;
*    3. sort SVA and apply the same permutation to D and to the
*       columns of A and V.
*
*     .. Scalar Arguments ..
      REAL               EPS, SFMIN, TOL
      INTEGER            INFO, LDA, LDV, LWORK, M, MV, N, N1, NSWEEP
      CHARACTER*1        JOBV
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), D( N ), V( LDV, * ), WORK( LWORK )
      REAL               SVA( N )
*     ..
*
*  =====================================================================
*
*     .. Local Parameters ..
      REAL               ZERO, HALF, ONE
      parameter( zero = 0.0e0, half = 0.5e0, one = 1.0e0)
*     ..
*     .. Local Scalars ..
      COMPLEX            AAPQ, OMPQ
      REAL               AAPP, AAPP0, AAPQ1, AAQQ, APOAQ, AQOAP, BIG,
     $                   BIGTHETA, CS, MXAAPQ, MXSINJ, ROOTBIG,
     $                   ROOTEPS, ROOTSFMIN, ROOTTOL, SMALL, SN, T,
     $                   TEMP1, THETA, THSIGN
      INTEGER            BLSKIP, EMPTSW, i, ibr, igl, IERR, IJBLSK,
     $                   ISWROT, jbc, jgl, KBL, MVL, NOTROT, nblc, nblr,
     $                   p, PSKIPPED, q, ROWSKIP, SWBAND
      LOGICAL            APPLV, ROTOK, RSVEC
*     ..
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, conjg, real, min, sign, sqrt
*     ..
*     .. External Functions ..
      REAL               SCNRM2
      COMPLEX            CDOTC
      INTEGER            ISAMAX
      LOGICAL            LSAME
      EXTERNAL           isamax, lsame, cdotc, scnrm2
*     ..
*     .. External Subroutines ..
*     .. from BLAS
      EXTERNAL           ccopy, crot, cswap, caxpy
*     .. from LAPACK
      EXTERNAL           clascl, classq, xerbla
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
*     INFO = -k flags the k-th argument of the CGSVJ1 argument list
*     (JOBV=1, M=2, N=3, N1=4, LDA=6, MV=9, LDV=11, TOL=14, NSWEEP=15,
*     LWORK=17). Only the first failing test is reported.
*
      applv = lsame( jobv, 'A' )
      rsvec = lsame( jobv, 'V' )
      IF( .NOT.( rsvec .OR. applv .OR. lsame( jobv, 'N' ) ) ) THEN
         info = -1
      ELSE IF( m.LT.0 ) THEN
         info = -2
      ELSE IF( ( n.LT.0 ) .OR. ( n.GT.m ) ) THEN
         info = -3
      ELSE IF( n1.LT.0 ) THEN
         info = -4
      ELSE IF( lda.LT.m ) THEN
         info = -6
      ELSE IF( ( rsvec.OR.applv ) .AND. ( mv.LT.0 ) ) THEN
         info = -9
      ELSE IF( ( rsvec.AND.( ldv.LT.n ) ).OR.
     $         ( applv.AND.( ldv.LT.mv ) )  ) THEN
         info = -11
      ELSE IF( tol.LE.eps ) THEN
         info = -14
      ELSE IF( nsweep.LT.0 ) THEN
         info = -15
      ELSE IF( lwork.LT.m ) THEN
         info = -17
      ELSE
         info = 0
      END IF
*
*     #:( Invalid argument: pass its position to XERBLA and return.
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CGSVJ1', -info )
         RETURN
      END IF
*
*     MVL is the number of rows of V that are rotated: N for
*     JOBV = 'V', MV for JOBV = 'A'. It is not set for JOBV = 'N' and
*     is only read below when RSVEC is true.
*
      IF( rsvec ) THEN
         mvl = n
      ELSE IF( applv ) THEN
         mvl = mv
      END IF
*     From here on RSVEC means "apply the rotations to V as well".
      rsvec = rsvec .OR. applv
 
*     Thresholds derived from EPS, SFMIN and TOL, used below to guard
*     the scaled dot products, the rotation formulas and the norm
*     recomputation.
      rooteps = sqrt( eps )
      rootsfmin = sqrt( sfmin )
      small = sfmin / eps
      big = one / sfmin
      rootbig = one / rootsfmin
*     LARGE = BIG / SQRT( REAL( M*N ) )
      bigtheta = one / rooteps
      roottol = sqrt( tol )
*
*     .. Initialize the right singular vector matrix ..
*
*     RSVEC = LSAME( JOBV, 'Y' )
*
*     EMPTSW = N1*(N-N1) is compared against NOTROT after every sweep;
*     the iteration stops once NOTROT reaches it.
      emptsw = n1*( n-n1 )
      notrot = 0
*
*     .. Row-cyclic pivot strategy with de Rijk's pivoting ..
*
*     KBL is the tile size; NBLR and NBLC are the numbers of tiles
*     needed to cover the first N1 and the remaining N-N1 columns
*     (rounded up).
*     NOTE(review): KBL is 0 when N = 0, which makes N1 / KBL a
*     division by zero - presumably callers never pass N = 0; confirm.
      kbl = min( 8, n )
      nblr = n1 / kbl
      IF( ( nblr*kbl ).NE.n1 )nblr = nblr + 1
 
*     .. the tiling is nblr-by-nblc [tiles]
 
      nblc = ( n-n1 ) / kbl
      IF( ( nblc*kbl ).NE.( n-n1 ) )nblc = nblc + 1
      blskip = ( kbl**2 ) + 1
*[TP] BLSKIP is a tuning parameter that depends on SWBAND and KBL.
 
      rowskip = min( 5, kbl )
*[TP] ROWSKIP is a tuning parameter.
      swband = 0
*[TP] SWBAND is a tuning parameter. It is meaningful and effective
*     if CGESVJ is used as a computational routine in the preconditioned
*     Jacobi SVD algorithm CGEJSV.
*
*
*     | *   *   * [x] [x] [x]|
*     | *   *   * [x] [x] [x]|    Row-cycling in the nblr-by-nblc [x] blocks.
*     | *   *   * [x] [x] [x]|    Row-cyclic pivoting inside each [x] block.
*     |[x] [x] [x] *   *   * |
*     |[x] [x] [x] *   *   * |
*     |[x] [x] [x] *   *   * |
*
*
      DO 1993 i = 1, nsweep
*
*     .. go go go ...
*
*     Per-sweep statistics: MXAAPQ = largest |AAPQ| seen, MXSINJ =
*     largest rotation sine (or |T|) applied, ISWROT = number of pivot
*     pairs that passed the TOL test in this sweep.
*
         mxaapq = zero
         mxsinj = zero
         iswrot = 0
*
         notrot = 0
         pskipped = 0
*
*     Each sweep is unrolled using KBL-by-KBL tiles over the pivot pairs
*     1 <= p < q <= N. This is the first step toward a blocked implementation
*     of the rotations. New implementation, based on block transformations,
*     is under development.
*
         DO 2000 ibr = 1, nblr
*
            igl = ( ibr-1 )*kbl + 1
*
 
*
* ... go to the off diagonal blocks
*
            igl = ( ibr-1 )*kbl + 1
*
*            DO 2010 jbc = ibr + 1, NBL
            DO 2010 jbc = 1, nblc
*
               jgl = ( jbc-1 )*kbl + n1 + 1
*
*        doing the block at ( ibr, jbc )
*
               ijblsk = 0
               DO 2100 p = igl, min( igl+kbl-1, n1 )
*
                  aapp = sva( p )
                  IF( aapp.GT.zero ) THEN
*
                     pskipped = 0
*
                     DO 2200 q = jgl, min( jgl+kbl-1, n )
*
                        aaqq = sva( q )
                        IF( aaqq.GT.zero ) THEN
                           aapp0 = aapp
*
*     .. M x 2 Jacobi SVD ..
*
*        Safe Gram matrix computation
*
*        AAPQ is the dot product of columns p and q divided by both
*        column norms. ROTOK records whether the two norms are within
*        a factor 1/SMALL of each other. When the direct quotient is
*        not used, one column is first copied to WORK and scaled by
*        CLASCL.
*
                           IF( aaqq.GE.one ) THEN
                              IF( aapp.GE.aaqq ) THEN
                                 rotok = ( small*aapp ).LE.aaqq
                              ELSE
                                 rotok = ( small*aaqq ).LE.aapp
                              END IF
                              IF( aapp.LT.( big / aaqq ) ) THEN
                                 aapq = ( cdotc( m, a( 1, p ), 1,
     $                                  a( 1, q ), 1 ) / aaqq ) / aapp
                              ELSE
                                 CALL ccopy( m, a( 1, p ), 1,
     $                                       work, 1 )
                                 CALL clascl( 'G', 0, 0, aapp,
     $                                        one, m, 1,
     $                                        work, lda, ierr )
                                 aapq = cdotc( m, work, 1,
     $                                  a( 1, q ), 1 ) / aaqq
                              END IF
                           ELSE
                              IF( aapp.GE.aaqq ) THEN
                                 rotok = aapp.LE.( aaqq / small )
                              ELSE
                                 rotok = aaqq.LE.( aapp / small )
                              END IF
                              IF( aapp.GT.( small / aaqq ) ) THEN
                                 aapq = ( cdotc( m, a( 1, p ), 1,
     $                                 a( 1, q ), 1 ) / max(aaqq,aapp) )
     $                                               / min(aaqq,aapp)
                              ELSE
                                 CALL ccopy( m, a( 1, q ), 1,
     $                                       work, 1 )
                                 CALL clascl( 'G', 0, 0, aaqq,
     $                                        one, m, 1,
     $                                        work, lda, ierr )
                                 aapq = cdotc( m, a( 1, p ), 1,
     $                                  work, 1 ) / aapp
                              END IF
                           END IF
*
*                           AAPQ = AAPQ * CONJG(CWORK(p))*CWORK(q)
*        AAPQ1 = -|AAPQ| is real and never positive.
                           aapq1  = -abs(aapq)
                           mxaapq = max( mxaapq, -aapq1 )
*
*        TO rotate or NOT to rotate, THAT is the question ...
*
                           IF( abs( aapq1 ).GT.tol ) THEN
*        OMPQ is the unit-modulus phase AAPQ / |AAPQ|.
                              ompq = aapq / abs(aapq)
                              notrot = 0
*[RTD]      ROTATED  = ROTATED + 1
                              pskipped = 0
                              iswrot = iswrot + 1
*
                              IF( rotok ) THEN
*
                                 aqoap = aaqq / aapp
                                 apoaq = aapp / aaqq
                                 theta = -half*abs( aqoap-apoaq )/ aapq1
                                 IF( aaqq.GT.aapp0 )theta = -theta
*
*        For |THETA| > BIGTHETA the rotation is applied with CS = ONE
*        and T = HALF / THETA in place of the sine.
*
                                 IF( abs( theta ).GT.bigtheta ) THEN
                                    t  = half / theta
                                    cs = one
                                    CALL crot( m, a(1,p), 1, a(1,q), 1,
     $                                          cs, conjg(ompq)*t )
                                    IF( rsvec ) THEN
                                        CALL crot( mvl, v(1,p), 1,
     $                                  v(1,q), 1, cs, conjg(ompq)*t )
                                    END IF
                                    sva( q ) = aaqq*sqrt( max( zero,
     $                                         one+t*apoaq*aapq1 ) )
                                    aapp = aapp*sqrt( max( zero,
     $                                     one-t*aqoap*aapq1 ) )
                                    mxsinj = max( mxsinj, abs( t ) )
                                 ELSE
*
*                 .. choose correct signum for THETA and rotate
*
                                    thsign = -sign( one, aapq1 )
                                    IF( aaqq.GT.aapp0 )thsign = -thsign
                                    t = one / ( theta+thsign*
     $                                  sqrt( one+theta*theta ) )
                                    cs = sqrt( one / ( one+t*t ) )
                                    sn = t*cs
                                    mxsinj = max( mxsinj, abs( sn ) )
                                    sva( q ) = aaqq*sqrt( max( zero,
     $                                         one+t*apoaq*aapq1 ) )
                                    aapp = aapp*sqrt( max( zero,
     $                                         one-t*aqoap*aapq1 ) )
*
                                    CALL crot( m, a(1,p), 1, a(1,q), 1,
     $                                          cs, conjg(ompq)*sn )
                                    IF( rsvec ) THEN
                                        CALL crot( mvl, v(1,p), 1,
     $                                  v(1,q), 1, cs, conjg(ompq)*sn )
                                    END IF
                                 END IF
                                 d(p) = -d(q) * ompq
*
                              ELSE
*              .. have to use modified Gram-Schmidt like transformation
*              The column with the smaller norm is updated in place:
*              the larger-norm column is copied to WORK and scaled,
*              then CAXPY subtracts AAPQ (or its conjugate) times WORK
*              between a down-scaling and an up-scaling by CLASCL.
                               IF( aapp.GT.aaqq ) THEN
                                    CALL ccopy( m, a( 1, p ), 1,
     $                                          work, 1 )
                                    CALL clascl( 'G', 0, 0, aapp, one,
     $                                           m, 1, work,lda,
     $                                           ierr )
                                    CALL clascl( 'G', 0, 0, aaqq, one,
     $                                           m, 1, a( 1, q ), lda,
     $                                           ierr )
                                    CALL caxpy( m, -aapq, work,
     $                                          1, a( 1, q ), 1 )
                                    CALL clascl( 'G', 0, 0, one, aaqq,
     $                                           m, 1, a( 1, q ), lda,
     $                                           ierr )
                                    sva( q ) = aaqq*sqrt( max( zero,
     $                                         one-aapq1*aapq1 ) )
                                    mxsinj = max( mxsinj, sfmin )
                               ELSE
                                   CALL ccopy( m, a( 1, q ), 1,
     $                                          work, 1 )
                                    CALL clascl( 'G', 0, 0, aaqq, one,
     $                                           m, 1, work,lda,
     $                                           ierr )
                                    CALL clascl( 'G', 0, 0, aapp, one,
     $                                           m, 1, a( 1, p ), lda,
     $                                           ierr )
                                    CALL caxpy( m, -conjg(aapq),
     $                                   work, 1, a( 1, p ), 1 )
                                    CALL clascl( 'G', 0, 0, one, aapp,
     $                                           m, 1, a( 1, p ), lda,
     $                                           ierr )
                                    sva( p ) = aapp*sqrt( max( zero,
     $                                         one-aapq1*aapq1 ) )
                                    mxsinj = max( mxsinj, sfmin )
                               END IF
                              END IF
*           END IF ROTOK THEN ... ELSE
*
*           In the case of cancellation in updating SVA(q), SVA(p)
*           .. recompute SVA(q), SVA(p)
*           The norm is recomputed with SCNRM2 when the old value lies
*           strictly between ROOTSFMIN and ROOTBIG, otherwise with
*           CLASSQ (scale T, sum of squares) as T*SQRT(sum).
                              IF( ( sva( q ) / aaqq )**2.LE.rooteps )
     $                            THEN
                                 IF( ( aaqq.LT.rootbig ) .AND.
     $                               ( aaqq.GT.rootsfmin ) ) THEN
                                    sva( q ) = scnrm2( m, a( 1, q ), 1)
                                  ELSE
                                    t = zero
                                    aaqq = one
                                    CALL classq( m, a( 1, q ), 1, t,
     $                                           aaqq )
                                    sva( q ) = t*sqrt( aaqq )
                                 END IF
                              END IF
                              IF( ( aapp / aapp0 )**2.LE.rooteps ) THEN
                                 IF( ( aapp.LT.rootbig ) .AND.
     $                               ( aapp.GT.rootsfmin ) ) THEN
                                    aapp = scnrm2( m, a( 1, p ), 1 )
                                 ELSE
                                    t = zero
                                    aapp = one
                                    CALL classq( m, a( 1, p ), 1, t,
     $                                           aapp )
                                    aapp = t*sqrt( aapp )
                                 END IF
                                 sva( p ) = aapp
                              END IF
*              end of OK rotation
                           ELSE
*              |AAPQ| <= TOL: the pair is counted as not rotated.
                              notrot = notrot + 1
*[RTD]      SKIPPED  = SKIPPED  + 1
                              pskipped = pskipped + 1
                              ijblsk = ijblsk + 1
                           END IF
                        ELSE
*           SVA(q) is not positive: the pair is counted as not rotated.
                           notrot = notrot + 1
                           pskipped = pskipped + 1
                           ijblsk = ijblsk + 1
                        END IF
*
*        Early exits from the block (GO TO 2011) or from the q-loop
*        (GO TO 2203). Both require I.LE.SWBAND; with SWBAND = 0 as
*        set above and I starting at 1 that condition never holds, so
*        these exits are inactive with the current tuning.
*        In the second exit the negated AAPP is stored into SVA(p) at
*        label 2203 and its sign is removed again by loop 2012.
*
                        IF( ( i.LE.swband ) .AND. ( ijblsk.GE.blskip ) )
     $                      THEN
                           sva( p ) = aapp
                           notrot = 0
                           GO TO 2011
                        END IF
                        IF( ( i.LE.swband ) .AND.
     $                      ( pskipped.GT.rowskip ) ) THEN
                           aapp = -aapp
                           notrot = 0
                           GO TO 2203
                        END IF
*
 2200                CONTINUE
*        end of the q-loop
 2203                CONTINUE
*
                     sva( p ) = aapp
*
                  ELSE
*
*        SVA(p) is not positive: if it is zero, every pair of this
*        row of the block is counted as not rotated; if it is
*        negative, NOTROT is reset.
*
                     IF( aapp.EQ.zero )notrot = notrot +
     $                   min( jgl+kbl-1, n ) - jgl + 1
                     IF( aapp.LT.zero )notrot = 0
*
                  END IF
*
 2100          CONTINUE
*     end of the p-loop
 2010       CONTINUE
*     end of the jbc-loop
 2011       CONTINUE
*2011 bailed out of the jbc-loop
            DO 2012 p = igl, min( igl+kbl-1, n )
               sva( p ) = abs( sva( p ) )
 2012       CONTINUE
***
 2000    CONTINUE
*2000 :: end of the ibr-loop
*
*     .. update SVA(N)
         IF( ( sva( n ).LT.rootbig ) .AND. ( sva( n ).GT.rootsfmin ) )
     $       THEN
            sva( n ) = scnrm2( m, a( 1, n ), 1 )
         ELSE
            t = zero
            aapp = one
            CALL classq( m, a( 1, n ), 1, t, aapp )
            sva( n ) = t*sqrt( aapp )
         END IF
*
*     Additional steering devices
*
         IF( ( i.LT.swband ) .AND. ( ( mxaapq.LE.roottol ) .OR.
     $       ( iswrot.LE.n ) ) )swband = i
*
*     Convergence test on the largest |AAPQ| and the largest rotation
*     sine seen in this sweep.
*
         IF( ( i.GT.swband+1 ) .AND. ( mxaapq.LT.sqrt( real( n ) )*
     $       tol ) .AND. ( real( n )*mxaapq*mxsinj.LT.tol ) ) THEN
            GO TO 1994
         END IF
*
         IF( notrot.GE.emptsw )GO TO 1994
*
 1993 CONTINUE
*     end i=1:NSWEEP loop
*
* #:( Reaching this point means that the procedure has not converged.
*     INFO is set to NSWEEP - 1 in that case.
*     NOTE(review): for NSWEEP = 1 this evaluates to 0, the same value
*     as the converged exit below, and for NSWEEP = 0 to -1 - confirm
*     that callers do not rely on INFO for those sweep counts.
      info = nsweep - 1
      GO TO 1995
*
 1994 CONTINUE
* #:) Reaching this point means numerical convergence after the i-th
*     sweep.
*
      info = 0
* #:) INFO = 0 confirms successful iterations.
 1995 CONTINUE
*
*     Sort the vector SVA() of column norms.
*     Selection sort: for each p, q is the position ISAMAX returns
*     for SVA(p:N), shifted to a global index; SVA, D, the columns of
*     A and (if RSVEC) the first MVL rows of the columns of V are
*     swapped together.
      DO 5991 p = 1, n - 1
         q = isamax( n-p+1, sva( p ), 1 ) + p - 1
         IF( p.NE.q ) THEN
            temp1 = sva( p )
            sva( p ) = sva( q )
            sva( q ) = temp1
            aapq = d( p )
            d( p ) = d( q )
            d( q ) = aapq
            CALL cswap( m, a( 1, p ), 1, a( 1, q ), 1 )
            IF( rsvec )CALL cswap( mvl, v( 1, p ), 1, v( 1, q ), 1 )
         END IF
 5991 CONTINUE
*
*
      RETURN
*     ..
*     .. END OF CGSVJ1
*     ..

◆ chbgst()

subroutine chbgst	(	character	vect,
		character	uplo,
		integer	n,
		integer	ka,
		integer	kb,
		complex, dimension( ldab, * )	ab,
		integer	ldab,
		complex, dimension( ldbb, * )	bb,
		integer	ldbb,
		complex, dimension( ldx, * )	x,
		integer	ldx,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CHBGST

Download CHBGST + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CHBGST reduces a complex Hermitian-definite banded generalized
!> eigenproblem  A*x = lambda*B*x  to standard form  C*y = lambda*y,
!> such that C has the same bandwidth as A.
!>
!> B must have been previously factorized as S**H*S by CPBSTF, using a
!> split Cholesky factorization. A is overwritten by C = X**H*A*X, where
!> X = S**(-1)*Q and Q is a unitary matrix chosen to preserve the
!> bandwidth of A.
!>

Parameters

[in]	VECT	!> VECT is CHARACTER*1 !> = 'N': do not form the transformation matrix X; !> = 'V': form X. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrices A and B. N >= 0. !>
[in]	KA	!> KA is INTEGER !> The number of superdiagonals of the matrix A if UPLO = 'U', !> or the number of subdiagonals if UPLO = 'L'. KA >= 0. !>
[in]	KB	!> KB is INTEGER !> The number of superdiagonals of the matrix B if UPLO = 'U', !> or the number of subdiagonals if UPLO = 'L'. KA >= KB >= 0. !>
[in,out]	AB	!> AB is COMPLEX array, dimension (LDAB,N) !> On entry, the upper or lower triangle of the Hermitian band !> matrix A, stored in the first ka+1 rows of the array. The !> j-th column of A is stored in the j-th column of the array AB !> as follows: !> if UPLO = 'U', AB(ka+1+i-j,j) = A(i,j) for max(1,j-ka)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+ka). !> !> On exit, the transformed matrix X**H*A*X, stored in the same !> format as A. !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KA+1. !>
[in]	BB	!> BB is COMPLEX array, dimension (LDBB,N) !> The banded factor S from the split Cholesky factorization of !> B, as returned by CPBSTF, stored in the first kb+1 rows of !> the array. !>
[in]	LDBB	!> LDBB is INTEGER !> The leading dimension of the array BB. LDBB >= KB+1. !>
[out]	X	!> X is COMPLEX array, dimension (LDX,N) !> If VECT = 'V', the n-by-n matrix X. !> If VECT = 'N', the array X is not referenced. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the array X. !> LDX >= max(1,N) if VECT = 'V'; LDX >= 1 otherwise. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 163 of file chbgst.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO, VECT
      INTEGER            INFO, KA, KB, LDAB, LDBB, LDX, N
*     ..
*     .. Array Arguments ..
      REAL               RWORK( * )
      COMPLEX            AB( LDAB, * ), BB( LDBB, * ), WORK( * ),
     $                   X( LDX, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CZERO, CONE
      REAL               ONE
      parameter( czero = ( 0.0e+0, 0.0e+0 ),
     $                   cone = ( 1.0e+0, 0.0e+0 ), one = 1.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPDATE, UPPER, WANTX
      INTEGER            I, I0, I1, I2, INCA, J, J1, J1T, J2, J2T, K,
     $                   KA1, KB1, KBT, L, M, NR, NRT, NX
      REAL               BII
      COMPLEX            RA, RA1, T
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgerc, cgeru, clacgv, clar2v, clargv, clartg,
     $                   clartv, claset, crot, csscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max, min, real
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters
*
      wantx = lsame( vect, 'V' )
      upper = lsame( uplo, 'U' )
      ka1 = ka + 1
      kb1 = kb + 1
      info = 0
      IF( .NOT.wantx .AND. .NOT.lsame( vect, 'N' ) ) THEN
         info = -1
      ELSE IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( ka.LT.0 ) THEN
         info = -4
      ELSE IF( kb.LT.0 .OR. kb.GT.ka ) THEN
         info = -5
      ELSE IF( ldab.LT.ka+1 ) THEN
         info = -7
      ELSE IF( ldbb.LT.kb+1 ) THEN
         info = -9
      ELSE IF( ldx.LT.1 .OR. wantx .AND. ldx.LT.max( 1, n ) ) THEN
         info = -11
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CHBGST', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
      inca = ldab*ka1
*
*     Initialize X to the unit matrix, if needed
*
      IF( wantx )
     $   CALL claset( 'Full', n, n, czero, cone, x, ldx )
*
*     Set M to the splitting point m. It must be the same value as is
*     used in CPBSTF. The chosen value allows the arrays WORK and RWORK
*     to be of dimension (N).
*
      m = ( n+kb ) / 2
*
*     The routine works in two phases, corresponding to the two halves
*     of the split Cholesky factorization of B as S**H*S where
*
*     S = ( U    )
*         ( M  L )
*
*     with U upper triangular of order m, and L lower triangular of
*     order n-m. S has the same bandwidth as B.
*
*     S is treated as a product of elementary matrices:
*
*     S = S(m)*S(m-1)*...*S(2)*S(1)*S(m+1)*S(m+2)*...*S(n-1)*S(n)
*
*     where S(i) is determined by the i-th row of S.
*
*     In phase 1, the index i takes the values n, n-1, ... , m+1;
*     in phase 2, it takes the values 1, 2, ... , m.
*
*     For each value of i, the current matrix A is updated by forming
*     inv(S(i))**H*A*inv(S(i)). This creates a triangular bulge outside
*     the band of A. The bulge is then pushed down toward the bottom of
*     A in phase 1, and up toward the top of A in phase 2, by applying
*     plane rotations.
*
*     There are kb*(kb+1)/2 elements in the bulge, but at most 2*kb-1
*     of them are linearly independent, so annihilating a bulge requires
*     only 2*kb-1 plane rotations. The rotations are divided into a 1st
*     set of kb-1 rotations, and a 2nd set of kb rotations.
*
*     Wherever possible, rotations are generated and applied in vector
*     operations of length NR between the indices J1 and J2 (sometimes
*     replaced by modified values NRT, J1T or J2T).
*
*     The real cosines and complex sines of the rotations are stored in
*     the arrays RWORK and WORK, those of the 1st set in elements
*     2:m-kb-1, and those of the 2nd set in elements m-kb+1:n.
*
*     The bulges are not formed explicitly; nonzero elements outside the
*     band are created only when they are required for generating new
*     rotations; they are stored in the array WORK, in positions where
*     they are later overwritten by the sines of the rotations which
*     annihilate them.
*
*     **************************** Phase 1 *****************************
*
*     The logical structure of this phase is:
*
*     UPDATE = .TRUE.
*     DO I = N, M + 1, -1
*        use S(i) to update A and create a new bulge
*        apply rotations to push all bulges KA positions downward
*     END DO
*     UPDATE = .FALSE.
*     DO I = M + KA + 1, N - 1
*        apply rotations to push all bulges KA positions downward
*     END DO
*
*     To avoid duplicating code, the two loops are merged.
*
      update = .true.
      i = n + 1
   10 CONTINUE
      IF( update ) THEN
         i = i - 1
         kbt = min( kb, i-1 )
         i0 = i - 1
         i1 = min( n, i+ka )
         i2 = i - kbt + ka1
         IF( i.LT.m+1 ) THEN
            update = .false.
            i = i + 1
            i0 = m
            IF( ka.EQ.0 )
     $         GO TO 480
            GO TO 10
         END IF
      ELSE
         i = i + ka
         IF( i.GT.n-1 )
     $      GO TO 480
      END IF
*
      IF( upper ) THEN
*
*        Transform A, working with the upper triangle
*
         IF( update ) THEN
*
*           Form  inv(S(i))**H * A * inv(S(i))
*
            bii = real( bb( kb1, i ) )
            ab( ka1, i ) = ( real( ab( ka1, i ) ) / bii ) / bii
            DO 20 j = i + 1, i1
               ab( i-j+ka1, j ) = ab( i-j+ka1, j ) / bii
   20       CONTINUE
            DO 30 j = max( 1, i-ka ), i - 1
               ab( j-i+ka1, i ) = ab( j-i+ka1, i ) / bii
   30       CONTINUE
            DO 60 k = i - kbt, i - 1
               DO 40 j = i - kbt, k
                  ab( j-k+ka1, k ) = ab( j-k+ka1, k ) -
     $                               bb( j-i+kb1, i )*
     $                               conjg( ab( k-i+ka1, i ) ) -
     $                               conjg( bb( k-i+kb1, i ) )*
     $                               ab( j-i+ka1, i ) +
     $                               real( ab( ka1, i ) )*
     $                               bb( j-i+kb1, i )*
     $                               conjg( bb( k-i+kb1, i ) )
   40          CONTINUE
               DO 50 j = max( 1, i-ka ), i - kbt - 1
                  ab( j-k+ka1, k ) = ab( j-k+ka1, k ) -
     $                               conjg( bb( k-i+kb1, i ) )*
     $                               ab( j-i+ka1, i )
   50          CONTINUE
   60       CONTINUE
            DO 80 j = i, i1
               DO 70 k = max( j-ka, i-kbt ), i - 1
                  ab( k-j+ka1, j ) = ab( k-j+ka1, j ) -
     $                               bb( k-i+kb1, i )*ab( i-j+ka1, j )
   70          CONTINUE
   80       CONTINUE
*
            IF( wantx ) THEN
*
*              post-multiply X by inv(S(i))
*
               CALL csscal( n-m, one / bii, x( m+1, i ), 1 )
               IF( kbt.GT.0 )
     $            CALL cgerc( n-m, kbt, -cone, x( m+1, i ), 1,
     $                        bb( kb1-kbt, i ), 1, x( m+1, i-kbt ),
     $                        ldx )
            END IF
*
*           store a(i,i1) in RA1 for use in next loop over K
*
            ra1 = ab( i-i1+ka1, i1 )
         END IF
*
*        Generate and apply vectors of rotations to chase all the
*        existing bulges KA positions down toward the bottom of the
*        band
*
         DO 130 k = 1, kb - 1
            IF( update ) THEN
*
*              Determine the rotations which would annihilate the bulge
*              which has in theory just been created
*
               IF( i-k+ka.LT.n .AND. i-k.GT.1 ) THEN
*
*                 generate rotation to annihilate a(i,i-k+ka+1)
*
                  CALL clartg( ab( k+1, i-k+ka ), ra1,
     $                         rwork( i-k+ka-m ), work( i-k+ka-m ), ra )
*
*                 create nonzero element a(i-k,i-k+ka+1) outside the
*                 band and store it in WORK(i-k)
*
                  t = -bb( kb1-k, i )*ra1
                  work( i-k ) = rwork( i-k+ka-m )*t -
     $                          conjg( work( i-k+ka-m ) )*
     $                          ab( 1, i-k+ka )
                  ab( 1, i-k+ka ) = work( i-k+ka-m )*t +
     $                              rwork( i-k+ka-m )*ab( 1, i-k+ka )
                  ra1 = ra
               END IF
            END IF
            j2 = i - k - 1 + max( 1, k-i0+2 )*ka1
            nr = ( n-j2+ka ) / ka1
            j1 = j2 + ( nr-1 )*ka1
            IF( update ) THEN
               j2t = max( j2, i+2*ka-k+1 )
            ELSE
               j2t = j2
            END IF
            nrt = ( n-j2t+ka ) / ka1
            DO 90 j = j2t, j1, ka1
*
*              create nonzero element a(j-ka,j+1) outside the band
*              and store it in WORK(j-m)
*
               work( j-m ) = work( j-m )*ab( 1, j+1 )
               ab( 1, j+1 ) = rwork( j-m )*ab( 1, j+1 )
   90       CONTINUE
*
*           generate rotations in 1st set to annihilate elements which
*           have been created outside the band
*
            IF( nrt.GT.0 )
     $         CALL clargv( nrt, ab( 1, j2t ), inca, work( j2t-m ), ka1,
     $                      rwork( j2t-m ), ka1 )
            IF( nr.GT.0 ) THEN
*
*              apply rotations in 1st set from the right
*
               DO 100 l = 1, ka - 1
                  CALL clartv( nr, ab( ka1-l, j2 ), inca,
     $                         ab( ka-l, j2+1 ), inca, rwork( j2-m ),
     $                         work( j2-m ), ka1 )
  100          CONTINUE
*
*              apply rotations in 1st set from both sides to diagonal
*              blocks
*
               CALL clar2v( nr, ab( ka1, j2 ), ab( ka1, j2+1 ),
     $                      ab( ka, j2+1 ), inca, rwork( j2-m ),
     $                      work( j2-m ), ka1 )
*
               CALL clacgv( nr, work( j2-m ), ka1 )
            END IF
*
*           start applying rotations in 1st set from the left
*
            DO 110 l = ka - 1, kb - k + 1, -1
               nrt = ( n-j2+l ) / ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( l, j2+ka1-l ), inca,
     $                         ab( l+1, j2+ka1-l ), inca, rwork( j2-m ),
     $                         work( j2-m ), ka1 )
  110       CONTINUE
*
            IF( wantx ) THEN
*
*              post-multiply X by product of rotations in 1st set
*
               DO 120 j = j2, j1, ka1
                  CALL crot( n-m, x( m+1, j ), 1, x( m+1, j+1 ), 1,
     $                       rwork( j-m ), conjg( work( j-m ) ) )
  120          CONTINUE
            END IF
  130    CONTINUE
*
         IF( update ) THEN
            IF( i2.LE.n .AND. kbt.GT.0 ) THEN
*
*              create nonzero element a(i-kbt,i-kbt+ka+1) outside the
*              band and store it in WORK(i-kbt)
*
               work( i-kbt ) = -bb( kb1-kbt, i )*ra1
            END IF
         END IF
*
         DO 170 k = kb, 1, -1
            IF( update ) THEN
               j2 = i - k - 1 + max( 2, k-i0+1 )*ka1
            ELSE
               j2 = i - k - 1 + max( 1, k-i0+1 )*ka1
            END IF
*
*           finish applying rotations in 2nd set from the left
*
            DO 140 l = kb - k, 1, -1
               nrt = ( n-j2+ka+l ) / ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( l, j2-l+1 ), inca,
     $                         ab( l+1, j2-l+1 ), inca, rwork( j2-ka ),
     $                         work( j2-ka ), ka1 )
  140       CONTINUE
            nr = ( n-j2+ka ) / ka1
            j1 = j2 + ( nr-1 )*ka1
            DO 150 j = j1, j2, -ka1
               work( j ) = work( j-ka )
               rwork( j ) = rwork( j-ka )
  150       CONTINUE
            DO 160 j = j2, j1, ka1
*
*              create nonzero element a(j-ka,j+1) outside the band
*              and store it in WORK(j)
*
               work( j ) = work( j )*ab( 1, j+1 )
               ab( 1, j+1 ) = rwork( j )*ab( 1, j+1 )
  160       CONTINUE
            IF( update ) THEN
               IF( i-k.LT.n-ka .AND. k.LE.kbt )
     $            work( i-k+ka ) = work( i-k )
            END IF
  170    CONTINUE
*
         DO 210 k = kb, 1, -1
            j2 = i - k - 1 + max( 1, k-i0+1 )*ka1
            nr = ( n-j2+ka ) / ka1
            j1 = j2 + ( nr-1 )*ka1
            IF( nr.GT.0 ) THEN
*
*              generate rotations in 2nd set to annihilate elements
*              which have been created outside the band
*
               CALL clargv( nr, ab( 1, j2 ), inca, work( j2 ), ka1,
     $                      rwork( j2 ), ka1 )
*
*              apply rotations in 2nd set from the right
*
               DO 180 l = 1, ka - 1
                  CALL clartv( nr, ab( ka1-l, j2 ), inca,
     $                         ab( ka-l, j2+1 ), inca, rwork( j2 ),
     $                         work( j2 ), ka1 )
  180          CONTINUE
*
*              apply rotations in 2nd set from both sides to diagonal
*              blocks
*
               CALL clar2v( nr, ab( ka1, j2 ), ab( ka1, j2+1 ),
     $                      ab( ka, j2+1 ), inca, rwork( j2 ),
     $                      work( j2 ), ka1 )
*
               CALL clacgv( nr, work( j2 ), ka1 )
            END IF
*
*           start applying rotations in 2nd set from the left
*
            DO 190 l = ka - 1, kb - k + 1, -1
               nrt = ( n-j2+l ) / ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( l, j2+ka1-l ), inca,
     $                         ab( l+1, j2+ka1-l ), inca, rwork( j2 ),
     $                         work( j2 ), ka1 )
  190       CONTINUE
*
            IF( wantx ) THEN
*
*              post-multiply X by product of rotations in 2nd set
*
               DO 200 j = j2, j1, ka1
                  CALL crot( n-m, x( m+1, j ), 1, x( m+1, j+1 ), 1,
     $                       rwork( j ), conjg( work( j ) ) )
  200          CONTINUE
            END IF
  210    CONTINUE
*
         DO 230 k = 1, kb - 1
            j2 = i - k - 1 + max( 1, k-i0+2 )*ka1
*
*           finish applying rotations in 1st set from the left
*
            DO 220 l = kb - k, 1, -1
               nrt = ( n-j2+l ) / ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( l, j2+ka1-l ), inca,
     $                         ab( l+1, j2+ka1-l ), inca, rwork( j2-m ),
     $                         work( j2-m ), ka1 )
  220       CONTINUE
  230    CONTINUE
*
         IF( kb.GT.1 ) THEN
            DO 240 j = n - 1, j2 + ka, -1
               rwork( j-m ) = rwork( j-ka-m )
               work( j-m ) = work( j-ka-m )
  240       CONTINUE
         END IF
*
      ELSE
*
*        Transform A, working with the lower triangle
*
         IF( update ) THEN
*
*           Form  inv(S(i))**H * A * inv(S(i))
*
            bii = real( bb( 1, i ) )
            ab( 1, i ) = ( real( ab( 1, i ) ) / bii ) / bii
            DO 250 j = i + 1, i1
               ab( j-i+1, i ) = ab( j-i+1, i ) / bii
  250       CONTINUE
            DO 260 j = max( 1, i-ka ), i - 1
               ab( i-j+1, j ) = ab( i-j+1, j ) / bii
  260       CONTINUE
            DO 290 k = i - kbt, i - 1
               DO 270 j = i - kbt, k
                  ab( k-j+1, j ) = ab( k-j+1, j ) -
     $                             bb( i-j+1, j )*conjg( ab( i-k+1,
     $                             k ) ) - conjg( bb( i-k+1, k ) )*
     $                             ab( i-j+1, j ) + real( ab( 1, i ) )*
     $                             bb( i-j+1, j )*conjg( bb( i-k+1,
     $                             k ) )
  270          CONTINUE
               DO 280 j = max( 1, i-ka ), i - kbt - 1
                  ab( k-j+1, j ) = ab( k-j+1, j ) -
     $                             conjg( bb( i-k+1, k ) )*
     $                             ab( i-j+1, j )
  280          CONTINUE
  290       CONTINUE
            DO 310 j = i, i1
               DO 300 k = max( j-ka, i-kbt ), i - 1
                  ab( j-k+1, k ) = ab( j-k+1, k ) -
     $                             bb( i-k+1, k )*ab( j-i+1, i )
  300          CONTINUE
  310       CONTINUE
*
            IF( wantx ) THEN
*
*              post-multiply X by inv(S(i))
*
               CALL csscal( n-m, one / bii, x( m+1, i ), 1 )
               IF( kbt.GT.0 )
     $            CALL cgeru( n-m, kbt, -cone, x( m+1, i ), 1,
     $                        bb( kbt+1, i-kbt ), ldbb-1,
     $                        x( m+1, i-kbt ), ldx )
            END IF
*
*           store a(i1,i) in RA1 for use in next loop over K
*
            ra1 = ab( i1-i+1, i )
         END IF
*
*        Generate and apply vectors of rotations to chase all the
*        existing bulges KA positions down toward the bottom of the
*        band
*
         DO 360 k = 1, kb - 1
            IF( update ) THEN
*
*              Determine the rotations which would annihilate the bulge
*              which has in theory just been created
*
               IF( i-k+ka.LT.n .AND. i-k.GT.1 ) THEN
*
*                 generate rotation to annihilate a(i-k+ka+1,i)
*
                  CALL clartg( ab( ka1-k, i ), ra1, rwork( i-k+ka-m ),
     $                         work( i-k+ka-m ), ra )
*
*                 create nonzero element a(i-k+ka+1,i-k) outside the
*                 band and store it in WORK(i-k)
*
                  t = -bb( k+1, i-k )*ra1
                  work( i-k ) = rwork( i-k+ka-m )*t -
     $                          conjg( work( i-k+ka-m ) )*ab( ka1, i-k )
                  ab( ka1, i-k ) = work( i-k+ka-m )*t +
     $                             rwork( i-k+ka-m )*ab( ka1, i-k )
                  ra1 = ra
               END IF
            END IF
            j2 = i - k - 1 + max( 1, k-i0+2 )*ka1
            nr = ( n-j2+ka ) / ka1
            j1 = j2 + ( nr-1 )*ka1
            IF( update ) THEN
               j2t = max( j2, i+2*ka-k+1 )
            ELSE
               j2t = j2
            END IF
            nrt = ( n-j2t+ka ) / ka1
            DO 320 j = j2t, j1, ka1
*
*              create nonzero element a(j+1,j-ka) outside the band
*              and store it in WORK(j-m)
*
               work( j-m ) = work( j-m )*ab( ka1, j-ka+1 )
               ab( ka1, j-ka+1 ) = rwork( j-m )*ab( ka1, j-ka+1 )
  320       CONTINUE
*
*           generate rotations in 1st set to annihilate elements which
*           have been created outside the band
*
            IF( nrt.GT.0 )
     $         CALL clargv( nrt, ab( ka1, j2t-ka ), inca, work( j2t-m ),
     $                      ka1, rwork( j2t-m ), ka1 )
            IF( nr.GT.0 ) THEN
*
*              apply rotations in 1st set from the left
*
               DO 330 l = 1, ka - 1
                  CALL clartv( nr, ab( l+1, j2-l ), inca,
     $                         ab( l+2, j2-l ), inca, rwork( j2-m ),
     $                         work( j2-m ), ka1 )
  330          CONTINUE
*
*              apply rotations in 1st set from both sides to diagonal
*              blocks
*
               CALL clar2v( nr, ab( 1, j2 ), ab( 1, j2+1 ), ab( 2, j2 ),
     $                      inca, rwork( j2-m ), work( j2-m ), ka1 )
*
               CALL clacgv( nr, work( j2-m ), ka1 )
            END IF
*
*           start applying rotations in 1st set from the right
*
            DO 340 l = ka - 1, kb - k + 1, -1
               nrt = ( n-j2+l ) / ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( ka1-l+1, j2 ), inca,
     $                         ab( ka1-l, j2+1 ), inca, rwork( j2-m ),
     $                         work( j2-m ), ka1 )
  340       CONTINUE
*
            IF( wantx ) THEN
*
*              post-multiply X by product of rotations in 1st set
*
               DO 350 j = j2, j1, ka1
                  CALL crot( n-m, x( m+1, j ), 1, x( m+1, j+1 ), 1,
     $                       rwork( j-m ), work( j-m ) )
  350          CONTINUE
            END IF
  360    CONTINUE
*
         IF( update ) THEN
            IF( i2.LE.n .AND. kbt.GT.0 ) THEN
*
*              create nonzero element a(i-kbt+ka+1,i-kbt) outside the
*              band and store it in WORK(i-kbt)
*
               work( i-kbt ) = -bb( kbt+1, i-kbt )*ra1
            END IF
         END IF
*
         DO 400 k = kb, 1, -1
            IF( update ) THEN
               j2 = i - k - 1 + max( 2, k-i0+1 )*ka1
            ELSE
               j2 = i - k - 1 + max( 1, k-i0+1 )*ka1
            END IF
*
*           finish applying rotations in 2nd set from the right
*
            DO 370 l = kb - k, 1, -1
               nrt = ( n-j2+ka+l ) / ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( ka1-l+1, j2-ka ), inca,
     $                         ab( ka1-l, j2-ka+1 ), inca,
     $                         rwork( j2-ka ), work( j2-ka ), ka1 )
  370       CONTINUE
            nr = ( n-j2+ka ) / ka1
            j1 = j2 + ( nr-1 )*ka1
            DO 380 j = j1, j2, -ka1
               work( j ) = work( j-ka )
               rwork( j ) = rwork( j-ka )
  380       CONTINUE
            DO 390 j = j2, j1, ka1
*
*              create nonzero element a(j+1,j-ka) outside the band
*              and store it in WORK(j)
*
               work( j ) = work( j )*ab( ka1, j-ka+1 )
               ab( ka1, j-ka+1 ) = rwork( j )*ab( ka1, j-ka+1 )
  390       CONTINUE
            IF( update ) THEN
               IF( i-k.LT.n-ka .AND. k.LE.kbt )
     $            work( i-k+ka ) = work( i-k )
            END IF
  400    CONTINUE
*
         DO 440 k = kb, 1, -1
            j2 = i - k - 1 + max( 1, k-i0+1 )*ka1
            nr = ( n-j2+ka ) / ka1
            j1 = j2 + ( nr-1 )*ka1
            IF( nr.GT.0 ) THEN
*
*              generate rotations in 2nd set to annihilate elements
*              which have been created outside the band
*
               CALL clargv( nr, ab( ka1, j2-ka ), inca, work( j2 ), ka1,
     $                      rwork( j2 ), ka1 )
*
*              apply rotations in 2nd set from the left
*
               DO 410 l = 1, ka - 1
                  CALL clartv( nr, ab( l+1, j2-l ), inca,
     $                         ab( l+2, j2-l ), inca, rwork( j2 ),
     $                         work( j2 ), ka1 )
  410          CONTINUE
*
*              apply rotations in 2nd set from both sides to diagonal
*              blocks
*
               CALL clar2v( nr, ab( 1, j2 ), ab( 1, j2+1 ), ab( 2, j2 ),
     $                      inca, rwork( j2 ), work( j2 ), ka1 )
*
               CALL clacgv( nr, work( j2 ), ka1 )
            END IF
*
*           start applying rotations in 2nd set from the right
*
            DO 420 l = ka - 1, kb - k + 1, -1
               nrt = ( n-j2+l ) / ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( ka1-l+1, j2 ), inca,
     $                         ab( ka1-l, j2+1 ), inca, rwork( j2 ),
     $                         work( j2 ), ka1 )
  420       CONTINUE
*
            IF( wantx ) THEN
*
*              post-multiply X by product of rotations in 2nd set
*
               DO 430 j = j2, j1, ka1
                  CALL crot( n-m, x( m+1, j ), 1, x( m+1, j+1 ), 1,
     $                       rwork( j ), work( j ) )
  430          CONTINUE
            END IF
  440    CONTINUE
*
         DO 460 k = 1, kb - 1
            j2 = i - k - 1 + max( 1, k-i0+2 )*ka1
*
*           finish applying rotations in 1st set from the right
*
            DO 450 l = kb - k, 1, -1
               nrt = ( n-j2+l ) / ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( ka1-l+1, j2 ), inca,
     $                         ab( ka1-l, j2+1 ), inca, rwork( j2-m ),
     $                         work( j2-m ), ka1 )
  450       CONTINUE
  460    CONTINUE
*
         IF( kb.GT.1 ) THEN
            DO 470 j = n - 1, j2 + ka, -1
               rwork( j-m ) = rwork( j-ka-m )
               work( j-m ) = work( j-ka-m )
  470       CONTINUE
         END IF
*
      END IF
*
      GO TO 10
*
  480 CONTINUE
*
*     **************************** Phase 2 *****************************
*
*     The logical structure of this phase is:
*
*     UPDATE = .TRUE.
*     DO I = 1, M
*        use S(i) to update A and create a new bulge
*        apply rotations to push all bulges KA positions upward
*     END DO
*     UPDATE = .FALSE.
*     DO I = M - KA - 1, 2, -1
*        apply rotations to push all bulges KA positions upward
*     END DO
*
*     To avoid duplicating code, the two loops are merged.
*
      update = .true.
      i = 0
  490 CONTINUE
      IF( update ) THEN
         i = i + 1
         kbt = min( kb, m-i )
         i0 = i + 1
         i1 = max( 1, i-ka )
         i2 = i + kbt - ka1
         IF( i.GT.m ) THEN
            update = .false.
            i = i - 1
            i0 = m + 1
            IF( ka.EQ.0 )
     $         RETURN
            GO TO 490
         END IF
      ELSE
         i = i - ka
         IF( i.LT.2 )
     $      RETURN
      END IF
*
      IF( i.LT.m-kbt ) THEN
         nx = m
      ELSE
         nx = n
      END IF
*
      IF( upper ) THEN
*
*        Transform A, working with the upper triangle
*
         IF( update ) THEN
*
*           Form  inv(S(i))**H * A * inv(S(i))
*
            bii = real( bb( kb1, i ) )
            ab( ka1, i ) = ( real( ab( ka1, i ) ) / bii ) / bii
            DO 500 j = i1, i - 1
               ab( j-i+ka1, i ) = ab( j-i+ka1, i ) / bii
  500       CONTINUE
            DO 510 j = i + 1, min( n, i+ka )
               ab( i-j+ka1, j ) = ab( i-j+ka1, j ) / bii
  510       CONTINUE
            DO 540 k = i + 1, i + kbt
               DO 520 j = k, i + kbt
                  ab( k-j+ka1, j ) = ab( k-j+ka1, j ) -
     $                               bb( i-j+kb1, j )*
     $                               conjg( ab( i-k+ka1, k ) ) -
     $                               conjg( bb( i-k+kb1, k ) )*
     $                               ab( i-j+ka1, j ) +
     $                               real( ab( ka1, i ) )*
     $                               bb( i-j+kb1, j )*
     $                               conjg( bb( i-k+kb1, k ) )
  520          CONTINUE
               DO 530 j = i + kbt + 1, min( n, i+ka )
                  ab( k-j+ka1, j ) = ab( k-j+ka1, j ) -
     $                               conjg( bb( i-k+kb1, k ) )*
     $                               ab( i-j+ka1, j )
  530          CONTINUE
  540       CONTINUE
            DO 560 j = i1, i
               DO 550 k = i + 1, min( j+ka, i+kbt )
                  ab( j-k+ka1, k ) = ab( j-k+ka1, k ) -
     $                               bb( i-k+kb1, k )*ab( j-i+ka1, i )
  550          CONTINUE
  560       CONTINUE
*
            IF( wantx ) THEN
*
*              post-multiply X by inv(S(i))
*
               CALL csscal( nx, one / bii, x( 1, i ), 1 )
               IF( kbt.GT.0 )
     $            CALL cgeru( nx, kbt, -cone, x( 1, i ), 1,
     $                        bb( kb, i+1 ), ldbb-1, x( 1, i+1 ), ldx )
            END IF
*
*           store a(i1,i) in RA1 for use in next loop over K
*
            ra1 = ab( i1-i+ka1, i )
         END IF
*
*        Generate and apply vectors of rotations to chase all the
*        existing bulges KA positions up toward the top of the band
*
         DO 610 k = 1, kb - 1
            IF( update ) THEN
*
*              Determine the rotations which would annihilate the bulge
*              which has in theory just been created
*
               IF( i+k-ka1.GT.0 .AND. i+k.LT.m ) THEN
*
*                 generate rotation to annihilate a(i+k-ka-1,i)
*
                  CALL clartg( ab( k+1, i ), ra1, rwork( i+k-ka ),
     $                         work( i+k-ka ), ra )
*
*                 create nonzero element a(i+k-ka-1,i+k) outside the
*                 band and store it in WORK(m-kb+i+k)
*
                  t = -bb( kb1-k, i+k )*ra1
                  work( m-kb+i+k ) = rwork( i+k-ka )*t -
     $                               conjg( work( i+k-ka ) )*
     $                               ab( 1, i+k )
                  ab( 1, i+k ) = work( i+k-ka )*t +
     $                           rwork( i+k-ka )*ab( 1, i+k )
                  ra1 = ra
               END IF
            END IF
            j2 = i + k + 1 - max( 1, k+i0-m+1 )*ka1
            nr = ( j2+ka-1 ) / ka1
            j1 = j2 - ( nr-1 )*ka1
            IF( update ) THEN
               j2t = min( j2, i-2*ka+k-1 )
            ELSE
               j2t = j2
            END IF
            nrt = ( j2t+ka-1 ) / ka1
            DO 570 j = j1, j2t, ka1
*
*              create nonzero element a(j-1,j+ka) outside the band
*              and store it in WORK(j)
*
               work( j ) = work( j )*ab( 1, j+ka-1 )
               ab( 1, j+ka-1 ) = rwork( j )*ab( 1, j+ka-1 )
  570       CONTINUE
*
*           generate rotations in 1st set to annihilate elements which
*           have been created outside the band
*
            IF( nrt.GT.0 )
     $         CALL clargv( nrt, ab( 1, j1+ka ), inca, work( j1 ), ka1,
     $                      rwork( j1 ), ka1 )
            IF( nr.GT.0 ) THEN
*
*              apply rotations in 1st set from the left
*
               DO 580 l = 1, ka - 1
                  CALL clartv( nr, ab( ka1-l, j1+l ), inca,
     $                         ab( ka-l, j1+l ), inca, rwork( j1 ),
     $                         work( j1 ), ka1 )
  580          CONTINUE
*
*              apply rotations in 1st set from both sides to diagonal
*              blocks
*
               CALL clar2v( nr, ab( ka1, j1 ), ab( ka1, j1-1 ),
     $                      ab( ka, j1 ), inca, rwork( j1 ), work( j1 ),
     $                      ka1 )
*
               CALL clacgv( nr, work( j1 ), ka1 )
            END IF
*
*           start applying rotations in 1st set from the right
*
            DO 590 l = ka - 1, kb - k + 1, -1
               nrt = ( j2+l-1 ) / ka1
               j1t = j2 - ( nrt-1 )*ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( l, j1t ), inca,
     $                         ab( l+1, j1t-1 ), inca, rwork( j1t ),
     $                         work( j1t ), ka1 )
  590       CONTINUE
*
            IF( wantx ) THEN
*
*              post-multiply X by product of rotations in 1st set
*
               DO 600 j = j1, j2, ka1
                  CALL crot( nx, x( 1, j ), 1, x( 1, j-1 ), 1,
     $                       rwork( j ), work( j ) )
  600          CONTINUE
            END IF
  610    CONTINUE
*
         IF( update ) THEN
            IF( i2.GT.0 .AND. kbt.GT.0 ) THEN
*
*              create nonzero element a(i+kbt-ka-1,i+kbt) outside the
*              band and store it in WORK(m-kb+i+kbt)
*
               work( m-kb+i+kbt ) = -bb( kb1-kbt, i+kbt )*ra1
            END IF
         END IF
*
         DO 650 k = kb, 1, -1
            IF( update ) THEN
               j2 = i + k + 1 - max( 2, k+i0-m )*ka1
            ELSE
               j2 = i + k + 1 - max( 1, k+i0-m )*ka1
            END IF
*
*           finish applying rotations in 2nd set from the right
*
            DO 620 l = kb - k, 1, -1
               nrt = ( j2+ka+l-1 ) / ka1
               j1t = j2 - ( nrt-1 )*ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( l, j1t+ka ), inca,
     $                         ab( l+1, j1t+ka-1 ), inca,
     $                         rwork( m-kb+j1t+ka ),
     $                         work( m-kb+j1t+ka ), ka1 )
  620       CONTINUE
            nr = ( j2+ka-1 ) / ka1
            j1 = j2 - ( nr-1 )*ka1
            DO 630 j = j1, j2, ka1
               work( m-kb+j ) = work( m-kb+j+ka )
               rwork( m-kb+j ) = rwork( m-kb+j+ka )
  630       CONTINUE
            DO 640 j = j1, j2, ka1
*
*              create nonzero element a(j-1,j+ka) outside the band
*              and store it in WORK(m-kb+j)
*
               work( m-kb+j ) = work( m-kb+j )*ab( 1, j+ka-1 )
               ab( 1, j+ka-1 ) = rwork( m-kb+j )*ab( 1, j+ka-1 )
  640       CONTINUE
            IF( update ) THEN
               IF( i+k.GT.ka1 .AND. k.LE.kbt )
     $            work( m-kb+i+k-ka ) = work( m-kb+i+k )
            END IF
  650    CONTINUE
*
         DO 690 k = kb, 1, -1
            j2 = i + k + 1 - max( 1, k+i0-m )*ka1
            nr = ( j2+ka-1 ) / ka1
            j1 = j2 - ( nr-1 )*ka1
            IF( nr.GT.0 ) THEN
*
*              generate rotations in 2nd set to annihilate elements
*              which have been created outside the band
*
               CALL clargv( nr, ab( 1, j1+ka ), inca, work( m-kb+j1 ),
     $                      ka1, rwork( m-kb+j1 ), ka1 )
*
*              apply rotations in 2nd set from the left
*
               DO 660 l = 1, ka - 1
                  CALL clartv( nr, ab( ka1-l, j1+l ), inca,
     $                         ab( ka-l, j1+l ), inca, rwork( m-kb+j1 ),
     $                         work( m-kb+j1 ), ka1 )
  660          CONTINUE
*
*              apply rotations in 2nd set from both sides to diagonal
*              blocks
*
               CALL clar2v( nr, ab( ka1, j1 ), ab( ka1, j1-1 ),
     $                      ab( ka, j1 ), inca, rwork( m-kb+j1 ),
     $                      work( m-kb+j1 ), ka1 )
*
               CALL clacgv( nr, work( m-kb+j1 ), ka1 )
            END IF
*
*           start applying rotations in 2nd set from the right
*
            DO 670 l = ka - 1, kb - k + 1, -1
               nrt = ( j2+l-1 ) / ka1
               j1t = j2 - ( nrt-1 )*ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( l, j1t ), inca,
     $                         ab( l+1, j1t-1 ), inca,
     $                         rwork( m-kb+j1t ), work( m-kb+j1t ),
     $                         ka1 )
  670       CONTINUE
*
            IF( wantx ) THEN
*
*              post-multiply X by product of rotations in 2nd set
*
               DO 680 j = j1, j2, ka1
                  CALL crot( nx, x( 1, j ), 1, x( 1, j-1 ), 1,
     $                       rwork( m-kb+j ), work( m-kb+j ) )
  680          CONTINUE
            END IF
  690    CONTINUE
*
         DO 710 k = 1, kb - 1
            j2 = i + k + 1 - max( 1, k+i0-m+1 )*ka1
*
*           finish applying rotations in 1st set from the right
*
            DO 700 l = kb - k, 1, -1
               nrt = ( j2+l-1 ) / ka1
               j1t = j2 - ( nrt-1 )*ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( l, j1t ), inca,
     $                         ab( l+1, j1t-1 ), inca, rwork( j1t ),
     $                         work( j1t ), ka1 )
  700       CONTINUE
  710    CONTINUE
*
         IF( kb.GT.1 ) THEN
            DO 720 j = 2, i2 - ka
               rwork( j ) = rwork( j+ka )
               work( j ) = work( j+ka )
  720       CONTINUE
         END IF
*
      ELSE
*
*        Transform A, working with the lower triangle
*
         IF( update ) THEN
*
*           Form  inv(S(i))**H * A * inv(S(i))
*
            bii = real( bb( 1, i ) )
            ab( 1, i ) = ( real( ab( 1, i ) ) / bii ) / bii
            DO 730 j = i1, i - 1
               ab( i-j+1, j ) = ab( i-j+1, j ) / bii
  730       CONTINUE
            DO 740 j = i + 1, min( n, i+ka )
               ab( j-i+1, i ) = ab( j-i+1, i ) / bii
  740       CONTINUE
            DO 770 k = i + 1, i + kbt
               DO 750 j = k, i + kbt
                  ab( j-k+1, k ) = ab( j-k+1, k ) -
     $                             bb( j-i+1, i )*conjg( ab( k-i+1,
     $                             i ) ) - conjg( bb( k-i+1, i ) )*
     $                             ab( j-i+1, i ) + real( ab( 1, i ) )*
     $                             bb( j-i+1, i )*conjg( bb( k-i+1,
     $                             i ) )
  750          CONTINUE
               DO 760 j = i + kbt + 1, min( n, i+ka )
                  ab( j-k+1, k ) = ab( j-k+1, k ) -
     $                             conjg( bb( k-i+1, i ) )*
     $                             ab( j-i+1, i )
  760          CONTINUE
  770       CONTINUE
            DO 790 j = i1, i
               DO 780 k = i + 1, min( j+ka, i+kbt )
                  ab( k-j+1, j ) = ab( k-j+1, j ) -
     $                             bb( k-i+1, i )*ab( i-j+1, j )
  780          CONTINUE
  790       CONTINUE
*
            IF( wantx ) THEN
*
*              post-multiply X by inv(S(i))
*
               CALL csscal( nx, one / bii, x( 1, i ), 1 )
               IF( kbt.GT.0 )
     $            CALL cgerc( nx, kbt, -cone, x( 1, i ), 1, bb( 2, i ),
     $                        1, x( 1, i+1 ), ldx )
            END IF
*
*           store a(i,i1) in RA1 for use in next loop over K
*
            ra1 = ab( i-i1+1, i1 )
         END IF
*
*        Generate and apply vectors of rotations to chase all the
*        existing bulges KA positions up toward the top of the band
*
         DO 840 k = 1, kb - 1
            IF( update ) THEN
*
*              Determine the rotations which would annihilate the bulge
*              which has in theory just been created
*
               IF( i+k-ka1.GT.0 .AND. i+k.LT.m ) THEN
*
*                 generate rotation to annihilate a(i,i+k-ka-1)
*
                  CALL clartg( ab( ka1-k, i+k-ka ), ra1,
     $                         rwork( i+k-ka ), work( i+k-ka ), ra )
*
*                 create nonzero element a(i+k,i+k-ka-1) outside the
*                 band and store it in WORK(m-kb+i+k)
*
                  t = -bb( k+1, i )*ra1
                  work( m-kb+i+k ) = rwork( i+k-ka )*t -
     $                               conjg( work( i+k-ka ) )*
     $                               ab( ka1, i+k-ka )
                  ab( ka1, i+k-ka ) = work( i+k-ka )*t +
     $                                rwork( i+k-ka )*ab( ka1, i+k-ka )
                  ra1 = ra
               END IF
            END IF
            j2 = i + k + 1 - max( 1, k+i0-m+1 )*ka1
            nr = ( j2+ka-1 ) / ka1
            j1 = j2 - ( nr-1 )*ka1
            IF( update ) THEN
               j2t = min( j2, i-2*ka+k-1 )
            ELSE
               j2t = j2
            END IF
            nrt = ( j2t+ka-1 ) / ka1
            DO 800 j = j1, j2t, ka1
*
*              create nonzero element a(j+ka,j-1) outside the band
*              and store it in WORK(j)
*
               work( j ) = work( j )*ab( ka1, j-1 )
               ab( ka1, j-1 ) = rwork( j )*ab( ka1, j-1 )
  800       CONTINUE
*
*           generate rotations in 1st set to annihilate elements which
*           have been created outside the band
*
            IF( nrt.GT.0 )
     $         CALL clargv( nrt, ab( ka1, j1 ), inca, work( j1 ), ka1,
     $                      rwork( j1 ), ka1 )
            IF( nr.GT.0 ) THEN
*
*              apply rotations in 1st set from the right
*
               DO 810 l = 1, ka - 1
                  CALL clartv( nr, ab( l+1, j1 ), inca, ab( l+2, j1-1 ),
     $                         inca, rwork( j1 ), work( j1 ), ka1 )
  810          CONTINUE
*
*              apply rotations in 1st set from both sides to diagonal
*              blocks
*
               CALL clar2v( nr, ab( 1, j1 ), ab( 1, j1-1 ),
     $                      ab( 2, j1-1 ), inca, rwork( j1 ),
     $                      work( j1 ), ka1 )
*
               CALL clacgv( nr, work( j1 ), ka1 )
            END IF
*
*           start applying rotations in 1st set from the left
*
            DO 820 l = ka - 1, kb - k + 1, -1
               nrt = ( j2+l-1 ) / ka1
               j1t = j2 - ( nrt-1 )*ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( ka1-l+1, j1t-ka1+l ), inca,
     $                         ab( ka1-l, j1t-ka1+l ), inca,
     $                         rwork( j1t ), work( j1t ), ka1 )
  820       CONTINUE
*
            IF( wantx ) THEN
*
*              post-multiply X by product of rotations in 1st set
*
               DO 830 j = j1, j2, ka1
                  CALL crot( nx, x( 1, j ), 1, x( 1, j-1 ), 1,
     $                       rwork( j ), conjg( work( j ) ) )
  830          CONTINUE
            END IF
  840    CONTINUE
*
         IF( update ) THEN
            IF( i2.GT.0 .AND. kbt.GT.0 ) THEN
*
*              create nonzero element a(i+kbt,i+kbt-ka-1) outside the
*              band and store it in WORK(m-kb+i+kbt)
*
               work( m-kb+i+kbt ) = -bb( kbt+1, i )*ra1
            END IF
         END IF
*
         DO 880 k = kb, 1, -1
            IF( update ) THEN
               j2 = i + k + 1 - max( 2, k+i0-m )*ka1
            ELSE
               j2 = i + k + 1 - max( 1, k+i0-m )*ka1
            END IF
*
*           finish applying rotations in 2nd set from the left
*
            DO 850 l = kb - k, 1, -1
               nrt = ( j2+ka+l-1 ) / ka1
               j1t = j2 - ( nrt-1 )*ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( ka1-l+1, j1t+l-1 ), inca,
     $                         ab( ka1-l, j1t+l-1 ), inca,
     $                         rwork( m-kb+j1t+ka ),
     $                         work( m-kb+j1t+ka ), ka1 )
  850       CONTINUE
            nr = ( j2+ka-1 ) / ka1
            j1 = j2 - ( nr-1 )*ka1
            DO 860 j = j1, j2, ka1
               work( m-kb+j ) = work( m-kb+j+ka )
               rwork( m-kb+j ) = rwork( m-kb+j+ka )
  860       CONTINUE
            DO 870 j = j1, j2, ka1
*
*              create nonzero element a(j+ka,j-1) outside the band
*              and store it in WORK(m-kb+j)
*
               work( m-kb+j ) = work( m-kb+j )*ab( ka1, j-1 )
               ab( ka1, j-1 ) = rwork( m-kb+j )*ab( ka1, j-1 )
  870       CONTINUE
            IF( update ) THEN
               IF( i+k.GT.ka1 .AND. k.LE.kbt )
     $            work( m-kb+i+k-ka ) = work( m-kb+i+k )
            END IF
  880    CONTINUE
*
         DO 920 k = kb, 1, -1
            j2 = i + k + 1 - max( 1, k+i0-m )*ka1
            nr = ( j2+ka-1 ) / ka1
            j1 = j2 - ( nr-1 )*ka1
            IF( nr.GT.0 ) THEN
*
*              generate rotations in 2nd set to annihilate elements
*              which have been created outside the band
*
               CALL clargv( nr, ab( ka1, j1 ), inca, work( m-kb+j1 ),
     $                      ka1, rwork( m-kb+j1 ), ka1 )
*
*              apply rotations in 2nd set from the right
*
               DO 890 l = 1, ka - 1
                  CALL clartv( nr, ab( l+1, j1 ), inca, ab( l+2, j1-1 ),
     $                         inca, rwork( m-kb+j1 ), work( m-kb+j1 ),
     $                         ka1 )
  890          CONTINUE
*
*              apply rotations in 2nd set from both sides to diagonal
*              blocks
*
               CALL clar2v( nr, ab( 1, j1 ), ab( 1, j1-1 ),
     $                      ab( 2, j1-1 ), inca, rwork( m-kb+j1 ),
     $                      work( m-kb+j1 ), ka1 )
*
               CALL clacgv( nr, work( m-kb+j1 ), ka1 )
            END IF
*
*           start applying rotations in 2nd set from the left
*
            DO 900 l = ka - 1, kb - k + 1, -1
               nrt = ( j2+l-1 ) / ka1
               j1t = j2 - ( nrt-1 )*ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( ka1-l+1, j1t-ka1+l ), inca,
     $                         ab( ka1-l, j1t-ka1+l ), inca,
     $                         rwork( m-kb+j1t ), work( m-kb+j1t ),
     $                         ka1 )
  900       CONTINUE
*
            IF( wantx ) THEN
*
*              post-multiply X by product of rotations in 2nd set
*
               DO 910 j = j1, j2, ka1
                  CALL crot( nx, x( 1, j ), 1, x( 1, j-1 ), 1,
     $                       rwork( m-kb+j ), conjg( work( m-kb+j ) ) )
  910          CONTINUE
            END IF
  920    CONTINUE
*
         DO 940 k = 1, kb - 1
            j2 = i + k + 1 - max( 1, k+i0-m+1 )*ka1
*
*           finish applying rotations in 1st set from the left
*
            DO 930 l = kb - k, 1, -1
               nrt = ( j2+l-1 ) / ka1
               j1t = j2 - ( nrt-1 )*ka1
               IF( nrt.GT.0 )
     $            CALL clartv( nrt, ab( ka1-l+1, j1t-ka1+l ), inca,
     $                         ab( ka1-l, j1t-ka1+l ), inca,
     $                         rwork( j1t ), work( j1t ), ka1 )
  930       CONTINUE
  940    CONTINUE
*
         IF( kb.GT.1 ) THEN
            DO 950 j = 2, i2 - ka
               rwork( j ) = rwork( j+ka )
               work( j ) = work( j+ka )
  950       CONTINUE
         END IF
*
      END IF
*
      GO TO 490
*
*     End of CHBGST
*

◆ chbtrd()

subroutine chbtrd	(	character	vect,
		character	uplo,
		integer	n,
		integer	kd,
		complex, dimension( ldab, * )	ab,
		integer	ldab,
		real, dimension( * )	d,
		real, dimension( * )	e,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		complex, dimension( * )	work,
		integer	info )

CHBTRD

Download CHBTRD + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CHBTRD reduces a complex Hermitian band matrix A to real symmetric
!> tridiagonal form T by a unitary similarity transformation:
!> Q**H * A * Q = T.
!>

Parameters

[in]	VECT	!> VECT is CHARACTER*1 !> = 'N': do not form Q; !> = 'V': form Q; !> = 'U': update a matrix X, by forming X*Q. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of superdiagonals of the matrix A if UPLO = 'U', !> or the number of subdiagonals if UPLO = 'L'. KD >= 0. !>
[in,out]	AB	!> AB is COMPLEX array, dimension (LDAB,N) !> On entry, the upper or lower triangle of the Hermitian band !> matrix A, stored in the first KD+1 rows of the array. The !> j-th column of A is stored in the j-th column of the array AB !> as follows: !> if UPLO = 'U', AB(kd+1+i-j,j) = A(i,j) for max(1,j-kd)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+kd). !> On exit, the diagonal elements of AB are overwritten by the !> diagonal elements of the tridiagonal matrix T; if KD > 0, the !> elements on the first superdiagonal (if UPLO = 'U') or the !> first subdiagonal (if UPLO = 'L') are overwritten by the !> off-diagonal elements of T; the rest of AB is overwritten by !> values generated during the reduction. !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[out]	D	!> D is REAL array, dimension (N) !> The diagonal elements of the tridiagonal matrix T. !>
[out]	E	!> E is REAL array, dimension (N-1) !> The off-diagonal elements of the tridiagonal matrix T: !> E(i) = T(i,i+1) if UPLO = 'U'; E(i) = T(i+1,i) if UPLO = 'L'. !>
[in,out]	Q	!> Q is COMPLEX array, dimension (LDQ,N) !> On entry, if VECT = 'U', then Q must contain an N-by-N !> matrix X; if VECT = 'N' or 'V', then Q need not be set. !> !> On exit: !> if VECT = 'V', Q contains the N-by-N unitary matrix Q; !> if VECT = 'U', Q contains the product X*Q; !> if VECT = 'N', the array Q is not referenced. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. !> LDQ >= 1, and LDQ >= N if VECT = 'V' or 'U'. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  Modified by Linda Kaufman, Bell Labs.
!>

Definition at line 161 of file chbtrd.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Summary of the body below:
*     The Hermitian band matrix held in AB is reduced to real
*     symmetric tridiagonal form with plane rotations.  On return the
*     diagonal is in D and the off-diagonal in E.  When VECT = 'V' or
*     'U' the same rotations are accumulated into Q.
*
*     INFO = 0 on success.  INFO = -i means the i-th argument failed
*     its check; XERBLA is called and the routine returns at once.
*
*     During the reduction D and WORK are used as scratch storage for
*     the cosines and sines of the rotations; D is only filled with
*     the diagonal of T at the very end.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO, VECT
      INTEGER            INFO, KD, LDAB, LDQ, N
*     ..
*     .. Array Arguments ..
      REAL               D( * ), E( * )
      COMPLEX            AB( LDAB, * ), Q( LDQ, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO
      parameter( zero = 0.0e+0 )
      COMPLEX            CZERO, CONE
      parameter( czero = ( 0.0e+0, 0.0e+0 ),
     $                   cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            INITQ, UPPER, WANTQ
      INTEGER            I, I2, IBL, INCA, INCX, IQAEND, IQB, IQEND, J,
     $                   J1, J1END, J1INC, J2, JEND, JIN, JINC, K, KD1,
     $                   KDM1, KDN, L, LAST, LEND, NQ, NR, NRT
      REAL               ABST
      COMPLEX            T, TEMP
*     ..
*     .. External Subroutines ..
      EXTERNAL           clacgv, clar2v, clargv, clartg, clartv, claset,
     $                   crot, cscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, conjg, max, min, real
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters
*
*     INITQ: Q is to be initialised to the identity (VECT = 'V').
*     WANTQ: rotations are accumulated in Q (VECT = 'V' or 'U').
*
      initq = lsame( vect, 'V' )
      wantq = initq .OR. lsame( vect, 'U' )
      upper = lsame( uplo, 'U' )
      kd1 = kd + 1
      kdm1 = kd - 1
*
*     INCX = LDAB-1 is the element stride that moves one column to the
*     right and one row up inside AB.
*
      incx = ldab - 1
*
*     IQEND tracks the largest J2 seen so far; it bounds the rows of Q
*     that are touched when INITQ is true.
*
      iqend = 1
*
*     The negative INFO values are the positions of the offending
*     arguments in the argument list (LDAB is 6th, LDQ is 10th).
*
      info = 0
      IF( .NOT.wantq .AND. .NOT.lsame( vect, 'N' ) ) THEN
         info = -1
      ELSE IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( kd.LT.0 ) THEN
         info = -4
      ELSE IF( ldab.LT.kd1 ) THEN
         info = -6
      ELSE IF( ldq.LT.max( 1, n ) .AND. wantq ) THEN
         info = -10
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CHBTRD', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Initialize Q to the unit matrix, if needed
*
      IF( initq )
     $   CALL claset( 'Full', n, n, czero, cone, q, ldq )
*
*     Wherever possible, plane rotations are generated and applied in
*     vector operations of length NR over the index set J1:J2:KD1.
*
*     The real cosines and complex sines of the plane rotations are
*     stored in the arrays D and WORK.
*
*     INCA is the element stride between entries that sit KD1 columns
*     apart in the same row of AB.  KDN is KD clipped to N-1.
*
      inca = kd1*ldab
      kdn = min( n-1, kd )
      IF( upper ) THEN
*
*        With KD <= 1 the band is already tridiagonal (or diagonal),
*        so the rotation sweep is skipped.
*
         IF( kd.GT.1 ) THEN
*
*           Reduce to complex Hermitian tridiagonal form, working with
*           the upper triangle
*
            nr = 0
            j1 = kdn + 2
            j2 = 1
*
*           drop any imaginary part of the first diagonal element
*
            ab( kd1, 1 ) = real( ab( kd1, 1 ) )
            DO 90 i = 1, n - 2
*
*              Reduce i-th row of matrix to tridiagonal form
*
               DO 80 k = kdn + 1, 2, -1
                  j1 = j1 + kdn
                  j2 = j2 + kdn
*
                  IF( nr.GT.0 ) THEN
*
*                    generate plane rotations to annihilate nonzero
*                    elements which have been created outside the band
*
                     CALL clargv( nr, ab( 1, j1-1 ), inca, work( j1 ),
     $                            kd1, d( j1 ), kd1 )
*
*                    apply rotations from the right
*
*
*                    Dependent on the number of diagonals either
*                    CLARTV or CROT is used
*
                     IF( nr.GE.2*kd-1 ) THEN
                        DO 10 l = 1, kd - 1
                           CALL clartv( nr, ab( l+1, j1-1 ), inca,
     $                                  ab( l, j1 ), inca, d( j1 ),
     $                                  work( j1 ), kd1 )
   10                   CONTINUE
*
                     ELSE
                        jend = j1 + ( nr-1 )*kd1
                        DO 20 jinc = j1, jend, kd1
                           CALL crot( kdm1, ab( 2, jinc-1 ), 1,
     $                                ab( 1, jinc ), 1, d( jinc ),
     $                                work( jinc ) )
   20                   CONTINUE
                     END IF
                  END IF
*
*
                  IF( k.GT.2 ) THEN
                     IF( k.LE.n-i+1 ) THEN
*
*                       generate plane rotation to annihilate a(i,i+k-1)
*                       within the band
*
                        CALL clartg( ab( kd-k+3, i+k-2 ),
     $                               ab( kd-k+2, i+k-1 ), d( i+k-1 ),
     $                               work( i+k-1 ), temp )
                        ab( kd-k+3, i+k-2 ) = temp
*
*                       apply rotation from the right
*
                        CALL crot( k-3, ab( kd-k+4, i+k-2 ), 1,
     $                             ab( kd-k+3, i+k-1 ), 1, d( i+k-1 ),
     $                             work( i+k-1 ) )
                     END IF
*
*                    one more rotation joins the set; J1 moves back
*                    to include it
*
                     nr = nr + 1
                     j1 = j1 - kdn - 1
                  END IF
*
*                 apply plane rotations from both sides to diagonal
*                 blocks
*
                  IF( nr.GT.0 )
     $               CALL clar2v( nr, ab( kd1, j1-1 ), ab( kd1, j1 ),
     $                            ab( kd, j1 ), inca, d( j1 ),
     $                            work( j1 ), kd1 )
*
*                 apply plane rotations from the left
*
                  IF( nr.GT.0 ) THEN
*
*                    the stored sines are conjugated in place before
*                    the rotations are applied from the left
*
                     CALL clacgv( nr, work( j1 ), kd1 )
                     IF( 2*kd-1.LT.nr ) THEN
*
*                    Dependent on the number of diagonals either
*                    CLARTV or CROT is used
*
                        DO 30 l = 1, kd - 1
                           IF( j2+l.GT.n ) THEN
                              nrt = nr - 1
                           ELSE
                              nrt = nr
                           END IF
                           IF( nrt.GT.0 )
     $                        CALL clartv( nrt, ab( kd-l, j1+l ), inca,
     $                                     ab( kd-l+1, j1+l ), inca,
     $                                     d( j1 ), work( j1 ), kd1 )
   30                   CONTINUE
                     ELSE
*
*                       all rotations but the last act on KD-1
*                       elements; the last one acts on LEND elements,
*                       LEND = min( KD-1, N-J2 )
*
                        j1end = j1 + kd1*( nr-2 )
                        IF( j1end.GE.j1 ) THEN
                           DO 40 jin = j1, j1end, kd1
                              CALL crot( kd-1, ab( kd-1, jin+1 ), incx,
     $                                   ab( kd, jin+1 ), incx,
     $                                   d( jin ), work( jin ) )
   40                      CONTINUE
                        END IF
                        lend = min( kdm1, n-j2 )
                        last = j1end + kd1
                        IF( lend.GT.0 )
     $                     CALL crot( lend, ab( kd-1, last+1 ), incx,
     $                                ab( kd, last+1 ), incx, d( last ),
     $                                work( last ) )
                     END IF
                  END IF
*
                  IF( wantq ) THEN
*
*                    accumulate product of plane rotations in Q
*
                     IF( initq ) THEN
*
*                 take advantage of the fact that Q was
*                 initially the Identity matrix
*
*                 Only rows IQB:IQAEND (NQ rows) of columns J-1 and J
*                 are rotated instead of all N rows.
*
                        iqend = max( iqend, j2 )
                        i2 = max( 0, k-3 )
                        iqaend = 1 + i*kd
                        IF( k.EQ.2 )
     $                     iqaend = iqaend + kd
                        iqaend = min( iqaend, iqend )
                        DO 50 j = j1, j2, kd1
                           ibl = i - i2 / kdm1
                           i2 = i2 + 1
                           iqb = max( 1, j-ibl )
                           nq = 1 + iqaend - iqb
                           iqaend = min( iqaend+kd, iqend )
                           CALL crot( nq, q( iqb, j-1 ), 1, q( iqb, j ),
     $                                1, d( j ), conjg( work( j ) ) )
   50                   CONTINUE
                     ELSE
*
*                       Q held a general matrix on entry, so every
*                       rotation is applied to all N rows
*
                        DO 60 j = j1, j2, kd1
                           CALL crot( n, q( 1, j-1 ), 1, q( 1, j ), 1,
     $                                d( j ), conjg( work( j ) ) )
   60                   CONTINUE
                     END IF
*
                  END IF
*
                  IF( j2+kdn.GT.n ) THEN
*
*                    adjust J2 to keep within the bounds of the matrix
*
                     nr = nr - 1
                     j2 = j2 - kdn - 1
                  END IF
*
                  DO 70 j = j1, j2, kd1
*
*                    create nonzero element a(j-1,j+kd) outside the band
*                    and store it in WORK
*
                     work( j+kd ) = work( j )*ab( 1, j+kd )
                     ab( 1, j+kd ) = d( j )*ab( 1, j+kd )
   70             CONTINUE
   80          CONTINUE
   90       CONTINUE
         END IF
*
         IF( kd.GT.0 ) THEN
*
*           make off-diagonal elements real and copy them to E
*
*           T is replaced by its unit-modulus phase T/|T| (or 1 when
*           the element is zero).  The next off-diagonal element is
*           multiplied by that phase and, if Q is wanted, column I+1
*           of Q is scaled by CONJG( T ).
*
            DO 100 i = 1, n - 1
               t = ab( kd, i+1 )
               abst = abs( t )
               ab( kd, i+1 ) = abst
               e( i ) = abst
               IF( abst.NE.zero ) THEN
                  t = t / abst
               ELSE
                  t = cone
               END IF
               IF( i.LT.n-1 )
     $            ab( kd, i+2 ) = ab( kd, i+2 )*t
               IF( wantq ) THEN
                  CALL cscal( n, conjg( t ), q( 1, i+1 ), 1 )
               END IF
  100       CONTINUE
         ELSE
*
*           set E to zero if original matrix was diagonal
*
            DO 110 i = 1, n - 1
               e( i ) = zero
  110       CONTINUE
         END IF
*
*        copy diagonal elements to D
*
*        (this overwrites the cosines that D held during the sweep)
*
         DO 120 i = 1, n
            d( i ) = real( ab( kd1, i ) )
  120    CONTINUE
*
      ELSE
*
*        With KD <= 1 the band is already tridiagonal (or diagonal),
*        so the rotation sweep is skipped.
*
         IF( kd.GT.1 ) THEN
*
*           Reduce to complex Hermitian tridiagonal form, working with
*           the lower triangle
*
            nr = 0
            j1 = kdn + 2
            j2 = 1
*
*           drop any imaginary part of the first diagonal element
*
            ab( 1, 1 ) = real( ab( 1, 1 ) )
            DO 210 i = 1, n - 2
*
*              Reduce i-th column of matrix to tridiagonal form
*
               DO 200 k = kdn + 1, 2, -1
                  j1 = j1 + kdn
                  j2 = j2 + kdn
*
                  IF( nr.GT.0 ) THEN
*
*                    generate plane rotations to annihilate nonzero
*                    elements which have been created outside the band
*
                     CALL clargv( nr, ab( kd1, j1-kd1 ), inca,
     $                            work( j1 ), kd1, d( j1 ), kd1 )
*
*                    apply plane rotations from one side
*
*
*                    Dependent on the number of diagonals either
*                    CLARTV or CROT is used
*
                     IF( nr.GT.2*kd-1 ) THEN
                        DO 130 l = 1, kd - 1
                           CALL clartv( nr, ab( kd1-l, j1-kd1+l ), inca,
     $                                  ab( kd1-l+1, j1-kd1+l ), inca,
     $                                  d( j1 ), work( j1 ), kd1 )
  130                   CONTINUE
                     ELSE
                        jend = j1 + kd1*( nr-1 )
                        DO 140 jinc = j1, jend, kd1
                           CALL crot( kdm1, ab( kd, jinc-kd ), incx,
     $                                ab( kd1, jinc-kd ), incx,
     $                                d( jinc ), work( jinc ) )
  140                   CONTINUE
                     END IF
*
                  END IF
*
                  IF( k.GT.2 ) THEN
                     IF( k.LE.n-i+1 ) THEN
*
*                       generate plane rotation to annihilate a(i+k-1,i)
*                       within the band
*
                        CALL clartg( ab( k-1, i ), ab( k, i ),
     $                               d( i+k-1 ), work( i+k-1 ), temp )
                        ab( k-1, i ) = temp
*
*                       apply rotation from the left
*
                        CALL crot( k-3, ab( k-2, i+1 ), ldab-1,
     $                             ab( k-1, i+1 ), ldab-1, d( i+k-1 ),
     $                             work( i+k-1 ) )
                     END IF
*
*                    one more rotation joins the set; J1 moves back
*                    to include it
*
                     nr = nr + 1
                     j1 = j1 - kdn - 1
                  END IF
*
*                 apply plane rotations from both sides to diagonal
*                 blocks
*
                  IF( nr.GT.0 )
     $               CALL clar2v( nr, ab( 1, j1-1 ), ab( 1, j1 ),
     $                            ab( 2, j1-1 ), inca, d( j1 ),
     $                            work( j1 ), kd1 )
*
*                 apply plane rotations from the right
*
*
*                    Dependent on the number of diagonals either
*                    CLARTV or CROT is used
*
                  IF( nr.GT.0 ) THEN
*
*                    the stored sines are conjugated in place before
*                    the rotations are applied from the right
*
                     CALL clacgv( nr, work( j1 ), kd1 )
                     IF( nr.GT.2*kd-1 ) THEN
                        DO 150 l = 1, kd - 1
                           IF( j2+l.GT.n ) THEN
                              nrt = nr - 1
                           ELSE
                              nrt = nr
                           END IF
                           IF( nrt.GT.0 )
     $                        CALL clartv( nrt, ab( l+2, j1-1 ), inca,
     $                                     ab( l+1, j1 ), inca, d( j1 ),
     $                                     work( j1 ), kd1 )
  150                   CONTINUE
                     ELSE
*
*                       all rotations but the last act on KD-1
*                       elements; the last one acts on LEND elements,
*                       LEND = min( KD-1, N-J2 )
*
                        j1end = j1 + kd1*( nr-2 )
                        IF( j1end.GE.j1 ) THEN
                           DO 160 j1inc = j1, j1end, kd1
                              CALL crot( kdm1, ab( 3, j1inc-1 ), 1,
     $                                   ab( 2, j1inc ), 1, d( j1inc ),
     $                                   work( j1inc ) )
  160                      CONTINUE
                        END IF
                        lend = min( kdm1, n-j2 )
                        last = j1end + kd1
                        IF( lend.GT.0 )
     $                     CALL crot( lend, ab( 3, last-1 ), 1,
     $                                ab( 2, last ), 1, d( last ),
     $                                work( last ) )
                     END IF
                  END IF
*
*
*
                  IF( wantq ) THEN
*
*                    accumulate product of plane rotations in Q
*
*                    (here the sines in WORK are passed to CROT as
*                    stored; the upper-triangle branch passes their
*                    conjugates)
*
                     IF( initq ) THEN
*
*                 take advantage of the fact that Q was
*                 initially the Identity matrix
*
*                 Only rows IQB:IQAEND (NQ rows) of columns J-1 and J
*                 are rotated instead of all N rows.
*
                        iqend = max( iqend, j2 )
                        i2 = max( 0, k-3 )
                        iqaend = 1 + i*kd
                        IF( k.EQ.2 )
     $                     iqaend = iqaend + kd
                        iqaend = min( iqaend, iqend )
                        DO 170 j = j1, j2, kd1
                           ibl = i - i2 / kdm1
                           i2 = i2 + 1
                           iqb = max( 1, j-ibl )
                           nq = 1 + iqaend - iqb
                           iqaend = min( iqaend+kd, iqend )
                           CALL crot( nq, q( iqb, j-1 ), 1, q( iqb, j ),
     $                                1, d( j ), work( j ) )
  170                   CONTINUE
                     ELSE
*
*                       Q held a general matrix on entry, so every
*                       rotation is applied to all N rows
*
                        DO 180 j = j1, j2, kd1
                           CALL crot( n, q( 1, j-1 ), 1, q( 1, j ), 1,
     $                                d( j ), work( j ) )
  180                   CONTINUE
                     END IF
                  END IF
*
                  IF( j2+kdn.GT.n ) THEN
*
*                    adjust J2 to keep within the bounds of the matrix
*
                     nr = nr - 1
                     j2 = j2 - kdn - 1
                  END IF
*
                  DO 190 j = j1, j2, kd1
*
*                    create nonzero element a(j+kd,j-1) outside the
*                    band and store it in WORK
*
                     work( j+kd ) = work( j )*ab( kd1, j )
                     ab( kd1, j ) = d( j )*ab( kd1, j )
  190             CONTINUE
  200          CONTINUE
  210       CONTINUE
         END IF
*
         IF( kd.GT.0 ) THEN
*
*           make off-diagonal elements real and copy them to E
*
*           T is replaced by its unit-modulus phase T/|T| (or 1 when
*           the element is zero).  The next off-diagonal element is
*           multiplied by that phase and, if Q is wanted, column I+1
*           of Q is scaled by T.
*
            DO 220 i = 1, n - 1
               t = ab( 2, i )
               abst = abs( t )
               ab( 2, i ) = abst
               e( i ) = abst
               IF( abst.NE.zero ) THEN
                  t = t / abst
               ELSE
                  t = cone
               END IF
               IF( i.LT.n-1 )
     $            ab( 2, i+1 ) = ab( 2, i+1 )*t
               IF( wantq ) THEN
                  CALL cscal( n, t, q( 1, i+1 ), 1 )
               END IF
  220       CONTINUE
         ELSE
*
*           set E to zero if original matrix was diagonal
*
            DO 230 i = 1, n - 1
               e( i ) = zero
  230       CONTINUE
         END IF
*
*        copy diagonal elements to D
*
*        (this overwrites the cosines that D held during the sweep)
*
         DO 240 i = 1, n
            d( i ) = real( ab( 1, i ) )
  240    CONTINUE
      END IF
*
      RETURN
*
*     End of CHBTRD
*

◆ chetrd_hb2st()

subroutine chetrd_hb2st	(	character	stage1,
		character	vect,
		character	uplo,
		integer	n,
		integer	kd,
		complex, dimension( ldab, * )	ab,
		integer	ldab,
		real, dimension( * )	d,
		real, dimension( * )	e,
		complex, dimension( * )	hous,
		integer	lhous,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CHETRD_HB2ST reduces a complex Hermitian band matrix A to real symmetric tridiagonal form T

Download CHETRD_HB2ST + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CHETRD_HB2ST reduces a complex Hermitian band matrix A to real symmetric
!> tridiagonal form T by a unitary similarity transformation:
!> Q**H * A * Q = T.
!>

Parameters

[in]	STAGE1	!> STAGE1 is CHARACTER*1 !> = 'N': "No": indicates that stage 1 of the reduction !> from dense to band using the chetrd_he2hb routine !> was not called before this routine to produce AB. !> In other words, this routine is called standalone. !> = 'Y': "Yes": indicates that stage 1 of the !> reduction from dense to band using the chetrd_he2hb !> routine has been called to produce AB (e.g., AB is !> the output of chetrd_he2hb). !>
[in]	VECT	!> VECT is CHARACTER*1 !> = 'N': No need for the Householder representation, !> and thus LHOUS is of size max(1, 4*N); !> = 'V': the Householder representation is needed to !> either generate or to apply Q later on, !> then LHOUS is to be queried and computed. !> (NOT AVAILABLE IN THIS RELEASE). !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of superdiagonals of the matrix A if UPLO = 'U', !> or the number of subdiagonals if UPLO = 'L'. KD >= 0. !>
[in,out]	AB	!> AB is COMPLEX array, dimension (LDAB,N) !> On entry, the upper or lower triangle of the Hermitian band !> matrix A, stored in the first KD+1 rows of the array. The !> j-th column of A is stored in the j-th column of the array AB !> as follows: !> if UPLO = 'U', AB(kd+1+i-j,j) = A(i,j) for max(1,j-kd)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+kd). !> On exit, the diagonal elements of AB are overwritten by the !> diagonal elements of the tridiagonal matrix T; if KD > 0, the !> elements on the first superdiagonal (if UPLO = 'U') or the !> first subdiagonal (if UPLO = 'L') are overwritten by the !> off-diagonal elements of T; the rest of AB is overwritten by !> values generated during the reduction. !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[out]	D	!> D is REAL array, dimension (N) !> The diagonal elements of the tridiagonal matrix T. !>
[out]	E	!> E is REAL array, dimension (N-1) !> The off-diagonal elements of the tridiagonal matrix T: !> E(i) = T(i,i+1) if UPLO = 'U'; E(i) = T(i+1,i) if UPLO = 'L'. !>
[out]	HOUS	!> HOUS is COMPLEX array, dimension LHOUS, that !> store the Householder representation. !>
[in]	LHOUS	!> LHOUS is INTEGER !> The dimension of the array HOUS. LHOUS = MAX(1, dimension) !> If LWORK = -1, or LHOUS=-1, !> then a query is assumed; the routine !> only calculates the optimal size of the HOUS array, returns !> this value as the first entry of the HOUS array, and no error !> message related to LHOUS is issued by XERBLA. !> LHOUS = MAX(1, dimension) where !> dimension = 4*N if VECT='N' !> not available now if VECT='V' !>
[out]	WORK	!> WORK is COMPLEX array, dimension LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK = MAX(1, dimension) !> If LWORK = -1, or LHOUS=-1, !> then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !> LWORK = MAX(1, dimension) where !> dimension = (2KD+1)*N + KD*NTHREADS !> where KD is the blocking size of the reduction, !> FACTOPTNB is the blocking used by the QR or LQ !> algorithm, usually FACTOPTNB=128 is a good choice !> NTHREADS is the number of threads used when !> openMP compilation is enabled, otherwise =1. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  Implemented by Azzam Haidar.
!>
!>  All details are available on technical report, SC11, SC13 papers.
!>
!>  Azzam Haidar, Hatem Ltaief, and Jack Dongarra.
!>  Parallel reduction to condensed forms for symmetric eigenvalue problems
!>  using aggregated fine-grained and memory-aware kernels. In Proceedings
!>  of 2011 International Conference for High Performance Computing,
!>  Networking, Storage and Analysis (SC '11), New York, NY, USA,
!>  Article 8 , 11 pages.
!>  http://doi.acm.org/10.1145/2063384.2063394
!>
!>  A. Haidar, J. Kurzak, P. Luszczek, 2013.
!>  An improved parallel singular value algorithm and its implementation 
!>  for multicore hardware, In Proceedings of 2013 International Conference
!>  for High Performance Computing, Networking, Storage and Analysis (SC '13).
!>  Denver, Colorado, USA, 2013.
!>  Article 90, 12 pages.
!>  http://doi.acm.org/10.1145/2503210.2503292
!>
!>  A. Haidar, R. Solca, S. Tomov, T. Schulthess and J. Dongarra.
!>  A novel hybrid CPU-GPU generalized eigensolver for electronic structure 
!>  calculations based on fine-grained memory aware tasks.
!>  International Journal of High Performance Computing Applications.
!>  Volume 28 Issue 2, Pages 196-209, May 2014.
!>  http://hpc.sagepub.com/content/28/2/196 
!>
!>

Definition at line 228 of file chetrd_hb2st.F.

*
*
#if defined(_OPENMP)
      use omp_lib
#endif
*
      IMPLICIT NONE
*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          STAGE1, UPLO, VECT
      INTEGER            N, KD, LDAB, LHOUS, LWORK, INFO
*     ..
*     .. Array Arguments ..
      REAL               D( * ), E( * )
      COMPLEX            AB( LDAB, * ), HOUS( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               RZERO
      COMPLEX            ZERO, ONE
      parameter( rzero = 0.0e+0,
     $                   zero = ( 0.0e+0, 0.0e+0 ),
     $                   one  = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LQUERY, WANTQ, UPPER, AFTERS1
      INTEGER            I, M, K, IB, SWEEPID, MYID, SHIFT, STT, ST, 
     $                   ED, STIND, EDIND, BLKLASTIND, COLPT, THED,
     $                   STEPERCOL, GRSIZ, THGRSIZ, THGRNB, THGRID,
     $                   NBTILES, TTYPE, TID, NTHREADS, DEBUG,
     $                   ABDPOS, ABOFDPOS, DPOS, OFDPOS, AWPOS, 
     $                   INDA, INDW, APOS, SIZEA, LDA, INDV, INDTAU,
     $                   SICEV, SIZETAU, LDV, LHMIN, LWMIN
      REAL               ABSTMP
      COMPLEX            TMP
*     ..
*     .. External Subroutines ..
      EXTERNAL           chb2st_kernels, clacpy, claset, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          min, max, ceiling, real
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV2STAGE 
      EXTERNAL           lsame, ilaenv2stage
*     ..
*     .. Executable Statements ..
*
*     Determine the minimal workspace size required.
*     Test the input parameters
*
      debug   = 0
      info    = 0
      afters1 = lsame( stage1, 'Y' )
      wantq   = lsame( vect, 'V' )
      upper   = lsame( uplo, 'U' )
      lquery  = ( lwork.EQ.-1 ) .OR. ( lhous.EQ.-1 )
*
*     Determine the block size, the workspace size and the hous size.
*
      ib     = ilaenv2stage( 2, 'CHETRD_HB2ST', vect, n, kd, -1, -1 )
      lhmin  = ilaenv2stage( 3, 'CHETRD_HB2ST', vect, n, kd, ib, -1 )
      lwmin  = ilaenv2stage( 4, 'CHETRD_HB2ST', vect, n, kd, ib, -1 )
*
      IF( .NOT.afters1 .AND. .NOT.lsame( stage1, 'N' ) ) THEN
         info = -1
      ELSE IF( .NOT.lsame( vect, 'N' ) ) THEN
         info = -2
      ELSE IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( kd.LT.0 ) THEN
         info = -5
      ELSE IF( ldab.LT.(kd+1) ) THEN
         info = -7
      ELSE IF( lhous.LT.lhmin .AND. .NOT.lquery ) THEN
         info = -11
      ELSE IF( lwork.LT.lwmin .AND. .NOT.lquery ) THEN
         info = -13
      END IF
*
      IF( info.EQ.0 ) THEN
         hous( 1 ) = lhmin
         work( 1 ) = lwmin
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CHETRD_HB2ST', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 ) THEN
          hous( 1 ) = 1
          work( 1 ) = 1
          RETURN
      END IF
*
*     Determine pointer position
*
      ldv      = kd + ib
      sizetau  = 2 * n
      sicev    = 2 * n
      indtau   = 1
      indv     = indtau + sizetau
      lda      = 2 * kd + 1
      sizea    = lda * n
      inda     = 1
      indw     = inda + sizea
      nthreads = 1
      tid      = 0
*
      IF( upper ) THEN
          apos     = inda + kd
          awpos    = inda
          dpos     = apos + kd
          ofdpos   = dpos - 1
          abdpos   = kd + 1
          abofdpos = kd
      ELSE
          apos     = inda 
          awpos    = inda + kd + 1
          dpos     = apos
          ofdpos   = dpos + 1
          abdpos   = 1
          abofdpos = 2
 
      ENDIF
*      
*     Case KD=0: 
*     The matrix is diagonal. We just copy it (convert to "real" for 
*     complex because D is double and the imaginary part should be 0) 
*     and store it in D. A sequential code here is better or 
*     in a parallel environment it might need two cores for D and E
*
      IF( kd.EQ.0 ) THEN
          DO 30 i = 1, n
              d( i ) = real( ab( abdpos, i ) )
   30     CONTINUE
          DO 40 i = 1, n-1
              e( i ) = rzero
   40     CONTINUE
*
          hous( 1 ) = 1
          work( 1 ) = 1
          RETURN
      END IF
*      
*     Case KD=1: 
*     The matrix is already Tridiagonal. We have to make diagonal 
*     and offdiagonal elements real, and store them in D and E.
*     For that, for real precision just copy the diag and offdiag 
*     to D and E while for the COMPLEX case the bulge chasing is  
*     performed to convert the hermetian tridiagonal to symmetric 
*     tridiagonal. A simpler conversion formula might be used, but then 
*     updating the Q matrix will be required and based if Q is generated
*     or not this might complicate the story. 
*      
      IF( kd.EQ.1 ) THEN
          DO 50 i = 1, n
              d( i ) = real( ab( abdpos, i ) )
   50     CONTINUE
*
*         make off-diagonal elements real and copy them to E
*
          IF( upper ) THEN
              DO 60 i = 1, n - 1
                  tmp = ab( abofdpos, i+1 )
                  abstmp = abs( tmp )
                  ab( abofdpos, i+1 ) = abstmp
                  e( i ) = abstmp
                  IF( abstmp.NE.rzero ) THEN
                     tmp = tmp / abstmp
                  ELSE
                     tmp = one
                  END IF
                  IF( i.LT.n-1 )
     $               ab( abofdpos, i+2 ) = ab( abofdpos, i+2 )*tmp
C                  IF( WANTZ ) THEN
C                     CALL CSCAL( N, CONJG( TMP ), Q( 1, I+1 ), 1 )
C                  END IF
   60         CONTINUE
          ELSE
              DO 70 i = 1, n - 1
                 tmp = ab( abofdpos, i )
                 abstmp = abs( tmp )
                 ab( abofdpos, i ) = abstmp
                 e( i ) = abstmp
                 IF( abstmp.NE.rzero ) THEN
                    tmp = tmp / abstmp
                 ELSE
                    tmp = one
                 END IF
                 IF( i.LT.n-1 )
     $              ab( abofdpos, i+1 ) = ab( abofdpos, i+1 )*tmp
C                 IF( WANTQ ) THEN
C                    CALL CSCAL( N, TMP, Q( 1, I+1 ), 1 )
C                 END IF
   70         CONTINUE
          ENDIF
*
          hous( 1 ) = 1
          work( 1 ) = 1
          RETURN
      END IF
*
*     Main code start here. 
*     Reduce the hermitian band of A to a tridiagonal matrix.
*
      thgrsiz   = n
      grsiz     = 1
      shift     = 3
      nbtiles   = ceiling( real(n)/real(kd) )
      stepercol = ceiling( real(shift)/real(grsiz) )
      thgrnb    = ceiling( real(n-1)/real(thgrsiz) )
*      
      CALL clacpy( "A", kd+1, n, ab, ldab, work( apos ), lda )
      CALL claset( "A", kd,   n, zero, zero, work( awpos ), lda )
*
*
*     openMP parallelisation start here
*
#if defined(_OPENMP)
!$OMP PARALLEL PRIVATE( TID, THGRID, BLKLASTIND )
!$OMP$         PRIVATE( THED, I, M, K, ST, ED, STT, SWEEPID ) 
!$OMP$         PRIVATE( MYID, TTYPE, COLPT, STIND, EDIND )
!$OMP$         SHARED ( UPLO, WANTQ, INDV, INDTAU, HOUS, WORK)
!$OMP$         SHARED ( N, KD, IB, NBTILES, LDA, LDV, INDA )
!$OMP$         SHARED ( STEPERCOL, THGRNB, THGRSIZ, GRSIZ, SHIFT )
!$OMP MASTER
#endif
*
*     main bulge chasing loop
*      
      DO 100 thgrid = 1, thgrnb
          stt  = (thgrid-1)*thgrsiz+1
          thed = min( (stt + thgrsiz -1), (n-1))
          DO 110 i = stt, n-1
              ed = min( i, thed )
              IF( stt.GT.ed ) EXIT
              DO 120 m = 1, stepercol
                  st = stt
                  DO 130 sweepid = st, ed
                      DO 140 k = 1, grsiz
                          myid  = (i-sweepid)*(stepercol*grsiz) 
     $                           + (m-1)*grsiz + k
                          IF ( myid.EQ.1 ) THEN
                              ttype = 1
                          ELSE
                              ttype = mod( myid, 2 ) + 2
                          ENDIF
 
                          IF( ttype.EQ.2 ) THEN
                              colpt      = (myid/2)*kd + sweepid
                              stind      = colpt-kd+1
                              edind      = min(colpt,n)
                              blklastind = colpt
                          ELSE
                              colpt      = ((myid+1)/2)*kd + sweepid
                              stind      = colpt-kd+1
                              edind      = min(colpt,n)
                              IF( ( stind.GE.edind-1 ).AND.
     $                            ( edind.EQ.n ) ) THEN
                                  blklastind = n
                              ELSE
                                  blklastind = 0
                              ENDIF
                          ENDIF
*
*                         Call the kernel
*                             
#if defined(_OPENMP) && _OPENMP >= 201307
                          IF( ttype.NE.1 ) THEN      
!$OMP TASK DEPEND(in:WORK(MYID+SHIFT-1))
!$OMP$     DEPEND(in:WORK(MYID-1))
!$OMP$     DEPEND(out:WORK(MYID))
                              tid      = omp_get_thread_num()
                              CALL chb2st_kernels( uplo, wantq, ttype, 
     $                             stind, edind, sweepid, n, kd, ib,
     $                             work( inda ), lda, 
     $                             hous( indv ), hous( indtau ), ldv,
     $                             work( indw + tid*kd ) )
!$OMP END TASK
                          ELSE
!$OMP TASK DEPEND(in:WORK(MYID+SHIFT-1))
!$OMP$     DEPEND(out:WORK(MYID))
                              tid      = omp_get_thread_num()
                              CALL chb2st_kernels( uplo, wantq, ttype, 
     $                             stind, edind, sweepid, n, kd, ib,
     $                             work( inda ), lda, 
     $                             hous( indv ), hous( indtau ), ldv,
     $                             work( indw + tid*kd ) )
!$OMP END TASK
                          ENDIF
#else
                          CALL chb2st_kernels( uplo, wantq, ttype, 
     $                         stind, edind, sweepid, n, kd, ib,
     $                         work( inda ), lda, 
     $                         hous( indv ), hous( indtau ), ldv,
     $                         work( indw + tid*kd ) )
#endif 
                          IF ( blklastind.GE.(n-1) ) THEN
                              stt = stt + 1
                              EXIT
                          ENDIF
  140                 CONTINUE
  130             CONTINUE
  120         CONTINUE
  110     CONTINUE
  100 CONTINUE
*
#if defined(_OPENMP)
!$OMP END MASTER
!$OMP END PARALLEL
#endif
*      
*     Copy the diagonal from A to D. Note that D is REAL thus only
*     the Real part is needed, the imaginary part should be zero.
*
      DO 150 i = 1, n
          d( i ) = real( work( dpos+(i-1)*lda ) )
  150 CONTINUE
*      
*     Copy the off diagonal from A to E. Note that E is REAL thus only
*     the Real part is needed, the imaginary part should be zero.
*
      IF( upper ) THEN
          DO 160 i = 1, n-1
             e( i ) = real( work( ofdpos+i*lda ) )
  160     CONTINUE
      ELSE
          DO 170 i = 1, n-1
             e( i ) = real( work( ofdpos+(i-1)*lda ) )
  170     CONTINUE
      ENDIF
*
      hous( 1 ) = lhmin
      work( 1 ) = lwmin
      RETURN
*
*     End of CHETRD_HB2ST
*

◆ chfrk()

subroutine chfrk	(	character	transr,
		character	uplo,
		character	trans,
		integer	n,
		integer	k,
		real	alpha,
		complex, dimension( lda, * )	a,
		integer	lda,
		real	beta,
		complex, dimension( * )	c )

CHFRK performs a Hermitian rank-k operation for matrix in RFP format.

Download CHFRK + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> Level 3 BLAS like routine for C in RFP Format.
!>
!> CHFRK performs one of the Hermitian rank--k operations
!>
!>    C := alpha*A*A**H + beta*C,
!>
!> or
!>
!>    C := alpha*A**H*A + beta*C,
!>
!> where alpha and beta are real scalars, C is an n--by--n Hermitian
!> matrix and A is an n--by--k matrix in the first case and a k--by--n
!> matrix in the second case.
!>

Parameters

[in]	TRANSR	!> TRANSR is CHARACTER*1 !> = 'N': The Normal Form of RFP A is stored; !> = 'C': The Conjugate-transpose Form of RFP A is stored. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> On entry, UPLO specifies whether the upper or lower !> triangular part of the array C is to be referenced as !> follows: !> !> UPLO = 'U' or 'u' Only the upper triangular part of C !> is to be referenced. !> !> UPLO = 'L' or 'l' Only the lower triangular part of C !> is to be referenced. !> !> Unchanged on exit. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> On entry, TRANS specifies the operation to be performed as !> follows: !> !> TRANS = 'N' or 'n' C := alpha*A*A**H + beta*C. !> !> TRANS = 'C' or 'c' C := alpha*A**H*A + beta*C. !> !> Unchanged on exit. !>
[in]	N	!> N is INTEGER !> On entry, N specifies the order of the matrix C. N must be !> at least zero. !> Unchanged on exit. !>
[in]	K	!> K is INTEGER !> On entry with TRANS = 'N' or 'n', K specifies the number !> of columns of the matrix A, and on entry with !> TRANS = 'C' or 'c', K specifies the number of rows of the !> matrix A. K must be at least zero. !> Unchanged on exit. !>
[in]	ALPHA	!> ALPHA is REAL !> On entry, ALPHA specifies the scalar alpha. !> Unchanged on exit. !>
[in]	A	!> A is COMPLEX array, dimension (LDA,ka) !> where KA !> is K when TRANS = 'N' or 'n', and is N otherwise. Before !> entry with TRANS = 'N' or 'n', the leading N--by--K part of !> the array A must contain the matrix A, otherwise the leading !> K--by--N part of the array A must contain the matrix A. !> Unchanged on exit. !>
[in]	LDA	!> LDA is INTEGER !> On entry, LDA specifies the first dimension of A as declared !> in the calling (sub) program. When TRANS = 'N' or 'n' !> then LDA must be at least max( 1, n ), otherwise LDA must !> be at least max( 1, k ). !> Unchanged on exit. !>
[in]	BETA	!> BETA is REAL !> On entry, BETA specifies the scalar beta. !> Unchanged on exit. !>
[in,out]	C	!> C is COMPLEX array, dimension (N*(N+1)/2) !> On entry, the matrix C in RFP Format. RFP Format is !> described by TRANSR, UPLO and N. Note that the imaginary !> parts of the diagonal elements need not be set, they are !> assumed to be zero, and on exit they are set to zero. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 166 of file chfrk.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      REAL               ALPHA, BETA
      INTEGER            K, LDA, N
      CHARACTER          TRANS, TRANSR, UPLO
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      COMPLEX            CZERO
      PARAMETER          ( one = 1.0e+0, zero = 0.0e+0 )
      PARAMETER          ( czero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LOWER, NORMALTRANSR, NISODD, NOTRANS
      INTEGER            INFO, NROWA, IDX, NK, N1, N2, IOFF, IROW2,
     $                   ICOL2
      CHARACTER          TA, TB
      COMPLEX            CALPHA, CBETA
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgemm, cherk, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, cmplx, mod
*     ..
*     .. Executable Statements ..
*
*     Decode the three option characters.
*
      normaltransr = lsame( transr, 'N' )
      lower = lsame( uplo, 'L' )
      notrans = lsame( trans, 'N' )
*
*     NROWA is the row count of A used in the LDA check:
*     N when TRANS = 'N', K otherwise.
*
      nrowa = k
      IF( notrans ) nrowa = n
*
*     Validate the arguments.  Only the first offending argument is
*     reported (argument 8 is LDA).
*
      IF( .NOT.( normaltransr .OR. lsame( transr, 'C' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( lower .OR. lsame( uplo, 'U' ) ) ) THEN
         info = -2
      ELSE IF( .NOT.( notrans .OR. lsame( trans, 'C' ) ) ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( k.LT.0 ) THEN
         info = -5
      ELSE IF( lda.LT.max( 1, nrowa ) ) THEN
         info = -8
      ELSE
         info = 0
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CHFRK ', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty matrix, or when the update term
*     vanishes (ALPHA = 0 or K = 0) while BETA = 1.
*
*     The case ALPHA = 0 with BETA different from 0 and 1 is not
*     short-cut here; it goes through the general code below.
*
      IF( n.EQ.0 ) RETURN
      IF( beta.EQ.one ) THEN
         IF( ( alpha.EQ.zero ) .OR. ( k.EQ.0 ) ) RETURN
      END IF
*
*     ALPHA = 0 and BETA = 0: the result is the zero matrix, so clear
*     all N*(N+1)/2 stored entries of C.
*
      IF( ( alpha.EQ.zero ) .AND. ( beta.EQ.zero ) ) THEN
         DO idx = 1, ( n*( n+1 ) ) / 2
            c( idx ) = czero
         END DO
         RETURN
      END IF
*
*     CGEMM takes complex scalars; CHERK takes the real ones.
*
      calpha = cmplx( alpha, zero )
      cbeta = cmplx( beta, zero )
*
*     TA is the TRANS option handed to CHERK and to the first operand
*     of CGEMM; TB is the opposite option for the second operand.
*
      IF( notrans ) THEN
         ta = 'N'
         tb = 'C'
      ELSE
         ta = 'C'
         tb = 'N'
      END IF
*
*     Split the order N.  For odd N the two diagonal blocks have
*     orders N1 and N2; for even N both have order NK.
*     IOFF is the index in A at which the second block starts.
*     (For odd N and UPLO = 'U', N2 equals N1+1.)
*
      nisodd = mod( n, 2 ).NE.0
      IF( nisodd ) THEN
         IF( lower ) THEN
            n2 = n / 2
            n1 = n - n2
            ioff = n1 + 1
         ELSE
            n1 = n / 2
            n2 = n - n1
            ioff = n2
         END IF
      ELSE
         nk = n / 2
         ioff = nk + 1
      END IF
*
*     A( IROW2, ICOL2 ) is the first element of the second block of A:
*     a row offset when TRANS = 'N', a column offset when TRANS = 'C'.
*
      IF( notrans ) THEN
         irow2 = ioff
         icol2 = 1
      ELSE
         irow2 = 1
         icol2 = ioff
      END IF
*
*     In every case below, two CHERK calls update the two triangular
*     blocks of C and one CGEMM call updates the rectangular block.
*
      IF( nisodd ) THEN
*
         IF( normaltransr .AND. lower ) THEN
*
*           N is odd, TRANSR = 'N', and UPLO = 'L'
*
            CALL cherk( 'L', ta, n1, k, alpha, a( 1, 1 ), lda,
     $                  beta, c( 1 ), n )
            CALL cherk( 'U', ta, n2, k, alpha, a( irow2, icol2 ),
     $                  lda, beta, c( n+1 ), n )
            CALL cgemm( ta, tb, n2, n1, k, calpha,
     $                  a( irow2, icol2 ), lda, a( 1, 1 ), lda,
     $                  cbeta, c( n1+1 ), n )
*
         ELSE IF( normaltransr ) THEN
*
*           N is odd, TRANSR = 'N', and UPLO = 'U'
*
            CALL cherk( 'L', ta, n1, k, alpha, a( 1, 1 ), lda,
     $                  beta, c( n2+1 ), n )
            CALL cherk( 'U', ta, n2, k, alpha, a( irow2, icol2 ),
     $                  lda, beta, c( n1+1 ), n )
            CALL cgemm( ta, tb, n1, n2, k, calpha, a( 1, 1 ), lda,
     $                  a( irow2, icol2 ), lda, cbeta, c( 1 ), n )
*
         ELSE IF( lower ) THEN
*
*           N is odd, TRANSR = 'C', and UPLO = 'L'
*
            CALL cherk( 'U', ta, n1, k, alpha, a( 1, 1 ), lda,
     $                  beta, c( 1 ), n1 )
            CALL cherk( 'L', ta, n2, k, alpha, a( irow2, icol2 ),
     $                  lda, beta, c( 2 ), n1 )
            CALL cgemm( ta, tb, n1, n2, k, calpha, a( 1, 1 ), lda,
     $                  a( irow2, icol2 ), lda, cbeta,
     $                  c( n1*n1+1 ), n1 )
*
         ELSE
*
*           N is odd, TRANSR = 'C', and UPLO = 'U'
*
            CALL cherk( 'U', ta, n1, k, alpha, a( 1, 1 ), lda,
     $                  beta, c( n2*n2+1 ), n2 )
            CALL cherk( 'L', ta, n2, k, alpha, a( irow2, icol2 ),
     $                  lda, beta, c( n1*n2+1 ), n2 )
            CALL cgemm( ta, tb, n2, n1, k, calpha,
     $                  a( irow2, icol2 ), lda, a( 1, 1 ), lda,
     $                  cbeta, c( 1 ), n2 )
*
         END IF
*
      ELSE
*
         IF( normaltransr .AND. lower ) THEN
*
*           N is even, TRANSR = 'N', and UPLO = 'L'
*
            CALL cherk( 'L', ta, nk, k, alpha, a( 1, 1 ), lda,
     $                  beta, c( 2 ), n+1 )
            CALL cherk( 'U', ta, nk, k, alpha, a( irow2, icol2 ),
     $                  lda, beta, c( 1 ), n+1 )
            CALL cgemm( ta, tb, nk, nk, k, calpha,
     $                  a( irow2, icol2 ), lda, a( 1, 1 ), lda,
     $                  cbeta, c( nk+2 ), n+1 )
*
         ELSE IF( normaltransr ) THEN
*
*           N is even, TRANSR = 'N', and UPLO = 'U'
*
            CALL cherk( 'L', ta, nk, k, alpha, a( 1, 1 ), lda,
     $                  beta, c( nk+2 ), n+1 )
            CALL cherk( 'U', ta, nk, k, alpha, a( irow2, icol2 ),
     $                  lda, beta, c( nk+1 ), n+1 )
            CALL cgemm( ta, tb, nk, nk, k, calpha, a( 1, 1 ), lda,
     $                  a( irow2, icol2 ), lda, cbeta, c( 1 ),
     $                  n+1 )
*
         ELSE IF( lower ) THEN
*
*           N is even, TRANSR = 'C', and UPLO = 'L'
*
            CALL cherk( 'U', ta, nk, k, alpha, a( 1, 1 ), lda,
     $                  beta, c( nk+1 ), nk )
            CALL cherk( 'L', ta, nk, k, alpha, a( irow2, icol2 ),
     $                  lda, beta, c( 1 ), nk )
            CALL cgemm( ta, tb, nk, nk, k, calpha, a( 1, 1 ), lda,
     $                  a( irow2, icol2 ), lda, cbeta,
     $                  c( ( ( nk+1 )*nk )+1 ), nk )
*
         ELSE
*
*           N is even, TRANSR = 'C', and UPLO = 'U'
*
            CALL cherk( 'U', ta, nk, k, alpha, a( 1, 1 ), lda,
     $                  beta, c( nk*( nk+1 )+1 ), nk )
            CALL cherk( 'L', ta, nk, k, alpha, a( irow2, icol2 ),
     $                  lda, beta, c( nk*nk+1 ), nk )
            CALL cgemm( ta, tb, nk, nk, k, calpha,
     $                  a( irow2, icol2 ), lda, a( 1, 1 ), lda,
     $                  cbeta, c( 1 ), nk )
*
         END IF
*
      END IF
*
      RETURN
*
*     End of CHFRK
*

◆ chpcon()

subroutine chpcon	(	character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		integer, dimension( * )	ipiv,
		real	anorm,
		real	rcond,
		complex, dimension( * )	work,
		integer	info )

CHPCON

Download CHPCON + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CHPCON estimates the reciprocal of the condition number of a complex
!> Hermitian packed matrix A using the factorization A = U*D*U**H or
!> A = L*D*L**H computed by CHPTRF.
!>
!> An estimate is obtained for norm(inv(A)), and the reciprocal of the
!> condition number is computed as RCOND = 1 / (ANORM * norm(inv(A))).
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the details of the factorization are stored !> as an upper or lower triangular matrix. !> = 'U': Upper triangular, form is A = U*D*U**H; !> = 'L': Lower triangular, form is A = L*D*L**H. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The block diagonal matrix D and the multipliers used to !> obtain the factor U or L as computed by CHPTRF, stored as a !> packed triangular matrix. !>
[in]	IPIV	!> IPIV is INTEGER array, dimension (N) !> Details of the interchanges and the block structure of D !> as determined by CHPTRF. !>
[in]	ANORM	!> ANORM is REAL !> The 1-norm of the original matrix A. !>
[out]	RCOND	!> RCOND is REAL !> The reciprocal of the condition number of the matrix A, !> computed as RCOND = 1/(ANORM * AINVNM), where AINVNM is an !> estimate of the 1-norm of inv(A) computed in this routine. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 117 of file chpcon.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, N
      REAL               ANORM, RCOND
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      COMPLEX            AP( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      PARAMETER          ( one = 1.0e+0, zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            DPOS, KASE, ROW
      REAL               INVNRM
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           chptrs, clacn2, xerbla
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; INFO = -i flags the i-th argument
*     (argument 5 is ANORM).
*
      upper = lsame( uplo, 'U' )
      IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( anorm.LT.zero ) THEN
         info = -5
      ELSE
         info = 0
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CHPCON', -info )
         RETURN
      END IF
*
*     Quick returns: RCOND = 1 for an empty matrix, and RCOND = 0
*     when ANORM is not positive.
*
      IF( n.EQ.0 ) THEN
         rcond = one
         RETURN
      END IF
      rcond = zero
      IF( anorm.LE.zero ) RETURN
*
*     Walk the packed diagonal.  A zero diagonal entry in a row with
*     IPIV > 0 means D is singular, so return with RCOND = 0.
*     DPOS is the packed index of the diagonal entry of row ROW.
*
      IF( upper ) THEN
*
*        Upper packed storage: start at the last diagonal entry and
*        move up.
*
         dpos = n*( n+1 ) / 2
         DO row = n, 1, -1
            IF( ipiv( row ).GT.0 ) THEN
               IF( ap( dpos ).EQ.zero ) RETURN
            END IF
            dpos = dpos - row
         END DO
      ELSE
*
*        Lower packed storage: start at the first diagonal entry and
*        move down.
*
         dpos = 1
         DO row = 1, n
            IF( ipiv( row ).GT.0 ) THEN
               IF( ap( dpos ).EQ.zero ) RETURN
            END IF
            dpos = dpos + n - row + 1
         END DO
      END IF
*
*     Estimate the 1-norm of inv(A).  CLACN2 hands control back with
*     KASE nonzero each time it needs WORK(1:N) multiplied by
*     inv(L*D*L**H) or inv(U*D*U**H); KASE = 0 ends the iteration.
*
      kase = 0
      DO
         CALL clacn2( n, work( n+1 ), work, invnrm, kase, isave )
         IF( kase.EQ.0 ) EXIT
         CALL chptrs( uplo, n, 1, ap, ipiv, work, n, info )
      END DO
*
*     Turn the norm estimate into the reciprocal condition number;
*     RCOND stays zero if the estimate is zero.
*
      IF( invnrm.NE.zero ) THEN
         rcond = ( one / invnrm ) / anorm
      END IF
*
      RETURN
*
*     End of CHPCON
*

◆ chpgst()

subroutine chpgst	(	integer	itype,
		character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		complex, dimension( * )	bp,
		integer	info )

CHPGST

Download CHPGST + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CHPGST reduces a complex Hermitian-definite generalized
!> eigenproblem to standard form, using packed storage.
!>
!> If ITYPE = 1, the problem is A*x = lambda*B*x,
!> and A is overwritten by inv(U**H)*A*inv(U) or inv(L)*A*inv(L**H)
!>
!> If ITYPE = 2 or 3, the problem is A*B*x = lambda*x or
!> B*A*x = lambda*x, and A is overwritten by U*A*U**H or L**H*A*L.
!>
!> B must have been previously factorized as U**H*U or L*L**H by CPPTRF.
!>

Parameters

[in]	ITYPE	!> ITYPE is INTEGER !> = 1: compute inv(U**H)*A*inv(U) or inv(L)*A*inv(L**H); !> = 2 or 3: compute U*A*U**H or L**H*A*L. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored and B is factored as !> U**H*U; !> = 'L': Lower triangle of A is stored and B is factored as !> L*L**H. !>
[in]	N	!> N is INTEGER !> The order of the matrices A and B. N >= 0. !>
[in,out]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> On entry, the upper or lower triangle of the Hermitian matrix !> A, packed columnwise in a linear array. The j-th column of A !> is stored in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2*n-j)/2) = A(i,j) for j<=i<=n. !> !> On exit, if INFO = 0, the transformed matrix, stored in the !> same format as A. !>
[in]	BP	!> BP is COMPLEX array, dimension (N*(N+1)/2) !> The triangular factor from the Cholesky factorization of B, !> stored in the same format as A, as returned by CPPTRF. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 112 of file chpgst.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, ITYPE, N
*     ..
*     .. Array Arguments ..
      COMPLEX            AP( * ), BP( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, HALF
      PARAMETER          ( one = 1.0e+0, half = 0.5e+0 )
      COMPLEX            CONE
      PARAMETER          ( cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            COL, CPOS, DPOS, NPOS
      REAL               ADIAG, BDIAG
      COMPLEX            CT
*     ..
*     .. External Subroutines ..
      EXTERNAL           caxpy, chpmv, chpr2, csscal, ctpmv, ctpsv,
     $                   xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          real
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      COMPLEX            CDOTC
      EXTERNAL           lsame, cdotc
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; INFO = -i flags the i-th argument.
*
      upper = lsame( uplo, 'U' )
      IF( itype.LT.1 .OR. itype.GT.3 ) THEN
         info = -1
      ELSE IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE
         info = 0
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CHPGST', -info )
         RETURN
      END IF
*
*     Index conventions used in all four cases below:
*        COL   current column,
*        DPOS  packed index of the diagonal entry of column COL,
*        CPOS  packed index of the first entry of column COL
*              (upper storage only),
*        NPOS  packed index of the next diagonal entry
*              (lower storage only).
*
      IF( itype.EQ.1 .AND. upper ) THEN
*
*        Compute inv(U**H)*A*inv(U), one column of the upper
*        triangle at a time.
*
         dpos = 0
         DO col = 1, n
            cpos = dpos + 1
            dpos = dpos + col
*
*           Drop any imaginary part of the diagonal entry first.
*
            ap( dpos ) = real( ap( dpos ) )
            bdiag = real( bp( dpos ) )
            CALL ctpsv( uplo, 'Conjugate transpose', 'Non-unit',
     $                  col, bp, ap( cpos ), 1 )
            CALL chpmv( uplo, col-1, -cone, ap, bp( cpos ), 1,
     $                  cone, ap( cpos ), 1 )
            CALL csscal( col-1, one / bdiag, ap( cpos ), 1 )
            ct = cdotc( col-1, ap( cpos ), 1, bp( cpos ), 1 )
            ap( dpos ) = ( ap( dpos )-ct ) / bdiag
         END DO
*
      ELSE IF( itype.EQ.1 ) THEN
*
*        Compute inv(L)*A*inv(L**H), updating the trailing lower
*        triangle A(col:n,col:n) at each step.
*
         dpos = 1
         DO col = 1, n
            npos = dpos + n - col + 1
            adiag = real( ap( dpos ) )
            bdiag = real( bp( dpos ) )
            adiag = adiag / bdiag**2
            ap( dpos ) = adiag
            IF( col.LT.n ) THEN
               CALL csscal( n-col, one / bdiag, ap( dpos+1 ), 1 )
               ct = -half*adiag
               CALL caxpy( n-col, ct, bp( dpos+1 ), 1,
     $                     ap( dpos+1 ), 1 )
               CALL chpr2( uplo, n-col, -cone, ap( dpos+1 ), 1,
     $                     bp( dpos+1 ), 1, ap( npos ) )
               CALL caxpy( n-col, ct, bp( dpos+1 ), 1,
     $                     ap( dpos+1 ), 1 )
               CALL ctpsv( uplo, 'No transpose', 'Non-unit',
     $                     n-col, bp( npos ), ap( dpos+1 ), 1 )
            END IF
            dpos = npos
         END DO
*
      ELSE IF( upper ) THEN
*
*        ITYPE = 2 or 3: compute U*A*U**H, updating the leading
*        upper triangle A(1:col,1:col) at each step.
*
         dpos = 0
         DO col = 1, n
            cpos = dpos + 1
            dpos = dpos + col
            adiag = real( ap( dpos ) )
            bdiag = real( bp( dpos ) )
            CALL ctpmv( uplo, 'No transpose', 'Non-unit', col-1,
     $                  bp, ap( cpos ), 1 )
            ct = half*adiag
            CALL caxpy( col-1, ct, bp( cpos ), 1, ap( cpos ), 1 )
            CALL chpr2( uplo, col-1, cone, ap( cpos ), 1,
     $                  bp( cpos ), 1, ap )
            CALL caxpy( col-1, ct, bp( cpos ), 1, ap( cpos ), 1 )
            CALL csscal( col-1, bdiag, ap( cpos ), 1 )
            ap( dpos ) = adiag*bdiag**2
         END DO
*
      ELSE
*
*        ITYPE = 2 or 3: compute L**H*A*L, one column of the lower
*        triangle at a time.
*
         dpos = 1
         DO col = 1, n
            npos = dpos + n - col + 1
            adiag = real( ap( dpos ) )
            bdiag = real( bp( dpos ) )
            ct = cdotc( n-col, ap( dpos+1 ), 1, bp( dpos+1 ), 1 )
            ap( dpos ) = adiag*bdiag + ct
            CALL csscal( n-col, bdiag, ap( dpos+1 ), 1 )
            CALL chpmv( uplo, n-col, cone, ap( npos ),
     $                  bp( dpos+1 ), 1, cone, ap( dpos+1 ), 1 )
            CALL ctpmv( uplo, 'Conjugate transpose', 'Non-unit',
     $                  n-col+1, bp( dpos ), ap( dpos ), 1 )
            dpos = npos
         END DO
*
      END IF
      RETURN
*
*     End of CHPGST
*

◆ chprfs()

subroutine chprfs	(	character	uplo,
		integer	n,
		integer	nrhs,
		complex, dimension( * )	ap,
		complex, dimension( * )	afp,
		integer, dimension( * )	ipiv,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldx, * )	x,
		integer	ldx,
		real, dimension( * )	ferr,
		real, dimension( * )	berr,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CHPRFS

Download CHPRFS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CHPRFS improves the computed solution to a system of linear
!> equations when the coefficient matrix is Hermitian indefinite
!> and packed, and provides error bounds and backward error estimates
!> for the solution.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrices B and X. NRHS >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The upper or lower triangle of the Hermitian matrix A, packed !> columnwise in a linear array. The j-th column of A is stored !> in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2*n-j)/2) = A(i,j) for j<=i<=n. !>
[in]	AFP	!> AFP is COMPLEX array, dimension (N*(N+1)/2) !> The factored form of the matrix A. AFP contains the block !> diagonal matrix D and the multipliers used to obtain the !> factor U or L from the factorization A = U*D*U**H or !> A = L*D*L**H as computed by CHPTRF, stored as a packed !> triangular matrix. !>
[in]	IPIV	!> IPIV is INTEGER array, dimension (N) !> Details of the interchanges and the block structure of D !> as determined by CHPTRF. !>
[in]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> The right hand side matrix B. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[in,out]	X	!> X is COMPLEX array, dimension (LDX,NRHS) !> On entry, the solution matrix X, as computed by CHPTRS. !> On exit, the improved solution matrix X. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the array X. LDX >= max(1,N). !>
[out]	FERR	!> FERR is REAL array, dimension (NRHS) !> The estimated forward error bound for each solution vector !> X(j) (the j-th column of the solution matrix X). !> If XTRUE is the true solution corresponding to X(j), FERR(j) !> is an estimated upper bound for the magnitude of the largest !> element in (X(j) - XTRUE) divided by the magnitude of the !> largest element in X(j). The estimate is as reliable as !> the estimate for RCOND, and is almost always a slight !> overestimate of the true error. !>
[out]	BERR	!> BERR is REAL array, dimension (NRHS) !> The componentwise relative backward error of each solution !> vector X(j) (i.e., the smallest relative change in !> any element of A or B that makes X(j) an exact solution). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Internal Parameters:

!>  ITMAX is the maximum number of steps of iterative refinement.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 178 of file chprfs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDB, LDX, N, NRHS
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      REAL               BERR( * ), FERR( * ), RWORK( * )
      COMPLEX            AFP( * ), AP( * ), B( LDB, * ), WORK( * ),
     $                   X( LDX, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     ITMAX bounds the number of refinement steps per right hand side.
      INTEGER            ITMAX
      PARAMETER          ( ITMAX = 5 )
      REAL               ZERO, TWO, THREE
      PARAMETER          ( ZERO = 0.0E+0, TWO = 2.0E+0,
     $                   THREE = 3.0E+0 )
      COMPLEX            CONE
      PARAMETER          ( CONE = ( 1.0E+0, 0.0E+0 ) )
*     ..
*     .. Local Scalars ..
*     JR     current right hand side (column of B and X)
*     JC, IR column and row of A being visited
*     KCOL   position in AP of the first stored entry of column JC
*     IP     position in AP of A(IR,JC)
*     NITER  refinement pass counter for the current right hand side
*     PRVBER backward error of the previous pass
*     XNORM  largest CABS1 entry of the final X(:,JR)
      LOGICAL            UPPER
      INTEGER            IP, IR, JC, JR, KASE, KCOL, NITER, NZ
      REAL               ACC, AXK, BEMAX, EPS, PRVBER, SAFE1, SAFE2,
     $                   SFMIN, XNORM
      COMPLEX            ZARG
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           caxpy, ccopy, chpmv, chptrs, clacn2, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, real
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SLAMCH
      EXTERNAL           lsame, slamch
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
*     CABS1(z) = |Re z| + |Im z|
      cabs1( zarg ) = abs( real( zarg ) ) + abs( aimag( zarg ) )
*     ..
*     .. Executable Statements ..
*
*     Argument validation: INFO = -i flags the i-th argument.
*
      upper = lsame( uplo, 'U' )
      info = 0
      IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( nrhs.LT.0 ) THEN
         info = -3
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -8
      ELSE IF( ldx.LT.max( 1, n ) ) THEN
         info = -10
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CHPRFS', -info )
         RETURN
      END IF
*
*     Nothing to refine for an empty system: report zero error bounds.
*
      IF( n.EQ.0 .OR. nrhs.EQ.0 ) THEN
         ferr( 1:nrhs ) = zero
         berr( 1:nrhs ) = zero
         RETURN
      END IF
*
*     NZ is the largest possible number of nonzeros in a row of A,
*     plus one.  SAFE1 and SAFE2 are the underflow guards used below.
*
      nz = n + 1
      eps = slamch( 'Epsilon' )
      sfmin = slamch( 'Safe minimum' )
      safe1 = nz*sfmin
      safe2 = safe1 / eps
*
*     Treat the right hand sides one at a time.
*
      DO jr = 1, nrhs
*
*        Iterative refinement.  PRVBER starts at THREE, so the first
*        "halved" test compares 2*BERR against THREE.
*
         niter = 1
         prvber = three
         DO
*
*           Residual R = B - A*X, formed in WORK(1:N).
*
            CALL ccopy( n, b( 1, jr ), 1, work, 1 )
            CALL chpmv( uplo, n, -cone, ap, x( 1, jr ), 1, cone,
     $                  work, 1 )
*
*           Componentwise relative backward error:
*
*              max(i) ( abs(R(i)) / ( abs(A)*abs(X) + abs(B) )(i) )
*
*           with abs() taken entry by entry.  When a denominator entry
*           does not exceed SAFE2, SAFE1 is added to both numerator
*           and denominator before the division.
*
*           Start RWORK with abs(B) ...
*
            DO ir = 1, n
               rwork( ir ) = cabs1( b( ir, jr ) )
            END DO
*
*           ... and accumulate abs(A)*abs(X) from the stored triangle.
*           Each off-diagonal entry contributes to two rows; the
*           diagonal uses only its real part.
*
            kcol = 1
            IF( upper ) THEN
               DO jc = 1, n
                  acc = zero
                  axk = cabs1( x( jc, jr ) )
                  DO ir = 1, jc - 1
                     ip = kcol + ir - 1
                     rwork( ir ) = rwork( ir ) + cabs1( ap( ip ) )*axk
                     acc = acc + cabs1( ap( ip ) )*
     $                     cabs1( x( ir, jr ) )
                  END DO
                  rwork( jc ) = rwork( jc ) +
     $               abs( real( ap( kcol+jc-1 ) ) )*axk + acc
                  kcol = kcol + jc
               END DO
            ELSE
               DO jc = 1, n
                  acc = zero
                  axk = cabs1( x( jc, jr ) )
                  rwork( jc ) = rwork( jc ) +
     $               abs( real( ap( kcol ) ) )*axk
                  DO ir = jc + 1, n
                     ip = kcol + ir - jc
                     rwork( ir ) = rwork( ir ) + cabs1( ap( ip ) )*axk
                     acc = acc + cabs1( ap( ip ) )*
     $                     cabs1( x( ir, jr ) )
                  END DO
                  rwork( jc ) = rwork( jc ) + acc
                  kcol = kcol + ( n-jc+1 )
               END DO
            END IF
*
            bemax = zero
            DO ir = 1, n
               IF( rwork( ir ).GT.safe2 ) THEN
                  bemax = max( bemax, cabs1( work( ir ) ) /
     $                    rwork( ir ) )
               ELSE
                  bemax = max( bemax, ( cabs1( work( ir ) )+safe1 ) /
     $                    ( rwork( ir )+safe1 ) )
               END IF
            END DO
            berr( jr ) = bemax
*
*           Keep refining only while all of these hold:
*              1) BERR(JR) is larger than machine epsilon,
*              2) BERR(JR) at least halved since the previous pass,
*              3) no more than ITMAX passes have been tried.
*
            IF( .NOT.( berr( jr ).GT.eps .AND.
     $          two*berr( jr ).LE.prvber .AND.
     $          niter.LE.itmax ) ) EXIT
*
*           Solve A*dX = R with the factored form and correct X.
*
            CALL chptrs( uplo, n, 1, afp, ipiv, work, n, info )
            CALL caxpy( n, cone, work, 1, x( 1, jr ), 1 )
            prvber = berr( jr )
            niter = niter + 1
         END DO
*
*        Forward error bound:
*
*        norm(X - XTRUE) / norm(X) .le. FERR =
*        norm( abs(inv(A))*
*           ( abs(R) + NZ*EPS*( abs(A)*abs(X)+abs(B) ))) / norm(X)
*
*        where norm(Z) is the magnitude of the largest component of Z,
*        inv(A) is the inverse of A, abs(Z) is the componentwise
*        absolute value, NZ is the maximum number of nonzeros in any
*        row of A plus 1, and EPS is machine epsilon.
*
*        Entry i of abs(R)+NZ*EPS*(abs(A)*abs(X)+abs(B)) gets SAFE1
*        added when entry i of abs(A)*abs(X)+abs(B) does not exceed
*        SAFE2.  The result W overwrites RWORK.
*
         DO ir = 1, n
            IF( rwork( ir ).GT.safe2 ) THEN
               rwork( ir ) = cabs1( work( ir ) ) + nz*eps*rwork( ir )
            ELSE
               rwork( ir ) = cabs1( work( ir ) ) + nz*eps*rwork( ir ) +
     $                       safe1
            END IF
         END DO
*
*        CLACN2 estimates the infinity-norm of inv(A)*diag(W).  It is
*        called repeatedly; each return with KASE nonzero asks for one
*        product applied to WORK(1:N), and KASE = 0 ends the loop with
*        the estimate in FERR(JR).
*
         kase = 0
         DO
            CALL clacn2( n, work( n+1 ), work, ferr( jr ), kase,
     $                   isave )
            IF( kase.EQ.0 ) EXIT
            SELECT CASE( kase )
            CASE( 1 )
*
*              Multiply by diag(W)*inv(A**H).
*
               CALL chptrs( uplo, n, 1, afp, ipiv, work, n, info )
               work( 1:n ) = rwork( 1:n )*work( 1:n )
            CASE( 2 )
*
*              Multiply by inv(A)*diag(W).
*
               work( 1:n ) = rwork( 1:n )*work( 1:n )
               CALL chptrs( uplo, n, 1, afp, ipiv, work, n, info )
            END SELECT
         END DO
*
*        Scale the estimate by the largest entry of X(:,JR), unless
*        that entry is zero.
*
         xnorm = zero
         DO ir = 1, n
            xnorm = max( xnorm, cabs1( x( ir, jr ) ) )
         END DO
         IF( xnorm.NE.zero ) ferr( jr ) = ferr( jr ) / xnorm
*
      END DO
*
      RETURN
*
*     End of CHPRFS
*

◆ chptrd()

subroutine chptrd	(	character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		real, dimension( * )	d,
		real, dimension( * )	e,
		complex, dimension( * )	tau,
		integer	info )

CHPTRD

Download CHPTRD + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CHPTRD reduces a complex Hermitian matrix A stored in packed form to
!> real symmetric tridiagonal form T by a unitary similarity
!> transformation: Q**H * A * Q = T.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> On entry, the upper or lower triangle of the Hermitian matrix !> A, packed columnwise in a linear array. The j-th column of A !> is stored in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2*n-j)/2) = A(i,j) for j<=i<=n. !> On exit, if UPLO = 'U', the diagonal and first superdiagonal !> of A are overwritten by the corresponding elements of the !> tridiagonal matrix T, and the elements above the first !> superdiagonal, with the array TAU, represent the unitary !> matrix Q as a product of elementary reflectors; if UPLO !> = 'L', the diagonal and first subdiagonal of A are over- !> written by the corresponding elements of the tridiagonal !> matrix T, and the elements below the first subdiagonal, with !> the array TAU, represent the unitary matrix Q as a product !> of elementary reflectors. See Further Details. !>
[out]	D	!> D is REAL array, dimension (N) !> The diagonal elements of the tridiagonal matrix T: !> D(i) = A(i,i). !>
[out]	E	!> E is REAL array, dimension (N-1) !> The off-diagonal elements of the tridiagonal matrix T: !> E(i) = A(i,i+1) if UPLO = 'U', E(i) = A(i+1,i) if UPLO = 'L'. !>
[out]	TAU	!> TAU is COMPLEX array, dimension (N-1) !> The scalar factors of the elementary reflectors (see Further !> Details). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  If UPLO = 'U', the matrix Q is represented as a product of elementary
!>  reflectors
!>
!>     Q = H(n-1) . . . H(2) H(1).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - tau * v * v**H
!>
!>  where tau is a complex scalar, and v is a complex vector with
!>  v(i+1:n) = 0 and v(i) = 1; v(1:i-1) is stored on exit in AP,
!>  overwriting A(1:i-1,i+1), and tau is stored in TAU(i).
!>
!>  If UPLO = 'L', the matrix Q is represented as a product of elementary
!>  reflectors
!>
!>     Q = H(1) H(2) . . . H(n-1).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - tau * v * v**H
!>
!>  where tau is a complex scalar, and v is a complex vector with
!>  v(1:i) = 0 and v(i+1) = 1; v(i+2:n) is stored on exit in AP,
!>  overwriting A(i+2:n,i), and tau is stored in TAU(i).
!>

Definition at line 150 of file chptrd.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      REAL               D( * ), E( * )
      COMPLEX            AP( * ), TAU( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CONE, CZERO, CHALF
      PARAMETER          ( CONE = ( 1.0E+0, 0.0E+0 ),
     $                   CZERO = ( 0.0E+0, 0.0E+0 ),
     $                   CHALF = ( 0.5E+0, 0.0E+0 ) )
*     ..
*     .. Local Scalars ..
*     K      index of the reflector H(K) being generated
*     JTOP   (upper) position in AP of A(1,K+1)
*     JD     (lower) position in AP of A(K,K)
*     JNEXT  (lower) position in AP of A(K+1,K+1)
*     BETA   scalar returned by CLARFG in place of the pivot entry
*     TAUK   scalar factor of H(K)
*     WSCAL  coefficient of v in the formula for w
      LOGICAL            UPPER
      INTEGER            JD, JNEXT, JTOP, K
      COMPLEX            BETA, TAUK, WSCAL
*     ..
*     .. External Subroutines ..
      EXTERNAL           caxpy, chpmv, chpr2, clarfg, xerbla
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      COMPLEX            CDOTC
      EXTERNAL           lsame, cdotc
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          real
*     ..
*     .. Executable Statements ..
*
*     Argument validation: INFO = -i flags the i-th argument.
*
      upper = lsame( uplo, 'U' )
      info = 0
      IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CHPTRD', -info )
         RETURN
      END IF
*
*     An empty matrix needs no work.
*
      IF( n.LE.0 ) RETURN
*
      IF( upper ) THEN
*
*        Upper triangle: work backwards from the last column.  The
*        imaginary part of A(n,n) is dropped first.
*
         jtop = n*( n-1 ) / 2 + 1
         ap( jtop+n-1 ) = real( ap( jtop+n-1 ) )
         DO k = n - 1, 1, -1
*
*           Build H(k) = I - tau * v * v**H, which annihilates
*           A(1:k-1,k+1).
*
            beta = ap( jtop+k-1 )
            CALL clarfg( k, beta, ap( jtop ), 1, tauk )
            e( k ) = real( beta )
*
            IF( tauk.NE.czero ) THEN
*
*              Two-sided application of H(k) to A(1:k,1:k); the
*              pivot entry temporarily holds v(k) = 1.
*
               ap( jtop+k-1 ) = cone
*
*              y := tau * A * v, kept in TAU(1:k)
*
               CALL chpmv( uplo, k, tauk, ap, ap( jtop ), 1,
     $                     czero, tau, 1 )
*
*              w := y - 1/2 * tau * (y**H *v) * v
*
               wscal = -chalf*tauk*cdotc( k, tau, 1, ap( jtop ), 1 )
               CALL caxpy( k, wscal, ap( jtop ), 1, tau, 1 )
*
*              Rank-2 update  A := A - v * w**H - w * v**H
*
               CALL chpr2( uplo, k, -cone, ap( jtop ), 1, tau, 1,
     $                     ap )
*
            END IF
*
*           Record the off-diagonal and diagonal of T and the scalar
*           factor, then step to the previous column.
*
            ap( jtop+k-1 ) = e( k )
            d( k+1 ) = real( ap( jtop+k ) )
            tau( k ) = tauk
            jtop = jtop - k
         END DO
         d( 1 ) = real( ap( 1 ) )
      ELSE
*
*        Lower triangle: work forwards from the first column.  The
*        imaginary part of A(1,1) is dropped first.
*
         jd = 1
         ap( 1 ) = real( ap( 1 ) )
         DO k = 1, n - 1
            jnext = jd + n - k + 1
*
*           Build H(k) = I - tau * v * v**H, which annihilates
*           A(k+2:n,k).
*
            beta = ap( jd+1 )
            CALL clarfg( n-k, beta, ap( jd+2 ), 1, tauk )
            e( k ) = real( beta )
*
            IF( tauk.NE.czero ) THEN
*
*              Two-sided application of H(k) to A(k+1:n,k+1:n); the
*              subdiagonal entry temporarily holds v(k+1) = 1.
*
               ap( jd+1 ) = cone
*
*              y := tau * A * v, kept in TAU(k:n-1)
*
               CALL chpmv( uplo, n-k, tauk, ap( jnext ),
     $                     ap( jd+1 ), 1, czero, tau( k ), 1 )
*
*              w := y - 1/2 * tau * (y**H *v) * v
*
               wscal = -chalf*tauk*cdotc( n-k, tau( k ), 1,
     $                 ap( jd+1 ), 1 )
               CALL caxpy( n-k, wscal, ap( jd+1 ), 1, tau( k ), 1 )
*
*              Rank-2 update  A := A - v * w**H - w * v**H
*
               CALL chpr2( uplo, n-k, -cone, ap( jd+1 ), 1,
     $                     tau( k ), 1, ap( jnext ) )
*
            END IF
*
*           Record the off-diagonal and diagonal of T and the scalar
*           factor, then step to the next column.
*
            ap( jd+1 ) = e( k )
            d( k ) = real( ap( jd ) )
            tau( k ) = tauk
            jd = jnext
         END DO
         d( n ) = real( ap( jd ) )
      END IF
*
      RETURN
*
*     End of CHPTRD
*

◆ chptrf()

subroutine chptrf	(	character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		integer, dimension( * )	ipiv,
		integer	info )

CHPTRF

Download CHPTRF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CHPTRF computes the factorization of a complex Hermitian packed
!> matrix A using the Bunch-Kaufman diagonal pivoting method:
!>
!>    A = U*D*U**H  or  A = L*D*L**H
!>
!> where U (or L) is a product of permutation and unit upper (lower)
!> triangular matrices, and D is Hermitian and block diagonal with
!> 1-by-1 and 2-by-2 diagonal blocks.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> On entry, the upper or lower triangle of the Hermitian matrix !> A, packed columnwise in a linear array. The j-th column of A !> is stored in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !> !> On exit, the block diagonal matrix D and the multipliers used !> to obtain the factor U or L, stored as a packed triangular !> matrix overwriting A (see below for further details). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (N) !> Details of the interchanges and the block structure of D. !> If IPIV(k) > 0, then rows and columns k and IPIV(k) were !> interchanged and D(k,k) is a 1-by-1 diagonal block. !> If UPLO = 'U' and IPIV(k) = IPIV(k-1) < 0, then rows and !> columns k-1 and -IPIV(k) were interchanged and D(k-1:k,k-1:k) !> is a 2-by-2 diagonal block. If UPLO = 'L' and IPIV(k) = !> IPIV(k+1) < 0, then rows and columns k+1 and -IPIV(k) were !> interchanged and D(k:k+1,k:k+1) is a 2-by-2 diagonal block. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, D(i,i) is exactly zero. The factorization !> has been completed, but the block diagonal matrix D is !> exactly singular, and division by zero will occur if it !> is used to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  If UPLO = 'U', then A = U*D*U**H, where
!>     U = P(n)*U(n)* ... *P(k)*U(k)* ...,
!>  i.e., U is a product of terms P(k)*U(k), where k decreases from n to
!>  1 in steps of 1 or 2, and D is a block diagonal matrix with 1-by-1
!>  and 2-by-2 diagonal blocks D(k).  P(k) is a permutation matrix as
!>  defined by IPIV(k), and U(k) is a unit upper triangular matrix, such
!>  that if the diagonal block D(k) is of order s (s = 1 or 2), then
!>
!>             (   I    v    0   )   k-s
!>     U(k) =  (   0    I    0   )   s
!>             (   0    0    I   )   n-k
!>                k-s   s   n-k
!>
!>  If s = 1, D(k) overwrites A(k,k), and v overwrites A(1:k-1,k).
!>  If s = 2, the upper triangle of D(k) overwrites A(k-1,k-1), A(k-1,k),
!>  and A(k,k), and v overwrites A(1:k-2,k-1:k).
!>
!>  If UPLO = 'L', then A = L*D*L**H, where
!>     L = P(1)*L(1)* ... *P(k)*L(k)* ...,
!>  i.e., L is a product of terms P(k)*L(k), where k increases from 1 to
!>  n in steps of 1 or 2, and D is a block diagonal matrix with 1-by-1
!>  and 2-by-2 diagonal blocks D(k).  P(k) is a permutation matrix as
!>  defined by IPIV(k), and L(k) is a unit lower triangular matrix, such
!>  that if the diagonal block D(k) is of order s (s = 1 or 2), then
!>
!>             (   I    0     0   )  k-1
!>     L(k) =  (   0    I     0   )  s
!>             (   0    v     I   )  n-k-s+1
!>                k-1   s  n-k-s+1
!>
!>  If s = 1, D(k) overwrites A(k,k), and v overwrites A(k+1:n,k).
!>  If s = 2, the lower triangle of D(k) overwrites A(k,k), A(k+1,k),
!>  and A(k+1,k+1), and v overwrites A(k+2:n,k:k+1).
!>

Contributors: J. Lewis, Boeing Computer Services Company

Definition at line 158 of file chptrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      COMPLEX            AP( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE
      parameter( zero = 0.0e+0, one = 1.0e+0 )
      REAL               EIGHT, SEVTEN
      parameter( eight = 8.0e+0, sevten = 17.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            I, IMAX, J, JMAX, K, KC, KK, KNC, KP, KPC,
     $                   KSTEP, KX, NPP
      REAL               ABSAKK, ALPHA, COLMAX, D, D11, D22, R1, ROWMAX,
     $                   TT
      COMPLEX            D12, D21, T, WK, WKM1, WKP1, ZDUM
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ICAMAX
      REAL               SLAPY2
      EXTERNAL           lsame, icamax, slapy2
*     ..
*     .. External Subroutines ..
      EXTERNAL           chpr, csscal, cswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, cmplx, conjg, max, real, sqrt
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
      cabs1( zdum ) = abs( real( zdum ) ) + abs( aimag( zdum ) )
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CHPTRF', -info )
         RETURN
      END IF
*
*     Initialize ALPHA for use in choosing pivot block size.
*
      alpha = ( one+sqrt( sevten ) ) / eight
*
      IF( upper ) THEN
*
*        Factorize A as U*D*U**H using the upper triangle of A
*
*        K is the main loop index, decreasing from N to 1 in steps of
*        1 or 2
*
         k = n
         kc = ( n-1 )*n / 2 + 1
   10    CONTINUE
         knc = kc
*
*        If K < 1, exit from loop
*
         IF( k.LT.1 )
     $      GO TO 110
         kstep = 1
*
*        Determine rows and columns to be interchanged and whether
*        a 1-by-1 or 2-by-2 pivot block will be used
*
         absakk = abs( real( ap( kc+k-1 ) ) )
*
*        IMAX is the row-index of the largest off-diagonal element in
*        column K, and COLMAX is its absolute value
*
         IF( k.GT.1 ) THEN
            imax = icamax( k-1, ap( kc ), 1 )
            colmax = cabs1( ap( kc+imax-1 ) )
         ELSE
            colmax = zero
         END IF
*
         IF( max( absakk, colmax ).EQ.zero ) THEN
*
*           Column K is zero: set INFO and continue
*
            IF( info.EQ.0 )
     $         info = k
            kp = k
            ap( kc+k-1 ) = real( ap( kc+k-1 ) )
         ELSE
            IF( absakk.GE.alpha*colmax ) THEN
*
*              no interchange, use 1-by-1 pivot block
*
               kp = k
            ELSE
*
*              JMAX is the column-index of the largest off-diagonal
*              element in row IMAX, and ROWMAX is its absolute value
*
               rowmax = zero
               jmax = imax
               kx = imax*( imax+1 ) / 2 + imax
               DO 20 j = imax + 1, k
                  IF( cabs1( ap( kx ) ).GT.rowmax ) THEN
                     rowmax = cabs1( ap( kx ) )
                     jmax = j
                  END IF
                  kx = kx + j
   20          CONTINUE
               kpc = ( imax-1 )*imax / 2 + 1
               IF( imax.GT.1 ) THEN
                  jmax = icamax( imax-1, ap( kpc ), 1 )
                  rowmax = max( rowmax, cabs1( ap( kpc+jmax-1 ) ) )
               END IF
*
               IF( absakk.GE.alpha*colmax*( colmax / rowmax ) ) THEN
*
*                 no interchange, use 1-by-1 pivot block
*
                  kp = k
               ELSE IF( abs( real( ap( kpc+imax-1 ) ) ).GE.alpha*
     $                  rowmax ) THEN
*
*                 interchange rows and columns K and IMAX, use 1-by-1
*                 pivot block
*
                  kp = imax
               ELSE
*
*                 interchange rows and columns K-1 and IMAX, use 2-by-2
*                 pivot block
*
                  kp = imax
                  kstep = 2
               END IF
            END IF
*
            kk = k - kstep + 1
            IF( kstep.EQ.2 )
     $         knc = knc - k + 1
            IF( kp.NE.kk ) THEN
*
*              Interchange rows and columns KK and KP in the leading
*              submatrix A(1:k,1:k)
*
               CALL cswap( kp-1, ap( knc ), 1, ap( kpc ), 1 )
               kx = kpc + kp - 1
               DO 30 j = kp + 1, kk - 1
                  kx = kx + j - 1
                  t = conjg( ap( knc+j-1 ) )
                  ap( knc+j-1 ) = conjg( ap( kx ) )
                  ap( kx ) = t
   30          CONTINUE
               ap( kx+kk-1 ) = conjg( ap( kx+kk-1 ) )
               r1 = real( ap( knc+kk-1 ) )
               ap( knc+kk-1 ) = real( ap( kpc+kp-1 ) )
               ap( kpc+kp-1 ) = r1
               IF( kstep.EQ.2 ) THEN
                  ap( kc+k-1 ) = real( ap( kc+k-1 ) )
                  t = ap( kc+k-2 )
                  ap( kc+k-2 ) = ap( kc+kp-1 )
                  ap( kc+kp-1 ) = t
               END IF
            ELSE
               ap( kc+k-1 ) = real( ap( kc+k-1 ) )
               IF( kstep.EQ.2 )
     $            ap( kc-1 ) = real( ap( kc-1 ) )
            END IF
*
*           Update the leading submatrix
*
            IF( kstep.EQ.1 ) THEN
*
*              1-by-1 pivot block D(k): column k now holds
*
*              W(k) = U(k)*D(k)
*
*              where U(k) is the k-th column of U
*
*              Perform a rank-1 update of A(1:k-1,1:k-1) as
*
*              A := A - U(k)*D(k)*U(k)**H = A - W(k)*1/D(k)*W(k)**H
*
               r1 = one / real( ap( kc+k-1 ) )
               CALL chpr( uplo, k-1, -r1, ap( kc ), 1, ap )
*
*              Store U(k) in column k
*
               CALL csscal( k-1, r1, ap( kc ), 1 )
            ELSE
*
*              2-by-2 pivot block D(k): columns k and k-1 now hold
*
*              ( W(k-1) W(k) ) = ( U(k-1) U(k) )*D(k)
*
*              where U(k) and U(k-1) are the k-th and (k-1)-th columns
*              of U
*
*              Perform a rank-2 update of A(1:k-2,1:k-2) as
*
*              A := A - ( U(k-1) U(k) )*D(k)*( U(k-1) U(k) )**H
*                 = A - ( W(k-1) W(k) )*inv(D(k))*( W(k-1) W(k) )**H
*
               IF( k.GT.2 ) THEN
*
                  d = slapy2( real( ap( k-1+( k-1 )*k / 2 ) ),
     $                aimag( ap( k-1+( k-1 )*k / 2 ) ) )
                  d22 = real( ap( k-1+( k-2 )*( k-1 ) / 2 ) ) / d
                  d11 = real( ap( k+( k-1 )*k / 2 ) ) / d
                  tt = one / ( d11*d22-one )
                  d12 = ap( k-1+( k-1 )*k / 2 ) / d
                  d = tt / d
*
                  DO 50 j = k - 2, 1, -1
                     wkm1 = d*( d11*ap( j+( k-2 )*( k-1 ) / 2 )-
     $                      conjg( d12 )*ap( j+( k-1 )*k / 2 ) )
                     wk = d*( d22*ap( j+( k-1 )*k / 2 )-d12*
     $                    ap( j+( k-2 )*( k-1 ) / 2 ) )
                     DO 40 i = j, 1, -1
                        ap( i+( j-1 )*j / 2 ) = ap( i+( j-1 )*j / 2 ) -
     $                     ap( i+( k-1 )*k / 2 )*conjg( wk ) -
     $                     ap( i+( k-2 )*( k-1 ) / 2 )*conjg( wkm1 )
   40                CONTINUE
                     ap( j+( k-1 )*k / 2 ) = wk
                     ap( j+( k-2 )*( k-1 ) / 2 ) = wkm1
                     ap( j+( j-1 )*j / 2 ) = cmplx( real( ap( j+( j-1 )*
     $                                       j / 2 ) ), 0.0e+0 )
   50             CONTINUE
*
               END IF
*
            END IF
         END IF
*
*        Store details of the interchanges in IPIV
*
         IF( kstep.EQ.1 ) THEN
            ipiv( k ) = kp
         ELSE
            ipiv( k ) = -kp
            ipiv( k-1 ) = -kp
         END IF
*
*        Decrease K and return to the start of the main loop
*
         k = k - kstep
         kc = knc - k
         GO TO 10
*
      ELSE
*
*        Factorize A as L*D*L**H using the lower triangle of A
*
*        K is the main loop index, increasing from 1 to N in steps of
*        1 or 2
*
         k = 1
         kc = 1
         npp = n*( n+1 ) / 2
   60    CONTINUE
         knc = kc
*
*        If K > N, exit from loop
*
         IF( k.GT.n )
     $      GO TO 110
         kstep = 1
*
*        Determine rows and columns to be interchanged and whether
*        a 1-by-1 or 2-by-2 pivot block will be used
*
         absakk = abs( real( ap( kc ) ) )
*
*        IMAX is the row-index of the largest off-diagonal element in
*        column K, and COLMAX is its absolute value
*
         IF( k.LT.n ) THEN
            imax = k + icamax( n-k, ap( kc+1 ), 1 )
            colmax = cabs1( ap( kc+imax-k ) )
         ELSE
            colmax = zero
         END IF
*
         IF( max( absakk, colmax ).EQ.zero ) THEN
*
*           Column K is zero: set INFO and continue
*
            IF( info.EQ.0 )
     $         info = k
            kp = k
            ap( kc ) = real( ap( kc ) )
         ELSE
            IF( absakk.GE.alpha*colmax ) THEN
*
*              no interchange, use 1-by-1 pivot block
*
               kp = k
            ELSE
*
*              JMAX is the column-index of the largest off-diagonal
*              element in row IMAX, and ROWMAX is its absolute value
*
               rowmax = zero
               kx = kc + imax - k
               DO 70 j = k, imax - 1
                  IF( cabs1( ap( kx ) ).GT.rowmax ) THEN
                     rowmax = cabs1( ap( kx ) )
                     jmax = j
                  END IF
                  kx = kx + n - j
   70          CONTINUE
               kpc = npp - ( n-imax+1 )*( n-imax+2 ) / 2 + 1
               IF( imax.LT.n ) THEN
                  jmax = imax + icamax( n-imax, ap( kpc+1 ), 1 )
                  rowmax = max( rowmax, cabs1( ap( kpc+jmax-imax ) ) )
               END IF
*
               IF( absakk.GE.alpha*colmax*( colmax / rowmax ) ) THEN
*
*                 no interchange, use 1-by-1 pivot block
*
                  kp = k
               ELSE IF( abs( real( ap( kpc ) ) ).GE.alpha*rowmax ) THEN
*
*                 interchange rows and columns K and IMAX, use 1-by-1
*                 pivot block
*
                  kp = imax
               ELSE
*
*                 interchange rows and columns K+1 and IMAX, use 2-by-2
*                 pivot block
*
                  kp = imax
                  kstep = 2
               END IF
            END IF
*
            kk = k + kstep - 1
            IF( kstep.EQ.2 )
     $         knc = knc + n - k + 1
            IF( kp.NE.kk ) THEN
*
*              Interchange rows and columns KK and KP in the trailing
*              submatrix A(k:n,k:n)
*
               IF( kp.LT.n )
     $            CALL cswap( n-kp, ap( knc+kp-kk+1 ), 1, ap( kpc+1 ),
     $                        1 )
               kx = knc + kp - kk
               DO 80 j = kk + 1, kp - 1
                  kx = kx + n - j + 1
                  t = conjg( ap( knc+j-kk ) )
                  ap( knc+j-kk ) = conjg( ap( kx ) )
                  ap( kx ) = t
   80          CONTINUE
               ap( knc+kp-kk ) = conjg( ap( knc+kp-kk ) )
               r1 = real( ap( knc ) )
               ap( knc ) = real( ap( kpc ) )
               ap( kpc ) = r1
               IF( kstep.EQ.2 ) THEN
                  ap( kc ) = real( ap( kc ) )
                  t = ap( kc+1 )
                  ap( kc+1 ) = ap( kc+kp-k )
                  ap( kc+kp-k ) = t
               END IF
            ELSE
               ap( kc ) = real( ap( kc ) )
               IF( kstep.EQ.2 )
     $            ap( knc ) = real( ap( knc ) )
            END IF
*
*           Update the trailing submatrix
*
            IF( kstep.EQ.1 ) THEN
*
*              1-by-1 pivot block D(k): column k now holds
*
*              W(k) = L(k)*D(k)
*
*              where L(k) is the k-th column of L
*
               IF( k.LT.n ) THEN
*
*                 Perform a rank-1 update of A(k+1:n,k+1:n) as
*
*                 A := A - L(k)*D(k)*L(k)**H = A - W(k)*(1/D(k))*W(k)**H
*
                  r1 = one / real( ap( kc ) )
                  CALL chpr( uplo, n-k, -r1, ap( kc+1 ), 1,
     $                       ap( kc+n-k+1 ) )
*
*                 Store L(k) in column K
*
                  CALL csscal( n-k, r1, ap( kc+1 ), 1 )
               END IF
            ELSE
*
*              2-by-2 pivot block D(k): columns K and K+1 now hold
*
*              ( W(k) W(k+1) ) = ( L(k) L(k+1) )*D(k)
*
*              where L(k) and L(k+1) are the k-th and (k+1)-th columns
*              of L
*
               IF( k.LT.n-1 ) THEN
*
*                 Perform a rank-2 update of A(k+2:n,k+2:n) as
*
*                 A := A - ( L(k) L(k+1) )*D(k)*( L(k) L(k+1) )**H
*                    = A - ( W(k) W(k+1) )*inv(D(k))*( W(k) W(k+1) )**H
*
*                 where L(k) and L(k+1) are the k-th and (k+1)-th
*                 columns of L
*
                  d = slapy2( real( ap( k+1+( k-1 )*( 2*n-k ) / 2 ) ),
     $                aimag( ap( k+1+( k-1 )*( 2*n-k ) / 2 ) ) )
                  d11 = real( ap( k+1+k*( 2*n-k-1 ) / 2 ) ) / d
                  d22 = real( ap( k+( k-1 )*( 2*n-k ) / 2 ) ) / d
                  tt = one / ( d11*d22-one )
                  d21 = ap( k+1+( k-1 )*( 2*n-k ) / 2 ) / d
                  d = tt / d
*
                  DO 100 j = k + 2, n
                     wk = d*( d11*ap( j+( k-1 )*( 2*n-k ) / 2 )-d21*
     $                    ap( j+k*( 2*n-k-1 ) / 2 ) )
                     wkp1 = d*( d22*ap( j+k*( 2*n-k-1 ) / 2 )-
     $                      conjg( d21 )*ap( j+( k-1 )*( 2*n-k ) / 2 ) )
                     DO 90 i = j, n
                        ap( i+( j-1 )*( 2*n-j ) / 2 ) = ap( i+( j-1 )*
     $                     ( 2*n-j ) / 2 ) - ap( i+( k-1 )*( 2*n-k ) /
     $                     2 )*conjg( wk ) - ap( i+k*( 2*n-k-1 ) / 2 )*
     $                     conjg( wkp1 )
   90                CONTINUE
                     ap( j+( k-1 )*( 2*n-k ) / 2 ) = wk
                     ap( j+k*( 2*n-k-1 ) / 2 ) = wkp1
                     ap( j+( j-1 )*( 2*n-j ) / 2 )
     $                  = cmplx( real( ap( j+( j-1 )*( 2*n-j ) / 2 ) ),
     $                  0.0e+0 )
  100             CONTINUE
               END IF
            END IF
         END IF
*
*        Store details of the interchanges in IPIV
*
         IF( kstep.EQ.1 ) THEN
            ipiv( k ) = kp
         ELSE
            ipiv( k ) = -kp
            ipiv( k+1 ) = -kp
         END IF
*
*        Increase K and return to the start of the main loop
*
         k = k + kstep
         kc = knc + n - k + 2
         GO TO 60
*
      END IF
*
  110 CONTINUE
      RETURN
*
*     End of CHPTRF
*

◆ chptri()

subroutine chptri	(	character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		integer, dimension( * )	ipiv,
		complex, dimension( * )	work,
		integer	info )

CHPTRI

Download CHPTRI + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CHPTRI computes the inverse of a complex Hermitian indefinite matrix
!> A in packed storage using the factorization A = U*D*U**H or
!> A = L*D*L**H computed by CHPTRF.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the details of the factorization are stored !> as an upper or lower triangular matrix. !> = 'U': Upper triangular, form is A = U*D*U**H; !> = 'L': Lower triangular, form is A = L*D*L**H. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> On entry, the block diagonal matrix D and the multipliers !> used to obtain the factor U or L as computed by CHPTRF, !> stored as a packed triangular matrix. !> !> On exit, if INFO = 0, the (Hermitian) inverse of the original !> matrix, stored as a packed triangular matrix. The j-th column !> of inv(A) is stored in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = inv(A)(i,j) for 1<=i<=j; !> if UPLO = 'L', !> AP(i + (j-1)*(2n-j)/2) = inv(A)(i,j) for j<=i<=n. !>
[in]	IPIV	!> IPIV is INTEGER array, dimension (N) !> Details of the interchanges and the block structure of D !> as determined by CHPTRF. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, D(i,i) = 0; the matrix is singular and its !> inverse could not be computed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 108 of file chptri.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of CHPTRI: overwrites the packed factorization held in AP with
*  the inverse of the factored matrix.  IPIV supplies the block
*  structure of D and the interchanges; WORK is used as a scratch
*  vector for one column at a time.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      COMPLEX            AP( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     ONE is real; CONE and ZERO are the complex constants passed to
*     CHPMV and used in the zero-pivot comparison.
      REAL               ONE
      COMPLEX            CONE, ZERO
      parameter( one = 1.0e+0, cone = ( 1.0e+0, 0.0e+0 ),
     $                   zero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
*     KC      packed index of the first stored element of column K
*     KCNEXT  value KC takes when the loop moves to the next block
*     KP      row/column interchanged with K, taken as ABS(IPIV(K))
*     KPC     packed index of the first stored element of column KP
*     KSTEP   size of the diagonal block being processed (1 or 2)
*     NPP     N*(N+1)/2, the index of the last packed element
      LOGICAL            UPPER
      INTEGER            J, K, KC, KCNEXT, KP, KPC, KSTEP, KX, NPP
      REAL               AK, AKP1, D, T
      COMPLEX            AKKP1, TEMP
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      COMPLEX            CDOTC
      EXTERNAL           lsame, cdotc
*     ..
*     .. External Subroutines ..
      EXTERNAL           ccopy, chpmv, cswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, conjg, real
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
*     A bad UPLO or N is reported through XERBLA with the (positive)
*     argument position, and the routine returns with INFO negative.
*
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CHPTRI', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Check that the diagonal matrix D is nonsingular.
*
*     INFO is used as the loop index, so the early RETURN below leaves
*     INFO equal to the position of the zero pivot.  Only positions
*     with IPIV > 0 (1-by-1 blocks) are tested.  KP walks the packed
*     indices of the diagonal entries.
*
      IF( upper ) THEN
*
*        Upper triangular storage: examine D from bottom to top
*
         kp = n*( n+1 ) / 2
         DO 10 info = n, 1, -1
            IF( ipiv( info ).GT.0 .AND. ap( kp ).EQ.zero )
     $         RETURN
            kp = kp - info
   10    CONTINUE
      ELSE
*
*        Lower triangular storage: examine D from top to bottom.
*
         kp = 1
         DO 20 info = 1, n
            IF( ipiv( info ).GT.0 .AND. ap( kp ).EQ.zero )
     $         RETURN
            kp = kp + n - info + 1
   20    CONTINUE
      END IF
*     No zero pivot was found: clear the loop index left in INFO.
      info = 0
*
      IF( upper ) THEN
*
*        Compute inv(A) from the factorization A = U*D*U**H.
*
*        K is the main loop index, increasing from 1 to N in steps of
*        1 or 2, depending on the size of the diagonal blocks.
*
         k = 1
         kc = 1
   30    CONTINUE
*
*        If K > N, exit from loop.
*
         IF( k.GT.n )
     $      GO TO 50
*
*        Column K holds K packed elements, so column K+1 starts at
*        KC+K and the diagonal entry of column K is AP(KC+K-1).
*
         kcnext = kc + k
         IF( ipiv( k ).GT.0 ) THEN
*
*           1 x 1 diagonal block
*
*           Invert the diagonal block.
*
            ap( kc+k-1 ) = one / real( ap( kc+k-1 ) )
*
*           Compute column K of the inverse.
*
*           The off-diagonal part of column K is saved in WORK, then
*           replaced by minus the product of the already inverted
*           leading (K-1)-by-(K-1) packed block with that saved
*           vector; the diagonal entry is corrected by the real part
*           of the dot product of the saved and the new vector.
*
            IF( k.GT.1 ) THEN
               CALL ccopy( k-1, ap( kc ), 1, work, 1 )
               CALL chpmv( uplo, k-1, -cone, ap, work, 1, zero,
     $                     ap( kc ), 1 )
               ap( kc+k-1 ) = ap( kc+k-1 ) -
     $                        real( cdotc( k-1, work, 1, ap( kc ), 1 ) )
            END IF
            kstep = 1
         ELSE
*
*           2 x 2 diagonal block
*
*           Invert the diagonal block.
*
*           AP(KC+K-1) and AP(KCNEXT+K) are the two diagonal entries
*           and AP(KCNEXT+K-1) the off-diagonal entry of the block.
*           All three are divided by T, the modulus of the
*           off-diagonal entry, before D is formed (presumably to
*           keep the intermediate products well scaled).
*
            t = abs( ap( kcnext+k-1 ) )
            ak = real( ap( kc+k-1 ) ) / t
            akp1 = real( ap( kcnext+k ) ) / t
            akkp1 = ap( kcnext+k-1 ) / t
            d = t*( ak*akp1-one )
            ap( kc+k-1 ) = akp1 / d
            ap( kcnext+k ) = ak / d
            ap( kcnext+k-1 ) = -akkp1 / d
*
*           Compute columns K and K+1 of the inverse.
*
*           Column K is updated first.  The off-diagonal entry of the
*           block is corrected using the new column K and the still
*           unmodified column K+1, and only then is column K+1
*           overwritten.
*
            IF( k.GT.1 ) THEN
               CALL ccopy( k-1, ap( kc ), 1, work, 1 )
               CALL chpmv( uplo, k-1, -cone, ap, work, 1, zero,
     $                     ap( kc ), 1 )
               ap( kc+k-1 ) = ap( kc+k-1 ) -
     $                        real( cdotc( k-1, work, 1, ap( kc ), 1 ) )
               ap( kcnext+k-1 ) = ap( kcnext+k-1 ) -
     $                            cdotc( k-1, ap( kc ), 1, ap( kcnext ),
     $                            1 )
               CALL ccopy( k-1, ap( kcnext ), 1, work, 1 )
               CALL chpmv( uplo, k-1, -cone, ap, work, 1, zero,
     $                     ap( kcnext ), 1 )
               ap( kcnext+k ) = ap( kcnext+k ) -
     $                          real( cdotc( k-1, work, 1, ap( kcnext ),
     $                          1 ) )
            END IF
            kstep = 2
*           Skip over column K+1 as well (it holds K+1 elements).
            kcnext = kcnext + k + 1
         END IF
*
         kp = abs( ipiv( k ) )
         IF( kp.NE.k ) THEN
*
*           Interchange rows and columns K and KP in the leading
*           submatrix A(1:k+1,1:k+1)
*
*           Loop 40 only runs when KP < K-1.  It exchanges the entries
*           of column K in rows KP+1..K-1 with the entries of row KP
*           in columns KP+1..K-1, conjugating both; KX steps along
*           row KP from one packed column to the next.
*
            kpc = ( kp-1 )*kp / 2 + 1
            CALL cswap( kp-1, ap( kc ), 1, ap( kpc ), 1 )
            kx = kpc + kp - 1
            DO 40 j = kp + 1, k - 1
               kx = kx + j - 1
               temp = conjg( ap( kc+j-1 ) )
               ap( kc+j-1 ) = conjg( ap( kx ) )
               ap( kx ) = temp
   40       CONTINUE
            ap( kc+kp-1 ) = conjg( ap( kc+kp-1 ) )
*           Exchange the two diagonal entries.
            temp = ap( kc+k-1 )
            ap( kc+k-1 ) = ap( kpc+kp-1 )
            ap( kpc+kp-1 ) = temp
            IF( kstep.EQ.2 ) THEN
*              For a 2-by-2 block also exchange rows K and KP of
*              column K+1, which starts at KC+K.
               temp = ap( kc+k+k-1 )
               ap( kc+k+k-1 ) = ap( kc+k+kp-1 )
               ap( kc+k+kp-1 ) = temp
            END IF
         END IF
*
         k = k + kstep
         kc = kcnext
         GO TO 30
   50    CONTINUE
*
      ELSE
*
*        Compute inv(A) from the factorization A = L*D*L**H.
*
*        K is the main loop index, decreasing from N to 1 in steps of
*        1 or 2, depending on the size of the diagonal blocks.
*
         npp = n*( n+1 ) / 2
         k = n
         kc = npp
   60    CONTINUE
*
*        If K < 1, exit from loop.
*
         IF( k.LT.1 )
     $      GO TO 80
*
*        Column K-1 holds N-K+2 packed elements, so its diagonal entry
*        sits that many positions before AP(KC), the diagonal entry
*        of column K.
*
         kcnext = kc - ( n-k+2 )
         IF( ipiv( k ).GT.0 ) THEN
*
*           1 x 1 diagonal block
*
*           Invert the diagonal block.
*
            ap( kc ) = one / real( ap( kc ) )
*
*           Compute column K of the inverse.
*
*           AP(KC+N-K+1) is the first element of column K+1, i.e. the
*           start of the already inverted trailing packed block.
*
            IF( k.LT.n ) THEN
               CALL ccopy( n-k, ap( kc+1 ), 1, work, 1 )
               CALL chpmv( uplo, n-k, -cone, ap( kc+n-k+1 ), work, 1,
     $                     zero, ap( kc+1 ), 1 )
               ap( kc ) = ap( kc ) - real( cdotc( n-k, work, 1,
     $                    ap( kc+1 ), 1 ) )
            END IF
            kstep = 1
         ELSE
*
*           2 x 2 diagonal block
*
*           Invert the diagonal block.
*
*           AP(KCNEXT) and AP(KC) are the two diagonal entries and
*           AP(KCNEXT+1) the off-diagonal entry of the block.  As in
*           the upper case, all three are divided by T before D is
*           formed.
*
            t = abs( ap( kcnext+1 ) )
            ak = real( ap( kcnext ) ) / t
            akp1 = real( ap( kc ) ) / t
            akkp1 = ap( kcnext+1 ) / t
            d = t*( ak*akp1-one )
            ap( kcnext ) = akp1 / d
            ap( kc ) = ak / d
            ap( kcnext+1 ) = -akkp1 / d
*
*           Compute columns K-1 and K of the inverse.
*
*           Column K is updated first.  The off-diagonal entry of the
*           block is corrected using the new column K and the still
*           unmodified column K-1, and only then is column K-1
*           overwritten.
*
            IF( k.LT.n ) THEN
               CALL ccopy( n-k, ap( kc+1 ), 1, work, 1 )
               CALL chpmv( uplo, n-k, -cone, ap( kc+( n-k+1 ) ), work,
     $                     1, zero, ap( kc+1 ), 1 )
               ap( kc ) = ap( kc ) - real( cdotc( n-k, work, 1,
     $                    ap( kc+1 ), 1 ) )
               ap( kcnext+1 ) = ap( kcnext+1 ) -
     $                          cdotc( n-k, ap( kc+1 ), 1,
     $                          ap( kcnext+2 ), 1 )
               CALL ccopy( n-k, ap( kcnext+2 ), 1, work, 1 )
               CALL chpmv( uplo, n-k, -cone, ap( kc+( n-k+1 ) ), work,
     $                     1, zero, ap( kcnext+2 ), 1 )
               ap( kcnext ) = ap( kcnext ) -
     $                        real( cdotc( n-k, work, 1, ap( kcnext+2 ),
     $                        1 ) )
            END IF
            kstep = 2
*           Step back over column K-2 as well (N-K+3 elements).
            kcnext = kcnext - ( n-k+3 )
         END IF
*
         kp = abs( ipiv( k ) )
         IF( kp.NE.k ) THEN
*
*           Interchange rows and columns K and KP in the trailing
*           submatrix A(k-1:n,k-1:n)
*
*           Loop 70 only runs when KP > K+1.  It exchanges the entries
*           of column K in rows K+1..KP-1 with the entries of row KP
*           in columns K+1..KP-1, conjugating both; KX steps along
*           row KP from one packed column to the next.
*
            kpc = npp - ( n-kp+1 )*( n-kp+2 ) / 2 + 1
            IF( kp.LT.n )
     $         CALL cswap( n-kp, ap( kc+kp-k+1 ), 1, ap( kpc+1 ), 1 )
            kx = kc + kp - k
            DO 70 j = k + 1, kp - 1
               kx = kx + n - j + 1
               temp = conjg( ap( kc+j-k ) )
               ap( kc+j-k ) = conjg( ap( kx ) )
               ap( kx ) = temp
   70       CONTINUE
            ap( kc+kp-k ) = conjg( ap( kc+kp-k ) )
*           Exchange the two diagonal entries.
            temp = ap( kc )
            ap( kc ) = ap( kpc )
            ap( kpc ) = temp
            IF( kstep.EQ.2 ) THEN
*              For a 2-by-2 block also exchange rows K and KP of
*              column K-1; AP(KC-N+K-1) is its entry in row K.
               temp = ap( kc-n+k-1 )
               ap( kc-n+k-1 ) = ap( kc-n+kp-1 )
               ap( kc-n+kp-1 ) = temp
            END IF
         END IF
*
         k = k - kstep
         kc = kcnext
         GO TO 60
   80    CONTINUE
      END IF
*
      RETURN
*
*     End of CHPTRI
*

◆ chptrs()

subroutine chptrs	(	character	uplo,
		integer	n,
		integer	nrhs,
		complex, dimension( * )	ap,
		integer, dimension( * )	ipiv,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		integer	info )

CHPTRS

Download CHPTRS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CHPTRS solves a system of linear equations A*X = B with a complex
!> Hermitian matrix A stored in packed format using the factorization
!> A = U*D*U**H or A = L*D*L**H computed by CHPTRF.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the details of the factorization are stored !> as an upper or lower triangular matrix. !> = 'U': Upper triangular, form is A = U*D*U**H; !> = 'L': Lower triangular, form is A = L*D*L**H. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrix B. NRHS >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The block diagonal matrix D and the multipliers used to !> obtain the factor U or L as computed by CHPTRF, stored as a !> packed triangular matrix. !>
[in]	IPIV	!> IPIV is INTEGER array, dimension (N) !> Details of the interchanges and the block structure of D !> as determined by CHPTRF. !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> On entry, the right hand side matrix B. !> On exit, the solution matrix X. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 114 of file chptrs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of CHPTRS: overwrites the NRHS columns of B with the solution
*  of A*X = B, reading the packed factor from AP and the interchanges
*  and block structure from IPIV.  AP is only read.  Each triangle is
*  handled by two sweeps over the diagonal blocks, one in each
*  direction.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDB, N, NRHS
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      COMPLEX            AP( * ), B( LDB, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE
      parameter( one = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
*     KC     packed index of the first stored element of column K
*     KP     row of B interchanged with the current pivot row
*     S      real reciprocal of a 1-by-1 pivot
*     AKM1K  off-diagonal entry of a 2-by-2 pivot block
      LOGICAL            UPPER
      INTEGER            J, K, KC, KP
      REAL               S
      COMPLEX            AK, AKM1, AKM1K, BK, BKM1, DENOM
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgemv, cgeru, clacgv, csscal, cswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max, real
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.  INFO = -i flags the i-th argument
*     (LDB is the 7th); the error is reported through XERBLA.
*
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( nrhs.LT.0 ) THEN
         info = -3
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -7
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CHPTRS', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 .OR. nrhs.EQ.0 )
     $   RETURN
*
      IF( upper ) THEN
*
*        Solve A*X = B, where A = U*D*U**H.
*
*        First solve U*D*X = B, overwriting B with X.
*
*        K is the main loop index, decreasing from N to 1 in steps of
*        1 or 2, depending on the size of the diagonal blocks.
*
*        KC starts one past the end of AP and is moved back by K at
*        the top of each pass, so that it addresses the first element
*        of packed column K.
*
         k = n
         kc = n*( n+1 ) / 2 + 1
   10    CONTINUE
*
*        If K < 1, exit from loop.
*
         IF( k.LT.1 )
     $      GO TO 30
*
         kc = kc - k
         IF( ipiv( k ).GT.0 ) THEN
*
*           1 x 1 diagonal block
*
*           Interchange rows K and IPIV(K).
*
            kp = ipiv( k )
            IF( kp.NE.k )
     $         CALL cswap( nrhs, b( k, 1 ), ldb, b( kp, 1 ), ldb )
*
*           Multiply by inv(U(K)), where U(K) is the transformation
*           stored in column K of A.
*
            CALL cgeru( k-1, nrhs, -one, ap( kc ), 1, b( k, 1 ), ldb,
     $                  b( 1, 1 ), ldb )
*
*           Multiply by the inverse of the diagonal block.
*
*           AP(KC+K-1) is the diagonal entry of column K; only its
*           real part is used.
*
            s = real( one ) / real( ap( kc+k-1 ) )
            CALL csscal( nrhs, s, b( k, 1 ), ldb )
            k = k - 1
         ELSE
*
*           2 x 2 diagonal block
*
*           Interchange rows K-1 and -IPIV(K).
*
            kp = -ipiv( k )
            IF( kp.NE.k-1 )
     $         CALL cswap( nrhs, b( k-1, 1 ), ldb, b( kp, 1 ), ldb )
*
*           Multiply by inv(U(K)), where U(K) is the transformation
*           stored in columns K-1 and K of A.
*
*           AP(KC-(K-1)) is the first element of column K-1.
*
            CALL cgeru( k-2, nrhs, -one, ap( kc ), 1, b( k, 1 ), ldb,
     $                  b( 1, 1 ), ldb )
            CALL cgeru( k-2, nrhs, -one, ap( kc-( k-1 ) ), 1,
     $                  b( k-1, 1 ), ldb, b( 1, 1 ), ldb )
*
*           Multiply by the inverse of the diagonal block.
*
*           AKM1K = AP(KC+K-2) is the off-diagonal entry (row K-1 of
*           column K); AP(KC-1) and AP(KC+K-1) are the diagonal
*           entries of columns K-1 and K.  The diagonal entries and
*           both right-hand-side rows are divided by AKM1K or its
*           conjugate, and the resulting 2-by-2 system is solved
*           explicitly using DENOM.
*
            akm1k = ap( kc+k-2 )
            akm1 = ap( kc-1 ) / akm1k
            ak = ap( kc+k-1 ) / conjg( akm1k )
            denom = akm1*ak - one
            DO 20 j = 1, nrhs
               bkm1 = b( k-1, j ) / akm1k
               bk = b( k, j ) / conjg( akm1k )
               b( k-1, j ) = ( ak*bkm1-bk ) / denom
               b( k, j ) = ( akm1*bk-bkm1 ) / denom
   20       CONTINUE
*           Move KC to the start of column K-1; the update at the top
*           of the loop then steps over the next column.
            kc = kc - k + 1
            k = k - 2
         END IF
*
         GO TO 10
   30    CONTINUE
*
*        Next solve U**H *X = B, overwriting B with X.
*
*        K is the main loop index, increasing from 1 to N in steps of
*        1 or 2, depending on the size of the diagonal blocks.
*
         k = 1
         kc = 1
   40    CONTINUE
*
*        If K > N, exit from loop.
*
         IF( k.GT.n )
     $      GO TO 50
*
         IF( ipiv( k ).GT.0 ) THEN
*
*           1 x 1 diagonal block
*
*           Multiply by inv(U**H(K)), where U(K) is the transformation
*           stored in column K of A.
*
*           Row K of B is conjugated before and after the CGEMV call.
*
            IF( k.GT.1 ) THEN
               CALL clacgv( nrhs, b( k, 1 ), ldb )
               CALL cgemv( 'Conjugate transpose', k-1, nrhs, -one, b,
     $                     ldb, ap( kc ), 1, one, b( k, 1 ), ldb )
               CALL clacgv( nrhs, b( k, 1 ), ldb )
            END IF
*
*           Interchange rows K and IPIV(K).
*
            kp = ipiv( k )
            IF( kp.NE.k )
     $         CALL cswap( nrhs, b( k, 1 ), ldb, b( kp, 1 ), ldb )
            kc = kc + k
            k = k + 1
         ELSE
*
*           2 x 2 diagonal block
*
*           Multiply by inv(U**H(K+1)), where U(K+1) is the transformation
*           stored in columns K and K+1 of A.
*
*           AP(KC+K) is the first element of column K+1.
*
            IF( k.GT.1 ) THEN
               CALL clacgv( nrhs, b( k, 1 ), ldb )
               CALL cgemv( 'Conjugate transpose', k-1, nrhs, -one, b,
     $                     ldb, ap( kc ), 1, one, b( k, 1 ), ldb )
               CALL clacgv( nrhs, b( k, 1 ), ldb )
*
               CALL clacgv( nrhs, b( k+1, 1 ), ldb )
               CALL cgemv( 'Conjugate transpose', k-1, nrhs, -one, b,
     $                     ldb, ap( kc+k ), 1, one, b( k+1, 1 ), ldb )
               CALL clacgv( nrhs, b( k+1, 1 ), ldb )
            END IF
*
*           Interchange rows K and -IPIV(K).
*
            kp = -ipiv( k )
            IF( kp.NE.k )
     $         CALL cswap( nrhs, b( k, 1 ), ldb, b( kp, 1 ), ldb )
*           Columns K and K+1 together hold 2*K+1 packed elements.
            kc = kc + 2*k + 1
            k = k + 2
         END IF
*
         GO TO 40
   50    CONTINUE
*
      ELSE
*
*        Solve A*X = B, where A = L*D*L**H.
*
*        First solve L*D*X = B, overwriting B with X.
*
*        K is the main loop index, increasing from 1 to N in steps of
*        1 or 2, depending on the size of the diagonal blocks.
*
*        In lower storage AP(KC) is the diagonal entry of column K.
*
         k = 1
         kc = 1
   60    CONTINUE
*
*        If K > N, exit from loop.
*
         IF( k.GT.n )
     $      GO TO 80
*
         IF( ipiv( k ).GT.0 ) THEN
*
*           1 x 1 diagonal block
*
*           Interchange rows K and IPIV(K).
*
            kp = ipiv( k )
            IF( kp.NE.k )
     $         CALL cswap( nrhs, b( k, 1 ), ldb, b( kp, 1 ), ldb )
*
*           Multiply by inv(L(K)), where L(K) is the transformation
*           stored in column K of A.
*
            IF( k.LT.n )
     $         CALL cgeru( n-k, nrhs, -one, ap( kc+1 ), 1, b( k, 1 ),
     $                     ldb, b( k+1, 1 ), ldb )
*
*           Multiply by the inverse of the diagonal block.
*
            s = real( one ) / real( ap( kc ) )
            CALL csscal( nrhs, s, b( k, 1 ), ldb )
            kc = kc + n - k + 1
            k = k + 1
         ELSE
*
*           2 x 2 diagonal block
*
*           Interchange rows K+1 and -IPIV(K).
*
            kp = -ipiv( k )
            IF( kp.NE.k+1 )
     $         CALL cswap( nrhs, b( k+1, 1 ), ldb, b( kp, 1 ), ldb )
*
*           Multiply by inv(L(K)), where L(K) is the transformation
*           stored in columns K and K+1 of A.
*
*           AP(KC+2) and AP(KC+N-K+2) are the entries in row K+2 of
*           columns K and K+1.
*
            IF( k.LT.n-1 ) THEN
               CALL cgeru( n-k-1, nrhs, -one, ap( kc+2 ), 1, b( k, 1 ),
     $                     ldb, b( k+2, 1 ), ldb )
               CALL cgeru( n-k-1, nrhs, -one, ap( kc+n-k+2 ), 1,
     $                     b( k+1, 1 ), ldb, b( k+2, 1 ), ldb )
            END IF
*
*           Multiply by the inverse of the diagonal block.
*
*           AKM1K = AP(KC+1) is the off-diagonal entry (row K+1 of
*           column K); AP(KC) and AP(KC+N-K+1) are the diagonal
*           entries of columns K and K+1.  The scaling and explicit
*           2-by-2 solve mirror the upper case with the roles of
*           AKM1K and its conjugate exchanged.
*
            akm1k = ap( kc+1 )
            akm1 = ap( kc ) / conjg( akm1k )
            ak = ap( kc+n-k+1 ) / akm1k
            denom = akm1*ak - one
            DO 70 j = 1, nrhs
               bkm1 = b( k, j ) / conjg( akm1k )
               bk = b( k+1, j ) / akm1k
               b( k, j ) = ( ak*bkm1-bk ) / denom
               b( k+1, j ) = ( akm1*bk-bkm1 ) / denom
   70       CONTINUE
*           Columns K and K+1 together hold 2*(N-K)+1 packed elements.
            kc = kc + 2*( n-k ) + 1
            k = k + 2
         END IF
*
         GO TO 60
   80    CONTINUE
*
*        Next solve L**H *X = B, overwriting B with X.
*
*        K is the main loop index, decreasing from N to 1 in steps of
*        1 or 2, depending on the size of the diagonal blocks.
*
*        KC starts one past the end of AP and is moved back by the
*        length of column K (N-K+1) at the top of each pass.
*
         k = n
         kc = n*( n+1 ) / 2 + 1
   90    CONTINUE
*
*        If K < 1, exit from loop.
*
         IF( k.LT.1 )
     $      GO TO 100
*
         kc = kc - ( n-k+1 )
         IF( ipiv( k ).GT.0 ) THEN
*
*           1 x 1 diagonal block
*
*           Multiply by inv(L**H(K)), where L(K) is the transformation
*           stored in column K of A.
*
            IF( k.LT.n ) THEN
               CALL clacgv( nrhs, b( k, 1 ), ldb )
               CALL cgemv( 'Conjugate transpose', n-k, nrhs, -one,
     $                     b( k+1, 1 ), ldb, ap( kc+1 ), 1, one,
     $                     b( k, 1 ), ldb )
               CALL clacgv( nrhs, b( k, 1 ), ldb )
            END IF
*
*           Interchange rows K and IPIV(K).
*
            kp = ipiv( k )
            IF( kp.NE.k )
     $         CALL cswap( nrhs, b( k, 1 ), ldb, b( kp, 1 ), ldb )
            k = k - 1
         ELSE
*
*           2 x 2 diagonal block
*
*           Multiply by inv(L**H(K-1)), where L(K-1) is the transformation
*           stored in columns K-1 and K of A.
*
*           AP(KC-(N-K)) is the entry of column K-1 in row K+1.
*
            IF( k.LT.n ) THEN
               CALL clacgv( nrhs, b( k, 1 ), ldb )
               CALL cgemv( 'Conjugate transpose', n-k, nrhs, -one,
     $                     b( k+1, 1 ), ldb, ap( kc+1 ), 1, one,
     $                     b( k, 1 ), ldb )
               CALL clacgv( nrhs, b( k, 1 ), ldb )
*
               CALL clacgv( nrhs, b( k-1, 1 ), ldb )
               CALL cgemv( 'Conjugate transpose', n-k, nrhs, -one,
     $                     b( k+1, 1 ), ldb, ap( kc-( n-k ) ), 1, one,
     $                     b( k-1, 1 ), ldb )
               CALL clacgv( nrhs, b( k-1, 1 ), ldb )
            END IF
*
*           Interchange rows K and -IPIV(K).
*
            kp = -ipiv( k )
            IF( kp.NE.k )
     $         CALL cswap( nrhs, b( k, 1 ), ldb, b( kp, 1 ), ldb )
*           Move KC to the start of column K-1 (N-K+2 elements).
            kc = kc - ( n-k+2 )
            k = k - 2
         END IF
*
         GO TO 90
  100    CONTINUE
      END IF
*
      RETURN
*
*     End of CHPTRS
*

◆ chsein()

subroutine chsein	(	character	side,
		character	eigsrc,
		character	initv,
		logical, dimension( * )	select,
		integer	n,
		complex, dimension( ldh, * )	h,
		integer	ldh,
		complex, dimension( * )	w,
		complex, dimension( ldvl, * )	vl,
		integer	ldvl,
		complex, dimension( ldvr, * )	vr,
		integer	ldvr,
		integer	mm,
		integer	m,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer, dimension( * )	ifaill,
		integer, dimension( * )	ifailr,
		integer	info )

CHSEIN

Download CHSEIN + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CHSEIN uses inverse iteration to find specified right and/or left
!> eigenvectors of a complex upper Hessenberg matrix H.
!>
!> The right eigenvector x and the left eigenvector y of the matrix H
!> corresponding to an eigenvalue w are defined by:
!>
!>              H * x = w * x,     y**h * H = w * y**h
!>
!> where y**h denotes the conjugate transpose of the vector y.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'R': compute right eigenvectors only; !> = 'L': compute left eigenvectors only; !> = 'B': compute both right and left eigenvectors. !>
[in]	EIGSRC	!> EIGSRC is CHARACTER*1 !> Specifies the source of eigenvalues supplied in W: !> = 'Q': the eigenvalues were found using CHSEQR; thus, if !> H has zero subdiagonal elements, and so is !> block-triangular, then the j-th eigenvalue can be !> assumed to be an eigenvalue of the block containing !> the j-th row/column. This property allows CHSEIN to !> perform inverse iteration on just one diagonal block. !> = 'N': no assumptions are made on the correspondence !> between eigenvalues and diagonal blocks. In this !> case, CHSEIN must always perform inverse iteration !> using the whole matrix H. !>
[in]	INITV	!> INITV is CHARACTER*1 !> = 'N': no initial vectors are supplied; !> = 'U': user-supplied initial vectors are stored in the arrays !> VL and/or VR. !>
[in]	SELECT	!> SELECT is LOGICAL array, dimension (N) !> Specifies the eigenvectors to be computed. To select the !> eigenvector corresponding to the eigenvalue W(j), !> SELECT(j) must be set to .TRUE.. !>
[in]	N	!> N is INTEGER !> The order of the matrix H. N >= 0. !>
[in]	H	!> H is COMPLEX array, dimension (LDH,N) !> The upper Hessenberg matrix H. !> If a NaN is detected in H, the routine will return with INFO=-6. !>
[in]	LDH	!> LDH is INTEGER !> The leading dimension of the array H. LDH >= max(1,N). !>
[in,out]	W	!> W is COMPLEX array, dimension (N) !> On entry, the eigenvalues of H. !> On exit, the real parts of W may have been altered since !> close eigenvalues are perturbed slightly in searching for !> independent eigenvectors. !>
[in,out]	VL	!> VL is COMPLEX array, dimension (LDVL,MM) !> On entry, if INITV = 'U' and SIDE = 'L' or 'B', VL must !> contain starting vectors for the inverse iteration for the !> left eigenvectors; the starting vector for each eigenvector !> must be in the same column in which the eigenvector will be !> stored. !> On exit, if SIDE = 'L' or 'B', the left eigenvectors !> specified by SELECT will be stored consecutively in the !> columns of VL, in the same order as their eigenvalues. !> If SIDE = 'R', VL is not referenced. !>
[in]	LDVL	!> LDVL is INTEGER !> The leading dimension of the array VL. !> LDVL >= max(1,N) if SIDE = 'L' or 'B'; LDVL >= 1 otherwise. !>
[in,out]	VR	!> VR is COMPLEX array, dimension (LDVR,MM) !> On entry, if INITV = 'U' and SIDE = 'R' or 'B', VR must !> contain starting vectors for the inverse iteration for the !> right eigenvectors; the starting vector for each eigenvector !> must be in the same column in which the eigenvector will be !> stored. !> On exit, if SIDE = 'R' or 'B', the right eigenvectors !> specified by SELECT will be stored consecutively in the !> columns of VR, in the same order as their eigenvalues. !> If SIDE = 'L', VR is not referenced. !>
[in]	LDVR	!> LDVR is INTEGER !> The leading dimension of the array VR. !> LDVR >= max(1,N) if SIDE = 'R' or 'B'; LDVR >= 1 otherwise. !>
[in]	MM	!> MM is INTEGER !> The number of columns in the arrays VL and/or VR. MM >= M. !>
[out]	M	!> M is INTEGER !> The number of columns in the arrays VL and/or VR required to !> store the eigenvectors (= the number of .TRUE. elements in !> SELECT). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (N*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	IFAILL	!> IFAILL is INTEGER array, dimension (MM) !> If SIDE = 'L' or 'B', IFAILL(i) = j > 0 if the left !> eigenvector in the i-th column of VL (corresponding to the !> eigenvalue w(j)) failed to converge; IFAILL(i) = 0 if the !> eigenvector converged satisfactorily. !> If SIDE = 'R', IFAILL is not referenced. !>
[out]	IFAILR	!> IFAILR is INTEGER array, dimension (MM) !> If SIDE = 'R' or 'B', IFAILR(i) = j > 0 if the right !> eigenvector in the i-th column of VR (corresponding to the !> eigenvalue w(j)) failed to converge; IFAILR(i) = 0 if the !> eigenvector converged satisfactorily. !> If SIDE = 'L', IFAILR is not referenced. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, i is the number of eigenvectors which !> failed to converge; see IFAILL and IFAILR for further !> details. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  Each eigenvector is normalized so that the element of largest
!>  magnitude has magnitude 1; here the magnitude of a complex number
!>  (x,y) is taken to be |x|+|y|.
!>

Definition at line 242 of file chsein.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of CHSEIN.  For every index K with SELECT(K) true, CLAEIN is
*  called to compute the left and/or right eigenvector of the upper
*  Hessenberg matrix H belonging to the eigenvalue W(K).  Results are
*  stored in consecutive columns KS = 1, 2, ... of VL and/or VR, and
*  IFAILL/IFAILR record which columns failed to converge.
*
*     .. Scalar Arguments ..
      CHARACTER          EIGSRC, INITV, SIDE
      INTEGER            INFO, LDH, LDVL, LDVR, M, MM, N
*     ..
*     .. Array Arguments ..
      LOGICAL            SELECT( * )
      INTEGER            IFAILL( * ), IFAILR( * )
      REAL               RWORK( * )
      COMPLEX            H( LDH, * ), VL( LDVL, * ), VR( LDVR, * ),
     $                   W( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ZERO
      parameter( zero = ( 0.0e+0, 0.0e+0 ) )
      REAL               RZERO
      parameter( rzero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            BOTHV, FROMQR, LEFTV, NOINIT, RIGHTV
      INTEGER            I, IINFO, K, KL, KLN, KR, KS, LDWORK
      REAL               EPS3, HNORM, SMLNUM, ULP, UNFL
      COMPLEX            CDUM, WK
*     ..
*     .. External Functions ..
      LOGICAL            LSAME, SISNAN
      REAL               CLANHS, SLAMCH
      EXTERNAL           lsame, clanhs, slamch, sisnan
*     ..
*     .. External Subroutines ..
      EXTERNAL           claein, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, real
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
*     CABS1 is the 1-norm style magnitude |Re(z)| + |Im(z)|.
      cabs1( cdum ) = abs( real( cdum ) ) + abs( aimag( cdum ) )
*     ..
*     .. Executable Statements ..
*
*     Decode and test the input parameters.
*
      bothv = lsame( side, 'B' )
      rightv = lsame( side, 'R' ) .OR. bothv
      leftv = lsame( side, 'L' ) .OR. bothv
*
      fromqr = lsame( eigsrc, 'Q' )
*
      noinit = lsame( initv, 'N' )
*
*     Set M to the number of columns required to store the selected
*     eigenvectors.  This is done before the argument checks because
*     the test on MM below needs M.  The loop is skipped when N < 1.
*
      m = 0
      DO 10 k = 1, n
         IF( SELECT( k ) )
     $      m = m + 1
   10 CONTINUE
*
*     The INFO values are the (negated) positions of the offending
*     arguments in the CHSEIN argument list.
*
      info = 0
      IF( .NOT.rightv .AND. .NOT.leftv ) THEN
         info = -1
      ELSE IF( .NOT.fromqr .AND. .NOT.lsame( eigsrc, 'N' ) ) THEN
         info = -2
      ELSE IF( .NOT.noinit .AND. .NOT.lsame( initv, 'U' ) ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -5
      ELSE IF( ldh.LT.max( 1, n ) ) THEN
         info = -7
      ELSE IF( ldvl.LT.1 .OR. ( leftv .AND. ldvl.LT.n ) ) THEN
         info = -10
      ELSE IF( ldvr.LT.1 .OR. ( rightv .AND. ldvr.LT.n ) ) THEN
         info = -12
      ELSE IF( mm.LT.m ) THEN
         info = -13
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CHSEIN', -info )
         RETURN
      END IF
*
*     Quick return if possible.
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Set machine-dependent constants.
*
      unfl = slamch( 'Safe minimum' )
      ulp = slamch( 'Precision' )
      smlnum = unfl*( n / ulp )
*
*     WORK is passed to CLAEIN as an array with leading dimension N.
*
      ldwork = n
*
*     KL and KR delimit the current diagonal block; KLN remembers the
*     KL for which HNORM/EPS3 were last computed (0 = not yet).  When
*     EIGSRC is not 'Q' the block is never narrowed on the right, so
*     KR stays N.  KS is the next output column in VL/VR.
*
      kl = 1
      kln = 0
      IF( fromqr ) THEN
         kr = 0
      ELSE
         kr = n
      END IF
      ks = 1
*
      DO 100 k = 1, n
         IF( SELECT( k ) ) THEN
*
*           Compute eigenvector(s) corresponding to W(K).
*
            IF( fromqr ) THEN
*
*              If affiliation of eigenvalues is known, check whether
*              the matrix splits.
*
*              Determine KL and KR such that 1 <= KL <= K <= KR <= N
*              and H(KL,KL-1) and H(KR+1,KR) are zero (or KL = 1 or
*              KR = N).
*
*              Then inverse iteration can be performed with the
*              submatrix H(KL:N,KL:N) for a left eigenvector, and with
*              the submatrix H(1:KR,1:KR) for a right eigenvector.
*
*              Search upwards from row K for a zero subdiagonal entry.
*              If none is found the DO loop ends with I = KL, so the
*              assignment after label 30 leaves KL unchanged.
*
               DO 20 i = k, kl + 1, -1
                  IF( h( i, i-1 ).EQ.zero )
     $               GO TO 30
   20          CONTINUE
   30          CONTINUE
               kl = i
*
*              KR only needs to be recomputed once K has moved past
*              the previous block.  If no zero subdiagonal entry is
*              found the DO loop ends with I = N, giving KR = N.
*
               IF( k.GT.kr ) THEN
                  DO 40 i = k, n - 1
                     IF( h( i+1, i ).EQ.zero )
     $                  GO TO 50
   40             CONTINUE
   50             CONTINUE
                  kr = i
               END IF
            END IF
*
            IF( kl.NE.kln ) THEN
               kln = kl
*
*              Compute infinity-norm of submatrix H(KL:KR,KL:KR) if it
*              has not been computed before.
*
*              A NaN norm makes the routine return with INFO = -6;
*              XERBLA is not called on this path.  EPS3 falls back to
*              SMLNUM when the norm is not positive.
*
               hnorm = clanhs( 'I', kr-kl+1, h( kl, kl ), ldh, rwork )
               IF( sisnan( hnorm ) ) THEN
                  info = -6
                  RETURN
               ELSE IF( (hnorm.GT.rzero) ) THEN
                  eps3 = hnorm*ulp
               ELSE
                  eps3 = smlnum
               END IF
            END IF
*
*           Perturb eigenvalue if it is close to any previous
*           selected eigenvalues affiliated to the submatrix
*           H(KL:KR,KL:KR). Close roots are modified by EPS3.
*
*           After each perturbation the scan restarts at label 60 so
*           the shifted WK is compared against every earlier selected
*           eigenvalue again.  The final WK is written back to W(K).
*
            wk = w( k )
   60       CONTINUE
            DO 70 i = k - 1, kl, -1
               IF( SELECT( i ) .AND. cabs1( w( i )-wk ).LT.eps3 ) THEN
                  wk = wk + eps3
                  GO TO 60
               END IF
   70       CONTINUE
            w( k ) = wk
*
            IF( leftv ) THEN
*
*              Compute left eigenvector.
*
*              CLAEIN works on the trailing block H(KL:N,KL:N) and
*              writes into rows KL:N of column KS; rows 1:KL-1 are
*              zeroed afterwards.  A positive IINFO is counted in INFO
*              and recorded as IFAILL(KS) = K.
*
               CALL claein( .false., noinit, n-kl+1, h( kl, kl ), ldh,
     $                      wk, vl( kl, ks ), work, ldwork, rwork, eps3,
     $                      smlnum, iinfo )
               IF( iinfo.GT.0 ) THEN
                  info = info + 1
                  ifaill( ks ) = k
               ELSE
                  ifaill( ks ) = 0
               END IF
               DO 80 i = 1, kl - 1
                  vl( i, ks ) = zero
   80          CONTINUE
            END IF
            IF( rightv ) THEN
*
*              Compute right eigenvector.
*
*              CLAEIN works on the leading block H(1:KR,1:KR) and
*              writes into rows 1:KR of column KS; rows KR+1:N are
*              zeroed afterwards.  A positive IINFO is counted in INFO
*              (in addition to any left-vector failure for the same K)
*              and recorded as IFAILR(KS) = K.
*
               CALL claein( .true., noinit, kr, h, ldh, wk, vr( 1, ks ),
     $                      work, ldwork, rwork, eps3, smlnum, iinfo )
               IF( iinfo.GT.0 ) THEN
                  info = info + 1
                  ifailr( ks ) = k
               ELSE
                  ifailr( ks ) = 0
               END IF
               DO 90 i = kr + 1, n
                  vr( i, ks ) = zero
   90          CONTINUE
            END IF
*
*           Advance to the next output column.
*
            ks = ks + 1
         END IF
  100 CONTINUE
*
      RETURN
*
*     End of CHSEIN
*

◆ chseqr()

subroutine chseqr	(	character	job,
		character	compz,
		integer	n,
		integer	ilo,
		integer	ihi,
		complex, dimension( ldh, * )	h,
		integer	ldh,
		complex, dimension( * )	w,
		complex, dimension( ldz, * )	z,
		integer	ldz,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CHSEQR

Download CHSEQR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!>    CHSEQR computes the eigenvalues of a Hessenberg matrix H
!>    and, optionally, the matrices T and Z from the Schur decomposition
!>    H = Z T Z**H, where T is an upper triangular matrix (the
!>    Schur form), and Z is the unitary matrix of Schur vectors.
!>
!>    Optionally Z may be postmultiplied into an input unitary
!>    matrix Q so that this routine can give the Schur factorization
!>    of a matrix A which has been reduced to the Hessenberg form H
!>    by the unitary matrix Q:  A = Q*H*Q**H = (QZ)*T*(QZ)**H.
!>

Parameters

[in]	JOB	!> JOB is CHARACTER*1 !> = 'E': compute eigenvalues only; !> = 'S': compute eigenvalues and the Schur form T. !>
[in]	COMPZ	!> COMPZ is CHARACTER*1 !> = 'N': no Schur vectors are computed; !> = 'I': Z is initialized to the unit matrix and the matrix Z !> of Schur vectors of H is returned; !> = 'V': Z must contain a unitary matrix Q on entry, and !> the product QZ is returned. !>
[in]	N	!> N is INTEGER !> The order of the matrix H. N >= 0. !>
[in]	ILO	!> ILO is INTEGER !>
[in]	IHI	!> IHI is INTEGER !> !> It is assumed that H is already upper triangular in rows !> and columns 1:ILO-1 and IHI+1:N. ILO and IHI are normally !> set by a previous call to CGEBAL, and then passed to CGEHRD !> when the matrix output by CGEBAL is reduced to Hessenberg !> form. Otherwise ILO and IHI should be set to 1 and N !> respectively. If N > 0, then 1 <= ILO <= IHI <= N. !> If N = 0, then ILO = 1 and IHI = 0. !>
[in,out]	H	!> H is COMPLEX array, dimension (LDH,N) !> On entry, the upper Hessenberg matrix H. !> On exit, if INFO = 0 and JOB = 'S', H contains the upper !> triangular matrix T from the Schur decomposition (the !> Schur form). If INFO = 0 and JOB = 'E', the contents of !> H are unspecified on exit. (The output value of H when !> INFO > 0 is given under the description of INFO below.) !> !> Unlike earlier versions of CHSEQR, this subroutine may !> explicitly set H(i,j) = 0 for i > j and j = 1, 2, ... ILO-1 !> or j = IHI+1, IHI+2, ... N. !>
[in]	LDH	!> LDH is INTEGER !> The leading dimension of the array H. LDH >= max(1,N). !>
[out]	W	!> W is COMPLEX array, dimension (N) !> The computed eigenvalues. If JOB = 'S', the eigenvalues are !> stored in the same order as on the diagonal of the Schur !> form returned in H, with W(i) = H(i,i). !>
[in,out]	Z	!> Z is COMPLEX array, dimension (LDZ,N) !> If COMPZ = 'N', Z is not referenced. !> If COMPZ = 'I', on entry Z need not be set and on exit, !> if INFO = 0, Z contains the unitary matrix Z of the Schur !> vectors of H. If COMPZ = 'V', on entry Z must contain an !> N-by-N matrix Q, which is assumed to be equal to the unit !> matrix except for the submatrix Z(ILO:IHI,ILO:IHI). On exit, !> if INFO = 0, Z contains Q*Z. !> Normally Q is the unitary matrix generated by CUNGHR !> after the call to CGEHRD which formed the Hessenberg matrix !> H. (The output value of Z when INFO > 0 is given under !> the description of INFO below.) !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. if COMPZ = 'I' or !> COMPZ = 'V', then LDZ >= MAX(1,N). Otherwise, LDZ >= 1. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (LWORK) !> On exit, if INFO = 0, WORK(1) returns an estimate of !> the optimal value for LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,N) !> is sufficient and delivers very good and sometimes !> optimal performance. However, LWORK as large as 11*N !> may be required for optimal performance. A workspace !> query is recommended to determine the optimal workspace !> size. !> !> If LWORK = -1, then CHSEQR does a workspace query. !> In this case, CHSEQR checks the input parameters and !> estimates the optimal workspace size for the given !> values of N, ILO and IHI. The estimate is returned !> in WORK(1). No error message related to LWORK is !> issued by XERBLA. Neither H nor Z are accessed. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal !> value !> > 0: if INFO = i, CHSEQR failed to compute all of !> the eigenvalues. Elements 1:ilo-1 and i+1:n of W !> contain those eigenvalues which have been !> successfully computed. (Failures are rare.) !> !> If INFO > 0 and JOB = 'E', then on exit, the !> remaining unconverged eigenvalues are the eigen- !> values of the upper Hessenberg matrix rows and !> columns ILO through INFO of the final, output !> value of H. !> !> If INFO > 0 and JOB = 'S', then on exit !> !> (*) (initial value of H)U = U(final value of H) !> !> where U is a unitary matrix. The final !> value of H is upper Hessenberg and triangular in !> rows and columns INFO+1 through IHI. !> !> If INFO > 0 and COMPZ = 'V', then on exit !> !> (final value of Z) = (initial value of Z)U !> !> where U is the unitary matrix in (*) (regard- !> less of the value of JOB.) !> !> If INFO > 0 and COMPZ = 'I', then on exit !> (final value of Z) = U !> where U is the unitary matrix in (*) (regard- !> less of the value of JOB.) !> !> If INFO > 0 and COMPZ = 'N', then Z is not !> accessed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Karen Braman and Ralph Byers, Department of Mathematics, University of Kansas, USA

Further Details:

!>
!>             Default values supplied by
!>             ILAENV(ISPEC,'CHSEQR',JOB(:1)//COMPZ(:1),N,ILO,IHI,LWORK).
!>             It is suggested that these defaults be adjusted in order
!>             to attain best performance in each particular
!>             computational environment.
!>
!>            ISPEC=12: The CLAHQR vs CLAQR0 crossover point.
!>                      Default: 75. (Must be at least 11.)
!>
!>            ISPEC=13: Recommended deflation window size.
!>                      This depends on ILO, IHI and NS.  NS is the
!>                      number of simultaneous shifts returned
!>                      by ILAENV(ISPEC=15).  (See ISPEC=15 below.)
!>                      The default for (IHI-ILO+1) <= 500 is NS.
!>                      The default for (IHI-ILO+1) >  500 is 3*NS/2.
!>
!>            ISPEC=14: Nibble crossover point. (See IPARMQ for
!>                      details.)  Default: 14% of deflation window
!>                      size.
!>
!>            ISPEC=15: Number of simultaneous shifts in a multishift
!>                      QR iteration.
!>
!>                      If IHI-ILO+1 is ...
!>
!>                      greater than      ...but less    ... the
!>                      or equal to ...      than        default is
!>
!>                           1               30          NS =   2(+)
!>                          30               60          NS =   4(+)
!>                          60              150          NS =  10(+)
!>                         150              590          NS =  **
!>                         590             3000          NS =  64
!>                        3000             6000          NS = 128
!>                        6000             infinity      NS = 256
!>
!>                  (+)  By default some or all matrices of this order
!>                       are passed to the implicit double shift routine
!>                       CLAHQR and this parameter is ignored.  See
!>                       ISPEC=12 above and comments in IPARMQ for
!>                       details.
!>
!>                 (**)  The asterisks (**) indicate an ad-hoc
!>                       function of N increasing from 10 to 64.
!>
!>            ISPEC=16: Select structured matrix multiply.
!>                      If the number of simultaneous shifts (specified
!>                      by ISPEC=15) is less than 14, then the default
!>                      for ISPEC=16 is 0.  Otherwise the default for
!>                      ISPEC=16 is 2.
!>

References:

 K. Braman, R. Byers and R. Mathias, The Multi-Shift QR
 Algorithm Part I: Maintaining Well Focused Shifts, and Level 3
 Performance, SIAM Journal of Matrix Analysis, volume 23, pages
 929--947, 2002.

K. Braman, R. Byers and R. Mathias, The Multi-Shift QR Algorithm Part II: Aggressive Early Deflation, SIAM Journal of Matrix Analysis, volume 23, pages 948–973, 2002.

Definition at line 297 of file chseqr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of CHSEQR.  After validating its arguments the routine copies
*  the diagonal entries outside ILO:IHI into W, optionally sets Z to
*  the identity, and then dispatches to CLAQR0 (N > NMIN) or CLAHQR
*  (otherwise).  If CLAHQR reports a failure, CLAQR0 is tried on the
*  remaining active block.
*
*     .. Scalar Arguments ..
      INTEGER            IHI, ILO, INFO, LDH, LDZ, LWORK, N
      CHARACTER          COMPZ, JOB
*     ..
*     .. Array Arguments ..
      COMPLEX            H( LDH, * ), W( * ), WORK( * ), Z( LDZ, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*
*     ==== Matrices of order NTINY or smaller must be processed by
*     .    CLAHQR because of insufficient subdiagonal scratch space.
*     .    (This is a hard limit.) ====
      INTEGER            NTINY
      parameter( ntiny = 15 )
*
*     ==== NL allocates some local workspace to help small matrices
*     .    through a rare CLAHQR failure.  NL > NTINY = 15 is
*     .    required and NL <= NMIN = ILAENV(ISPEC=12,...) is recom-
*     .    mended.  (The default value of NMIN is 75.)  Using NL = 49
*     .    allows up to six simultaneous shifts and a 16-by-16
*     .    deflation window.  ====
      INTEGER            NL
      parameter( nl = 49 )
      COMPLEX            ZERO, ONE
      parameter( zero = ( 0.0e0, 0.0e0 ),
     $                   one = ( 1.0e0, 0.0e0 ) )
      REAL               RZERO
      parameter( rzero = 0.0e0 )
*     ..
*     .. Local Arrays ..
*     ==== HL is the NL-by-NL scratch copy of H used for the CLAQR0
*     .    retry on small matrices; WORKL is its workspace. ====
      COMPLEX            HL( NL, NL ), WORKL( NL )
*     ..
*     .. Local Scalars ..
      INTEGER            KBOT, NMIN
      LOGICAL            INITZ, LQUERY, WANTT, WANTZ
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      LOGICAL            LSAME
      EXTERNAL           ilaenv, lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           ccopy, clacpy, clahqr, claqr0, claset, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          cmplx, max, min, real
*     ..
*     .. Executable Statements ..
*
*     ==== Decode and check the input parameters. ====
*
*     ==== WORK(1) is preset to max(1,N) before any check, so it is
*     .    defined on every return path.  LWORK = -1 requests a
*     .    workspace query. ====
*
      wantt = lsame( job, 'S' )
      initz = lsame( compz, 'I' )
      wantz = initz .OR. lsame( compz, 'V' )
      work( 1 ) = cmplx( real( max( 1, n ) ), rzero )
      lquery = lwork.EQ.-1
*
*     ==== The INFO values are the (negated) positions of the
*     .    offending arguments in the CHSEQR argument list. ====
*
      info = 0
      IF( .NOT.lsame( job, 'E' ) .AND. .NOT.wantt ) THEN
         info = -1
      ELSE IF( .NOT.lsame( compz, 'N' ) .AND. .NOT.wantz ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( ilo.LT.1 .OR. ilo.GT.max( 1, n ) ) THEN
         info = -4
      ELSE IF( ihi.LT.min( ilo, n ) .OR. ihi.GT.n ) THEN
         info = -5
      ELSE IF( ldh.LT.max( 1, n ) ) THEN
         info = -7
      ELSE IF( ldz.LT.1 .OR. ( wantz .AND. ldz.LT.max( 1, n ) ) ) THEN
         info = -10
      ELSE IF( lwork.LT.max( 1, n ) .AND. .NOT.lquery ) THEN
         info = -12
      END IF
*
      IF( info.NE.0 ) THEN
*
*        ==== Quick return in case of invalid argument. ====
*
         CALL xerbla( 'CHSEQR', -info )
         RETURN
*
      ELSE IF( n.EQ.0 ) THEN
*
*        ==== Quick return in case N = 0; nothing to do. ====
*
         RETURN
*
      ELSE IF( lquery ) THEN
*
*        ==== Quick return in case of a workspace query ====
*
*        ==== LWORK is -1 here and is forwarded unchanged to CLAQR0,
*        .    whose answer is read back from WORK(1). ====
*
         CALL claqr0( wantt, wantz, n, ilo, ihi, h, ldh, w, ilo, ihi, z,
     $                ldz, work, lwork, info )
*        ==== Ensure reported workspace size is backward-compatible with
*        .    previous LAPACK versions. ====
         work( 1 ) = cmplx( max( real( work( 1 ) ), real( max( 1,
     $               n ) ) ), rzero )
         RETURN
*
      ELSE
*
*        ==== copy eigenvalues isolated by CGEBAL ====
*
*        ==== A stride of LDH+1 steps along the diagonal of H, so
*        .    these calls copy H(j,j) into W(j) for j = 1:ILO-1 and
*        .    j = IHI+1:N. ====
*
         IF( ilo.GT.1 )
     $      CALL ccopy( ilo-1, h, ldh+1, w, 1 )
         IF( ihi.LT.n )
     $      CALL ccopy( n-ihi, h( ihi+1, ihi+1 ), ldh+1, w( ihi+1 ), 1 )
*
*        ==== Initialize Z, if requested ====
*
         IF( initz )
     $      CALL claset( 'A', n, n, zero, one, z, ldz )
*
*        ==== Quick return if possible ====
*
*        ==== The active block is 1-by-1, so its single diagonal
*        .    entry is taken as the eigenvalue. ====
*
         IF( ilo.EQ.ihi ) THEN
            w( ilo ) = h( ilo, ilo )
            RETURN
         END IF
*
*        ==== CLAHQR/CLAQR0 crossover point ====
*
*        ==== The ILAENV value is never allowed below NTINY. ====
*
         nmin = ilaenv( 12, 'CHSEQR', job( : 1 ) // compz( : 1 ), n,
     $          ilo, ihi, lwork )
         nmin = max( ntiny, nmin )
*
*        ==== CLAQR0 for big matrices; CLAHQR for small ones ====
*
         IF( n.GT.nmin ) THEN
            CALL claqr0( wantt, wantz, n, ilo, ihi, h, ldh, w, ilo, ihi,
     $                   z, ldz, work, lwork, info )
         ELSE
*
*           ==== Small matrix ====
*
            CALL clahqr( wantt, wantz, n, ilo, ihi, h, ldh, w, ilo, ihi,
     $                   z, ldz, info )
*
            IF( info.GT.0 ) THEN
*
*              ==== A rare CLAHQR failure!  CLAQR0 sometimes succeeds
*              .    when CLAHQR fails. ====
*
*              ==== The retry passes KBOT (the INFO returned by
*              .    CLAHQR) in place of IHI as the bottom of the
*              .    active block. ====
*
               kbot = info
*
               IF( n.GE.nl ) THEN
*
*                 ==== Larger matrices have enough subdiagonal scratch
*                 .    space to call CLAQR0 directly. ====
*
                  CALL claqr0( wantt, wantz, n, ilo, kbot, h, ldh, w,
     $                         ilo, ihi, z, ldz, work, lwork, info )
*
               ELSE
*
*                 ==== Tiny matrices don't have enough subdiagonal
*                 .    scratch space to benefit from CLAQR0.  Hence,
*                 .    tiny matrices must be copied into a larger
*                 .    array before calling CLAQR0. ====
*
*                 ==== H goes into the leading N-by-N corner of HL;
*                 .    HL(N+1,N) and columns N+1:NL are zeroed.
*                 .    CLAQR0 is then called with order NL, leading
*                 .    dimension NL and workspace WORKL of length NL.
*                 .    The corner is copied back to H only when the
*                 .    Schur form is wanted or the retry also
*                 .    returned a nonzero INFO. ====
*
                  CALL clacpy( 'A', n, n, h, ldh, hl, nl )
                  hl( n+1, n ) = zero
                  CALL claset( 'A', nl, nl-n, zero, zero, hl( 1, n+1 ),
     $                         nl )
                  CALL claqr0( wantt, wantz, nl, ilo, kbot, hl, nl, w,
     $                         ilo, ihi, z, ldz, workl, nl, info )
                  IF( wantt .OR. info.NE.0 )
     $               CALL clacpy( 'A', n, n, hl, nl, h, ldh )
               END IF
            END IF
         END IF
*
*        ==== Clear out the trash, if necessary. ====
*
*        ==== Zeroes the lower triangle of the (N-2)-by-(N-2) block
*        .    starting at H(3,1), i.e. every entry below the first
*        .    subdiagonal of H. ====
*
         IF( ( wantt .OR. info.NE.0 ) .AND. n.GT.2 )
     $      CALL claset( 'L', n-2, n-2, zero, zero, h( 3, 1 ), ldh )
*
*        ==== Ensure reported workspace size is backward-compatible with
*        .    previous LAPACK versions. ====
*
         work( 1 ) = cmplx( max( real( max( 1, n ) ),
     $               real( work( 1 ) ) ), rzero )
      END IF
*
*     ==== End of CHSEQR ====
*

◆ cla_lin_berr()

subroutine cla_lin_berr	(	integer	n,
		integer	nz,
		integer	nrhs,
		complex, dimension( n, nrhs )	res,
		real, dimension( n, nrhs )	ayb,
		real, dimension( nrhs )	berr )

CLA_LIN_BERR computes a component-wise relative backward error.

Download CLA_LIN_BERR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!>    CLA_LIN_BERR computes componentwise relative backward error from
!>    the formula
!>        max(i) ( abs(R(i)) / ( abs(op(A_s))*abs(Y) + abs(B_s) )(i) )
!>    where abs(Z) is the componentwise absolute value of the matrix
!>    or vector Z.
!>

Parameters

[in]	N	!> N is INTEGER !> The number of linear equations, i.e., the order of the !> matrix A. N >= 0. !>
[in]	NZ	!> NZ is INTEGER !> We add (NZ+1)*SLAMCH( 'Safe minimum' ) to R(i) in the numerator to !> guard against spuriously zero residuals. Default value is N. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrices AYB, RES, and BERR. NRHS >= 0. !>
[in]	RES	!> RES is COMPLEX array, dimension (N,NRHS) !> The residual matrix, i.e., the matrix R in the relative backward !> error formula above. !>
[in]	AYB	!> AYB is REAL array, dimension (N, NRHS) !> The denominator in the relative backward error formula above, i.e., !> the matrix abs(op(A_s))*abs(Y) + abs(B_s). The matrices A, Y, and B !> are from iterative refinement (see cla_gerfsx_extended.f). !>
[out]	BERR	!> BERR is REAL array, dimension (NRHS) !> The componentwise relative backward error from the formula above. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 100 of file cla_lin_berr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of CLA_LIN_BERR.  For each right-hand side J, BERR(J) is set
*  to the largest ratio ( SAFE1 + CABS1(RES(I,J)) ) / AYB(I,J) taken
*  over the rows I whose AYB(I,J) is nonzero; BERR(J) is 0 when every
*  AYB(I,J) is zero or N < 1.
*
*     .. Scalar Arguments ..
      INTEGER            N, NZ, NRHS
*     ..
*     .. Array Arguments ..
      REAL               AYB( N, NRHS ), BERR( NRHS )
      COMPLEX            RES( N, NRHS )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      REAL               TMP, SAFE1
      INTEGER            I, J
      COMPLEX            CDUM
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, real, aimag, max
*     ..
*     .. External Functions ..
      EXTERNAL           slamch
      REAL               SLAMCH
*     ..
*     .. Statement Functions ..
*     CABS1 yields the real quantity |Re(z)| + |Im(z)|, so it is typed
*     REAL.  Typing it COMPLEX would force the real result through a
*     complex intermediate that is truncated again when stored in TMP.
      REAL               CABS1
*     ..
*     .. Statement Function Definitions ..
      cabs1( cdum ) = abs( real( cdum ) ) + abs( aimag( cdum ) )
*     ..
*     .. Executable Statements ..
*
*     Adding SAFE1 to the numerator guards against spuriously zero
*     residuals.  A similar safeguard is in the CLA_yyAMV routine used
*     to compute AYB.
*
      safe1 = slamch( 'Safe minimum' )
      safe1 = (nz+1)*safe1
*
      DO j = 1, nrhs
         berr(j) = 0.0
         DO i = 1, n
*
*     Rows with AYB exactly 0.0 are skipped: if AYB was computed by
*     CLA_yyAMV, then we know the true residual also must be exactly
*     0.0, and skipping the row avoids a division by zero.
*
            IF (ayb(i,j) .NE. 0.0) THEN
               tmp = (safe1 + cabs1(res(i,j)))/ayb(i,j)
               berr(j) = max( berr(j), tmp )
            END IF
         END DO
      END DO
*
*     End of CLA_LIN_BERR
*

◆ cla_wwaddw()

subroutine cla_wwaddw	(	integer	n,
		complex, dimension( * )	x,
		complex, dimension( * )	y,
		complex, dimension( * )	w )

CLA_WWADDW adds a vector into a doubled-single vector.

Download CLA_WWADDW + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!>    CLA_WWADDW adds a vector W into a doubled-single vector (X, Y).
!>
!>    This works for all extant IBM's hex and binary floating point
!>    arithmetic, but not for decimal.
!>

Parameters

[in]	N	!> N is INTEGER !> The length of vectors X, Y, and W. !>
[in,out]	X	!> X is COMPLEX array, dimension (N) !> The first part of the doubled-single accumulation vector. !>
[in,out]	Y	!> Y is COMPLEX array, dimension (N) !> The second part of the doubled-single accumulation vector. !>
[in]	W	!> W is COMPLEX array, dimension (N) !> The vector to be added. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 80 of file cla_wwaddw.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of CLA_WWADDW.  For K = 1:N the entry W(K) is added to X(K);
*  the new X(K) is the rounded sum and Y(K) is increased by what is
*  left over, (X(K) - sum) + W(K), evaluated with the old X(K).
*
*     .. Scalar Arguments ..
      INTEGER            N
*     ..
*     .. Array Arguments ..
      COMPLEX            X( * ), Y( * ), W( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            K
      COMPLEX            HEAD
*     ..
*     .. Executable Statements ..
*
*     The order of the floating point operations below is significant
*     and must be kept exactly as written.
*
      DO k = 1, n
         head = x( k ) + w( k )
         head = ( head + head ) - head
         y( k ) = ( ( x( k ) - head ) + w( k ) ) + y( k )
         x( k ) = head
      END DO
      RETURN
*
*     End of CLA_WWADDW
*

◆ claed0()

subroutine claed0	(	integer	qsiz,
		integer	n,
		real, dimension( * )	d,
		real, dimension( * )	e,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		complex, dimension( ldqs, * )	qstore,
		integer	ldqs,
		real, dimension( * )	rwork,
		integer, dimension( * )	iwork,
		integer	info )

CLAED0 used by CSTEDC. Computes all eigenvalues and corresponding eigenvectors of an unreduced symmetric tridiagonal matrix using the divide and conquer method.

Download CLAED0 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> Using the divide and conquer method, CLAED0 computes all eigenvalues
!> of a symmetric tridiagonal matrix which is one diagonal block of
!> those from reducing a dense or band Hermitian matrix and
!> corresponding eigenvectors of the dense or band matrix.
!>

Parameters

[in]	QSIZ	!> QSIZ is INTEGER !> The dimension of the unitary matrix used to reduce !> the full matrix to tridiagonal form. QSIZ >= N. !> (CLAED0 has no ICOMPQ argument; the check is unconditional.) !>
[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the diagonal elements of the tridiagonal matrix. !> On exit, the eigenvalues in ascending order. !>
[in,out]	E	!> E is REAL array, dimension (N-1) !> On entry, the off-diagonal elements of the tridiagonal matrix. !> On exit, E has been destroyed. !>
[in,out]	Q	!> Q is COMPLEX array, dimension (LDQ,N) !> On entry, Q must contain a QSIZ x N matrix whose columns !> are unitarily orthonormal. It is a part of the unitary matrix !> that reduces the full dense Hermitian matrix to a !> (reducible) symmetric tridiagonal matrix. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N). !>
[out]	IWORK	!> IWORK is INTEGER array, !> the dimension of IWORK must be at least !> 6 + 6N + 5N*lg N !> ( lg( N ) = smallest integer k !> such that 2^k >= N ) !>
[out]	RWORK	!> RWORK is REAL array, !> dimension (1 + 3N + 2Nlg N + 3N**2) !> ( lg( N ) = smallest integer k !> such that 2^k >= N ) !>
[out]	QSTORE	!> QSTORE is COMPLEX array, dimension (LDQS, N) !> Used to store parts of !> the eigenvector matrix when the updating matrix multiplies !> take place. !>
[in]	LDQS	!> LDQS is INTEGER !> The leading dimension of the array QSTORE. !> LDQS >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: The algorithm failed to compute an eigenvalue while !> working on the submatrix lying in rows and columns !> INFO/(N+1) through mod(INFO,N+1). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 143 of file claed0.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Overview of the executable part below:
*    1. Validate QSIZ, N, LDQ and LDQS; errors are reported through
*       XERBLA.
*    2. Repeatedly halve the problem until the last subproblem size
*       held in IWORK is at most SMLSIZ, then convert the sizes into
*       cumulative end positions.
*    3. Subtract ABS( E ) from the two diagonal entries adjacent to
*       each cut.
*    4. Solve every leaf subproblem with SSTEQR and multiply the
*       matching columns of Q by its eigenvectors (CLACRM), storing
*       the product in QSTORE.
*    5. Merge adjacent subproblems pairwise with CLAED7 until a
*       single problem remains.
*    6. Reorder D and the columns of QSTORE through the INDXQ
*       permutation, writing the eigenvectors back into Q.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDQ, LDQS, N, QSIZ
*     ..
*     .. Array Arguments ..
      INTEGER            IWORK( * )
      REAL               D( * ), E( * ), RWORK( * )
      COMPLEX            Q( LDQ, * ), QSTORE( LDQS, * )
*     ..
*
*  =====================================================================
*
*  Warning:      N could be as big as QSIZ!
*
*     .. Parameters ..
      REAL               TWO
      parameter( two = 2.e+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            CURLVL, CURPRB, CURR, I, IGIVCL, IGIVNM,
     $                   IGIVPT, INDXQ, IPERM, IPRMPT, IQ, IQPTR, IWREM,
     $                   J, K, LGN, LL, MATSIZ, MSD2, SMLSIZ, SMM1,
     $                   SPM1, SPM2, SUBMAT, SUBPBS, TLVLS
      REAL               TEMP
*     ..
*     .. External Subroutines ..
      EXTERNAL           ccopy, clacrm, claed7, scopy, ssteqr, xerbla
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, int, log, max, real
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
*     The commented-out lines below are a retained ICOMPQ check; this
*     routine has no ICOMPQ argument, so only the QSIZ test is active.
*
*     IF( ICOMPQ .LT. 0 .OR. ICOMPQ .GT. 2 ) THEN
*        INFO = -1
*     ELSE IF( ( ICOMPQ .EQ. 1 ) .AND. ( QSIZ .LT. MAX( 0, N ) ) )
*    $        THEN
      IF( qsiz.LT.max( 0, n ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -6
      ELSE IF( ldqs.LT.max( 1, n ) ) THEN
         info = -8
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CLAED0', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     SMLSIZ is the subproblem size threshold, queried from ILAENV
*     with ISPEC = 9.
*
      smlsiz = ilaenv( 9, 'CLAED0', ' ', 0, 0, 0, 0 )
*
*     Determine the size and placement of the submatrices, and save in
*     the leading elements of IWORK.
*
      iwork( 1 ) = n
      subpbs = 1
      tlvls = 0
   10 CONTINUE
      IF( iwork( subpbs ).GT.smlsiz ) THEN
*
*        Split every current size into its floor and ceiling halves.
*        J runs downwards so that an entry is read before the slots
*        2*J-1 and 2*J (both >= J) are written.
*
         DO 20 j = subpbs, 1, -1
            iwork( 2*j ) = ( iwork( j )+1 ) / 2
            iwork( 2*j-1 ) = iwork( j ) / 2
   20    CONTINUE
         tlvls = tlvls + 1
         subpbs = 2*subpbs
         GO TO 10
      END IF
*
*     Turn the list of sizes into cumulative end positions, so that
*     IWORK( J ) is the last row/column of subproblem J.
*
      DO 30 j = 2, subpbs
         iwork( j ) = iwork( j ) + iwork( j-1 )
   30 CONTINUE
*
*     Divide the matrix into SUBPBS submatrices of size at most SMLSIZ+1
*     using rank-1 modifications (cuts).
*
      spm1 = subpbs - 1
      DO 40 i = 1, spm1
         submat = iwork( i ) + 1
         smm1 = submat - 1
         d( smm1 ) = d( smm1 ) - abs( e( smm1 ) )
         d( submat ) = d( submat ) - abs( e( smm1 ) )
   40 CONTINUE
*
      indxq = 4*n + 3
*
*     Set up workspaces for eigenvalues only/accumulate new vectors
*     routine
*
*     LGN is meant to be the smallest integer with 2**LGN >= N.  The
*     correction is applied twice; presumably this guards against the
*     floating-point logarithm coming out too small -- TODO confirm.
*
      temp = log( real( n ) ) / log( two )
      lgn = int( temp )
      IF( 2**lgn.LT.n )
     $   lgn = lgn + 1
      IF( 2**lgn.LT.n )
     $   lgn = lgn + 1
*
*     Offsets into IWORK of the bookkeeping arrays passed to CLAED7
*     (PRMPTR, PERM, QPTR, GIVPTR, GIVCOL).
*
      iprmpt = indxq + n + 1
      iperm = iprmpt + n*lgn
      iqptr = iperm + n*lgn
      igivpt = iqptr + n + 2
      igivcl = igivpt + n*lgn
*
*     Offsets into RWORK: Givens values (passed to CLAED7 as GIVNUM),
*     stored eigenvector blocks (QSTORE), and the remaining scratch
*     space.
*
      igivnm = 1
      iq = igivnm + 2*n*lgn
      iwrem = iq + n**2 + 1
*     Initialize pointers
      DO 50 i = 0, subpbs
         iwork( iprmpt+i ) = 1
         iwork( igivpt+i ) = 1
   50 CONTINUE
      iwork( iqptr ) = 1
*
*     Solve each submatrix eigenproblem at the bottom of the divide and
*     conquer tree.
*
      curr = 0
      DO 70 i = 0, spm1
         IF( i.EQ.0 ) THEN
            submat = 1
            matsiz = iwork( 1 )
         ELSE
            submat = iwork( i ) + 1
            matsiz = iwork( i+1 ) - iwork( i )
         END IF
*
*        LL is the position in RWORK of this leaf's MATSIZ-by-MATSIZ
*        eigenvector block.  The start of RWORK is handed to SSTEQR
*        as its work array.
*
         ll = iq - 1 + iwork( iqptr+curr )
         CALL ssteqr( 'I', matsiz, d( submat ), e( submat ),
     $                rwork( ll ), matsiz, rwork, info )
*
*        QSTORE( :, SUBMAT: ) receives Q( :, SUBMAT: ) times the
*        real eigenvector block.
*        NOTE(review): INFO from SSTEQR is only tested after this
*        CLACRM call and the pointer update have been executed.
*
         CALL clacrm( qsiz, matsiz, q( 1, submat ), ldq, rwork( ll ),
     $                matsiz, qstore( 1, submat ), ldqs,
     $                rwork( iwrem ) )
         iwork( iqptr+curr+1 ) = iwork( iqptr+curr ) + matsiz**2
         curr = curr + 1
         IF( info.GT.0 ) THEN
            info = submat*( n+1 ) + submat + matsiz - 1
            RETURN
         END IF
*
*        Start this leaf's part of the INDXQ permutation as the
*        local identity 1, 2, ..., MATSIZ.
*
         k = 1
         DO 60 j = submat, iwork( i+1 )
            iwork( indxq+j ) = k
            k = k + 1
   60    CONTINUE
   70 CONTINUE
*
*     Successively merge eigensystems of adjacent submatrices
*     into eigensystem for the corresponding larger matrix.
*
*     while ( SUBPBS > 1 )
*
      curlvl = 1
   80 CONTINUE
      IF( subpbs.GT.1 ) THEN
         spm2 = subpbs - 2
         DO 90 i = 0, spm2, 2
*
*           SUBMAT/MATSIZ describe the merged problem, MSD2 is the
*           size of its first half, and CURPRB numbers the merges of
*           this level starting from zero.
*
            IF( i.EQ.0 ) THEN
               submat = 1
               matsiz = iwork( 2 )
               msd2 = iwork( 1 )
               curprb = 0
            ELSE
               submat = iwork( i ) + 1
               matsiz = iwork( i+2 ) - iwork( i )
               msd2 = matsiz / 2
               curprb = curprb + 1
            END IF
*
*     Merge lower order eigensystems (of size MSD2 and MATSIZ - MSD2)
*     into an eigensystem of size MATSIZ.  CLAED7 handles the case
*     when the eigenvectors of a full or band Hermitian matrix (which
*     was reduced to tridiagonal form) are desired.
*
*     Q is passed to CLAED7 as its complex work array; it only
*     receives the final eigenvectors in loop 100 below.
*
            CALL claed7( matsiz, msd2, qsiz, tlvls, curlvl, curprb,
     $                   d( submat ), qstore( 1, submat ), ldqs,
     $                   e( submat+msd2-1 ), iwork( indxq+submat ),
     $                   rwork( iq ), iwork( iqptr ), iwork( iprmpt ),
     $                   iwork( iperm ), iwork( igivpt ),
     $                   iwork( igivcl ), rwork( igivnm ),
     $                   q( 1, submat ), rwork( iwrem ),
     $                   iwork( subpbs+1 ), info )
            IF( info.GT.0 ) THEN
               info = submat*( n+1 ) + submat + matsiz - 1
               RETURN
            END IF
*
*           Record the end position of the merged problem in the
*           slot used by the next level.
*
            iwork( i / 2+1 ) = iwork( i+2 )
   90    CONTINUE
         subpbs = subpbs / 2
         curlvl = curlvl + 1
         GO TO 80
      END IF
*
*     end while
*
*     Re-merge the eigenvalues/vectors which were deflated at the final
*     merge step.
*
*     RWORK( 1:N ) temporarily holds the permuted eigenvalues before
*     they are copied back to D.
*
      DO 100 i = 1, n
         j = iwork( indxq+i )
         rwork( i ) = d( j )
         CALL ccopy( qsiz, qstore( 1, j ), 1, q( 1, i ), 1 )
  100 CONTINUE
      CALL scopy( n, rwork, 1, d, 1 )
*
      RETURN
*
*     End of CLAED0
*

◆ claed7()

subroutine claed7	(	integer	n,
		integer	cutpnt,
		integer	qsiz,
		integer	tlvls,
		integer	curlvl,
		integer	curpbm,
		real, dimension( * )	d,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		real	rho,
		integer, dimension( * )	indxq,
		real, dimension( * )	qstore,
		integer, dimension( * )	qptr,
		integer, dimension( * )	prmptr,
		integer, dimension( * )	perm,
		integer, dimension( * )	givptr,
		integer, dimension( 2, * )	givcol,
		real, dimension( 2, * )	givnum,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer, dimension( * )	iwork,
		integer	info )

CLAED7 used by CSTEDC. Computes the updated eigensystem of a diagonal matrix after modification by a rank-one symmetric matrix. Used when the original matrix is dense.

Download CLAED7 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CLAED7 computes the updated eigensystem of a diagonal
!> matrix after modification by a rank-one symmetric matrix. This
!> routine is used only for the eigenproblem which requires all
!> eigenvalues and optionally eigenvectors of a dense or banded
!> Hermitian matrix that has been reduced to tridiagonal form.
!>
!>   T = Q(in) ( D(in) + RHO * Z*Z**H ) Q**H(in) = Q(out) * D(out) * Q**H(out)
!>
!>   where Z = Q**H*u, u is a vector of length N with ones in the
!>   CUTPNT and CUTPNT + 1 th elements and zeros elsewhere.
!>
!>    The eigenvectors of the original matrix are stored in Q, and the
!>    eigenvalues are in D.  The algorithm consists of three stages:
!>
!>       The first stage consists of deflating the size of the problem
!>       when there are multiple eigenvalues or if there is a zero in
!>       the Z vector.  For each such occurrence the dimension of the
!>       secular equation problem is reduced by one.  This stage is
!>       performed by the routine CLAED8.
!>
!>       The second stage consists of calculating the updated
!>       eigenvalues. This is done by finding the roots of the secular
!>       equation via the routine SLAED4 (as called by SLAED9).
!>       This routine also calculates the eigenvectors of the current
!>       problem.
!>
!>       The final stage consists of computing the updated eigenvectors
!>       directly using the updated eigenvalues.  The eigenvectors for
!>       the current problem are multiplied with the eigenvectors from
!>       the overall problem.
!>

Parameters

[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in]	CUTPNT	!> CUTPNT is INTEGER !> Contains the location of the last eigenvalue in the leading !> sub-matrix. min(1,N) <= CUTPNT <= N. !>
[in]	QSIZ	!> QSIZ is INTEGER !> The dimension of the unitary matrix used to reduce !> the full matrix to tridiagonal form. QSIZ >= N. !>
[in]	TLVLS	!> TLVLS is INTEGER !> The total number of merging levels in the overall divide and !> conquer tree. !>
[in]	CURLVL	!> CURLVL is INTEGER !> The current level in the overall merge routine, !> 0 <= curlvl <= tlvls. !>
[in]	CURPBM	!> CURPBM is INTEGER !> The current problem in the current level in the overall !> merge routine (counting from upper left to lower right). !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the eigenvalues of the rank-1-perturbed matrix. !> On exit, the eigenvalues of the repaired matrix. !>
[in,out]	Q	!> Q is COMPLEX array, dimension (LDQ,N) !> On entry, the eigenvectors of the rank-1-perturbed matrix. !> On exit, the eigenvectors of the repaired tridiagonal matrix. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N). !>
[in]	RHO	!> RHO is REAL !> Contains the subdiagonal element used to create the rank-1 !> modification. !>
[out]	INDXQ	!> INDXQ is INTEGER array, dimension (N) !> This contains the permutation which will reintegrate the !> subproblem just solved back into sorted order, !> i.e. D( INDXQ( I = 1, N ) ) will be in ascending order. !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (4*N) !>
[out]	RWORK	!> RWORK is REAL array, !> dimension (3N+2QSIZ*N) !>
[out]	WORK	!> WORK is COMPLEX array, dimension (QSIZ*N) !>
[in,out]	QSTORE	!> QSTORE is REAL array, dimension (N**2+1) !> Stores eigenvectors of submatrices encountered during !> divide and conquer, packed together. QPTR points to !> beginning of the submatrices. !>
[in,out]	QPTR	!> QPTR is INTEGER array, dimension (N+2) !> List of indices pointing to beginning of submatrices stored !> in QSTORE. The submatrices are numbered starting at the !> bottom left of the divide and conquer tree, from left to !> right and bottom to top. !>
[in]	PRMPTR	!> PRMPTR is INTEGER array, dimension (N lg N) !> Contains a list of pointers which indicate where in PERM a !> level's permutation is stored. PRMPTR(i+1) - PRMPTR(i) !> indicates the size of the permutation and also the size of !> the full, non-deflated problem. !>
[in]	PERM	!> PERM is INTEGER array, dimension (N lg N) !> Contains the permutations (from deflation and sorting) to be !> applied to each eigenblock. !>
[in]	GIVPTR	!> GIVPTR is INTEGER array, dimension (N lg N) !> Contains a list of pointers which indicate where in GIVCOL a !> level's Givens rotations are stored. GIVPTR(i+1) - GIVPTR(i) !> indicates the number of Givens rotations. !>
[in]	GIVCOL	!> GIVCOL is INTEGER array, dimension (2, N lg N) !> Each pair of numbers indicates a pair of columns to take place !> in a Givens rotation. !>
[in]	GIVNUM	!> GIVNUM is REAL array, dimension (2, N lg N) !> Each number indicates the S value to be used in the !> corresponding Givens rotation. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: if INFO = 1, an eigenvalue did not converge !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 245 of file claed7.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Overview of the executable part below:
*    1. Validate N, CUTPNT, QSIZ and LDQ; errors are reported through
*       XERBLA.
*    2. Locate the slot CURR of this merge in QPTR/PRMPTR/GIVPTR and
*       form the z-vector with SLAEDA.
*    3. Sort and deflate with CLAED8, which returns the order K of
*       the secular equation.
*    4. If K is nonzero, solve the secular equation with SLAED9,
*       update the eigenvectors with CLACRM and build INDXQ with
*       SLAMRG; otherwise set INDXQ to the identity.
*
*     .. Scalar Arguments ..
      INTEGER            CURLVL, CURPBM, CUTPNT, INFO, LDQ, N, QSIZ,
     $                   TLVLS
      REAL               RHO
*     ..
*     .. Array Arguments ..
      INTEGER            GIVCOL( 2, * ), GIVPTR( * ), INDXQ( * ),
     $                   IWORK( * ), PERM( * ), PRMPTR( * ), QPTR( * )
      REAL               D( * ), GIVNUM( 2, * ), QSTORE( * ), RWORK( * )
      COMPLEX            Q( LDQ, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            COLTYP, CURR, I, IDLMDA, INDX,
     $                   INDXC, INDXP, IQ, IW, IZ, K, N1, N2, PTR
*     ..
*     .. External Subroutines ..
      EXTERNAL           clacrm, claed8, slaed9, slaeda, slamrg, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
*     The commented-out lines below are a retained ICOMPQ check; this
*     routine has no ICOMPQ argument.
*
*     IF( ICOMPQ.LT.0 .OR. ICOMPQ.GT.1 ) THEN
*        INFO = -1
*     ELSE IF( N.LT.0 ) THEN
      IF( n.LT.0 ) THEN
         info = -1
      ELSE IF( min( 1, n ).GT.cutpnt .OR. n.LT.cutpnt ) THEN
         info = -2
      ELSE IF( qsiz.LT.n ) THEN
         info = -3
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -9
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CLAED7', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     The following values are for bookkeeping purposes only.  They are
*     integer pointers which indicate the portion of the workspace
*     used by a particular array in CLAED8 and SLAED9.
*
*     Offsets into RWORK: z-vector, DLAMDA, W, then scratch space.
*
      iz = 1
      idlmda = iz + n
      iw = idlmda + n
      iq = iw + n
*
*     Offsets into IWORK.  Only INDX and INDXP are passed on below;
*     INDXC and COLTYP merely fix the position of INDXP.
*
      indx = 1
      indxc = indx + n
      coltyp = indxc + n
      indxp = coltyp + n
*
*     Form the z-vector which consists of the last row of Q_1 and the
*     first row of Q_2.
*
*     CURR is the slot of this merge in QPTR, PRMPTR and GIVPTR: skip
*     1 + 2**TLVLS entries, then 2**( TLVLS-I ) entries for every
*     level I below CURLVL, then add the problem number CURPBM.
*
      ptr = 1 + 2**tlvls
      DO 10 i = 1, curlvl - 1
         ptr = ptr + 2**( tlvls-i )
   10 CONTINUE
      curr = ptr + curpbm
      CALL slaeda( n, tlvls, curlvl, curpbm, prmptr, perm, givptr,
     $             givcol, givnum, qstore, qptr, rwork( iz ),
     $             rwork( iz+n ), info )
*
*     When solving the final problem, we no longer need the stored data,
*     so we will overwrite the data from this level onto the previously
*     used storage space.
*
      IF( curlvl.EQ.tlvls ) THEN
         qptr( curr ) = 1
         prmptr( curr ) = 1
         givptr( curr ) = 1
      END IF
*
*     Sort and Deflate eigenvalues.
*
*     WORK (leading dimension QSIZ) is passed as CLAED8's Q2 argument.
*     CLAED8 returns the number of rotations of this merge in
*     GIVPTR( CURR+1 ); adding GIVPTR( CURR ) afterwards turns it
*     into the start pointer of the next problem.
*
      CALL claed8( k, n, qsiz, q, ldq, d, rho, cutpnt, rwork( iz ),
     $             rwork( idlmda ), work, qsiz, rwork( iw ),
     $             iwork( indxp ), iwork( indx ), indxq,
     $             perm( prmptr( curr ) ), givptr( curr+1 ),
     $             givcol( 1, givptr( curr ) ),
     $             givnum( 1, givptr( curr ) ), info )
      prmptr( curr+1 ) = prmptr( curr ) + n
      givptr( curr+1 ) = givptr( curr+1 ) + givptr( curr )
*
*     Solve Secular Equation.
*
      IF( k.NE.0 ) THEN
*
*        SLAED9 stores its K-by-K result at QSTORE( QPTR( CURR ) );
*        CLACRM then multiplies WORK by that block and writes the
*        product to Q.
*        NOTE(review): INFO from SLAED9 is only tested after CLACRM
*        and the QPTR update have been executed.
*
         CALL slaed9( k, 1, k, n, d, rwork( iq ), k, rho,
     $                rwork( idlmda ), rwork( iw ),
     $                qstore( qptr( curr ) ), k, info )
         CALL clacrm( qsiz, k, work, qsiz, qstore( qptr( curr ) ), k, q,
     $                ldq, rwork( iq ) )
         qptr( curr+1 ) = qptr( curr ) + k**2
         IF( info.NE.0 ) THEN
            RETURN
         END IF
*
*     Prepare the INDXQ sorting permutation.
*
         n1 = k
         n2 = n - k
         CALL slamrg( n1, n2, d, 1, -1, indxq )
      ELSE
*
*        K = 0: nothing is stored for this merge and INDXQ is the
*        identity permutation.
*
         qptr( curr+1 ) = qptr( curr )
         DO 20 i = 1, n
            indxq( i ) = i
   20    CONTINUE
      END IF
*
      RETURN
*
*     End of CLAED7
*

◆ claed8()

subroutine claed8	(	integer	k,
		integer	n,
		integer	qsiz,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		real, dimension( * )	d,
		real	rho,
		integer	cutpnt,
		real, dimension( * )	z,
		real, dimension( * )	dlamda,
		complex, dimension( ldq2, * )	q2,
		integer	ldq2,
		real, dimension( * )	w,
		integer, dimension( * )	indxp,
		integer, dimension( * )	indx,
		integer, dimension( * )	indxq,
		integer, dimension( * )	perm,
		integer	givptr,
		integer, dimension( 2, * )	givcol,
		real, dimension( 2, * )	givnum,
		integer	info )

CLAED8 used by CSTEDC. Merges eigenvalues and deflates secular equation. Used when the original matrix is dense.

Download CLAED8 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CLAED8 merges the two sets of eigenvalues together into a single
!> sorted set.  Then it tries to deflate the size of the problem.
!> There are two ways in which deflation can occur:  when two or more
!> eigenvalues are close together or if there is a tiny element in the
!> Z vector.  For each such occurrence the order of the related secular
!> equation problem is reduced by one.
!>

Parameters

[out]	K	!> K is INTEGER !> Contains the number of non-deflated eigenvalues. !> This is the order of the related secular equation. !>
[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in]	QSIZ	!> QSIZ is INTEGER !> The dimension of the unitary matrix used to reduce !> the dense or band matrix to tridiagonal form. !> QSIZ >= N. !>
[in,out]	Q	!> Q is COMPLEX array, dimension (LDQ,N) !> On entry, Q contains the eigenvectors of the partially solved !> system which has been previously updated in matrix !> multiplies with other partially solved eigensystems. !> On exit, Q contains the trailing (N-K) updated eigenvectors !> (those which were deflated) in its last N-K columns. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max( 1, N ). !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, D contains the eigenvalues of the two submatrices to !> be combined. On exit, D contains the trailing (N-K) updated !> eigenvalues (those which were deflated) sorted into increasing !> order. !>
[in,out]	RHO	!> RHO is REAL !> Contains the off diagonal element associated with the rank-1 !> cut which originally split the two submatrices which are now !> being recombined. RHO is modified during the computation to !> the value required by SLAED9. !>
[in]	CUTPNT	!> CUTPNT is INTEGER !> Contains the location of the last eigenvalue in the leading !> sub-matrix. MIN(1,N) <= CUTPNT <= N. !>
[in]	Z	!> Z is REAL array, dimension (N) !> On input this vector contains the updating vector (the last !> row of the first sub-eigenvector matrix and the first row of !> the second sub-eigenvector matrix). The contents of Z are !> destroyed during the updating process. !>
[out]	DLAMDA	!> DLAMDA is REAL array, dimension (N) !> Contains a copy of the first K eigenvalues which will be used !> by SLAED9 to form the secular equation. !>
[out]	Q2	!> Q2 is COMPLEX array, dimension (LDQ2,N) !> Contains a copy of the first K eigenvectors which will be used !> by CLAED7 in a matrix multiply (CLACRM) to update the new !> eigenvectors. !>
[in]	LDQ2	!> LDQ2 is INTEGER !> The leading dimension of the array Q2. LDQ2 >= max( 1, N ). !>
[out]	W	!> W is REAL array, dimension (N) !> This will hold the first k values of the final !> deflation-altered z-vector and will be passed to SLAED9. !>
[out]	INDXP	!> INDXP is INTEGER array, dimension (N) !> This will contain the permutation used to place deflated !> values of D at the end of the array. On output INDXP(1:K) !> points to the nondeflated D-values and INDXP(K+1:N) !> points to the deflated eigenvalues. !>
[out]	INDX	!> INDX is INTEGER array, dimension (N) !> This will contain the permutation used to sort the contents of !> D into ascending order. !>
[in]	INDXQ	!> INDXQ is INTEGER array, dimension (N) !> This contains the permutation which separately sorts the two !> sub-problems in D into ascending order. Note that elements in !> the second half of this permutation must first have CUTPNT !> added to their values in order to be accurate. !>
[out]	PERM	!> PERM is INTEGER array, dimension (N) !> Contains the permutations (from deflation and sorting) to be !> applied to each eigenblock. !>
[out]	GIVPTR	!> GIVPTR is INTEGER !> Contains the number of Givens rotations which took place in !> this subproblem. !>
[out]	GIVCOL	!> GIVCOL is INTEGER array, dimension (2, N) !> Each pair of numbers indicates a pair of columns to take place !> in a Givens rotation. !>
[out]	GIVNUM	!> GIVNUM is REAL array, dimension (2, N) !> Each number indicates the S value to be used in the !> corresponding Givens rotation. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 225 of file claed8.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Overview of the executable part below:
*    1. Validate N, QSIZ, LDQ, CUTPNT and LDQ2, then zero GIVPTR.
*    2. Negate the second part of Z when RHO is negative, scale Z by
*       1/sqrt(2) and replace RHO by ABS( 2*RHO ).
*    3. Merge the two sorted eigenvalue sets with SLAMRG and permute
*       D and Z accordingly.
*    4. If RHO*max|Z| is within the tolerance, set K = 0, reorder the
*       columns of Q and return.
*    5. Otherwise scan the sorted values, deflating entries with a
*       negligible Z component or a nearly equal neighbouring
*       eigenvalue (a Givens rotation is recorded for the latter).
*    6. Gather eigenvalues/vectors into DLAMDA and Q2 and copy the
*       deflated ones back into the tail of D and Q.
*
*     .. Scalar Arguments ..
      INTEGER            CUTPNT, GIVPTR, INFO, K, LDQ, LDQ2, N, QSIZ
      REAL               RHO
*     ..
*     .. Array Arguments ..
      INTEGER            GIVCOL( 2, * ), INDX( * ), INDXP( * ),
     $                   INDXQ( * ), PERM( * )
      REAL               D( * ), DLAMDA( * ), GIVNUM( 2, * ), W( * ),
     $                   Z( * )
      COMPLEX            Q( LDQ, * ), Q2( LDQ2, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               MONE, ZERO, ONE, TWO, EIGHT
      parameter( mone = -1.0e0, zero = 0.0e0, one = 1.0e0,
     $                   two = 2.0e0, eight = 8.0e0 )
*     ..
*     .. Local Scalars ..
      INTEGER            I, IMAX, J, JLAM, JMAX, JP, K2, N1, N1P1, N2
      REAL               C, EPS, S, T, TAU, TOL
*     ..
*     .. External Functions ..
      INTEGER            ISAMAX
      REAL               SLAMCH, SLAPY2
      EXTERNAL           isamax, slamch, slapy2
*     ..
*     .. External Subroutines ..
      EXTERNAL           ccopy, clacpy, csrot, scopy, slamrg, sscal,
     $                   xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
      IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( qsiz.LT.n ) THEN
         info = -3
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -5
      ELSE IF( cutpnt.LT.min( 1, n ) .OR. cutpnt.GT.n ) THEN
         info = -8
      ELSE IF( ldq2.LT.max( 1, n ) ) THEN
         info = -12
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CLAED8', -info )
         RETURN
      END IF
*
*     Need to initialize GIVPTR to 0 here in case of quick exit
*     to prevent an unspecified code behavior (usually segfault)
*     when IWORK array on entry to *stedc is not zeroed
*     (or at least some IWORK entries which are used in *laed7 for
*     GIVPTR).
*
      givptr = 0
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
      n1 = cutpnt
      n2 = n - n1
      n1p1 = n1 + 1
*
*     For negative RHO the second part of Z changes sign; RHO itself
*     is made non-negative further down.
*
      IF( rho.LT.zero ) THEN
         CALL sscal( n2, mone, z( n1p1 ), 1 )
      END IF
*
*     Normalize z so that norm(z) = 1
*
      t = one / sqrt( two )
      DO 10 j = 1, n
         indx( j ) = j
   10 CONTINUE
      CALL sscal( n, t, z, 1 )
      rho = abs( two*rho )
*
*     Sort the eigenvalues into increasing order
*
*     The second half of INDXQ is local to the second subproblem, so
*     CUTPNT is added to make it index into the full D.
*
      DO 20 i = cutpnt + 1, n
         indxq( i ) = indxq( i ) + cutpnt
   20 CONTINUE
      DO 30 i = 1, n
         dlamda( i ) = d( indxq( i ) )
         w( i ) = z( indxq( i ) )
   30 CONTINUE
*
*     NOTE(review): the next two assignments have no effect; I and J
*     are both redefined by the DO loops that follow before they are
*     read.
*
      i = 1
      j = cutpnt + 1
      CALL slamrg( n1, n2, dlamda, 1, 1, indx )
      DO 40 i = 1, n
         d( i ) = dlamda( indx( i ) )
         z( i ) = w( indx( i ) )
   40 CONTINUE
*
*     Calculate the allowable deflation tolerance
*
*     TOL = 8 * EPS * ( largest absolute value in D ).
*
      imax = isamax( n, z, 1 )
      jmax = isamax( n, d, 1 )
      eps = slamch( 'Epsilon' )
      tol = eight*eps*abs( d( jmax ) )
*
*     If the rank-1 modifier is small enough, no more needs to be done
*     -- except to reorganize Q so that its columns correspond with the
*     elements in D.
*
      IF( rho*abs( z( imax ) ).LE.tol ) THEN
         k = 0
         DO 50 j = 1, n
            perm( j ) = indxq( indx( j ) )
            CALL ccopy( qsiz, q( 1, perm( j ) ), 1, q2( 1, j ), 1 )
   50    CONTINUE
         CALL clacpy( 'A', qsiz, n, q2( 1, 1 ), ldq2, q( 1, 1 ), ldq )
         RETURN
      END IF
*
*     If there are multiple eigenvalues then the problem deflates.  Here
*     the number of equal eigenvalues are found.  As each equal
*     eigenvalue is found, a Givens rotation is computed to rotate
*     the corresponding eigensubspace so that the corresponding
*     components of Z are zero in this new basis.
*
*     K counts the non-deflated values (stored from the front of
*     INDXP); K2 is the start of the deflated values (stored from the
*     back of INDXP).
*
      k = 0
      k2 = n + 1
*
*     Loop 60 skips leading entries with a negligible Z component and
*     stops at the first non-deflated index, kept in JLAM.
*
      DO 60 j = 1, n
         IF( rho*abs( z( j ) ).LE.tol ) THEN
*
*           Deflate due to small z component.
*
            k2 = k2 - 1
            indxp( k2 ) = j
            IF( j.EQ.n )
     $         GO TO 100
         ELSE
            jlam = j
            GO TO 70
         END IF
   60 CONTINUE
*
*     Main scan (label 70): compare each following entry J with the
*     current candidate JLAM until J passes N.
*
   70 CONTINUE
      j = j + 1
      IF( j.GT.n )
     $   GO TO 90
      IF( rho*abs( z( j ) ).LE.tol ) THEN
*
*        Deflate due to small z component.
*
         k2 = k2 - 1
         indxp( k2 ) = j
      ELSE
*
*        Check if eigenvalues are close enough to allow deflation.
*
         s = z( jlam )
         c = z( j )
*
*        Find sqrt(a**2+b**2) without overflow or
*        destructive underflow.
*
         tau = slapy2( c, s )
         t = d( j ) - d( jlam )
         c = c / tau
         s = -s / tau
         IF( abs( t*c*s ).LE.tol ) THEN
*
*           Deflation is possible.
*
            z( j ) = tau
            z( jlam ) = zero
*
*           Record the appropriate Givens rotation
*
            givptr = givptr + 1
            givcol( 1, givptr ) = indxq( indx( jlam ) )
            givcol( 2, givptr ) = indxq( indx( j ) )
            givnum( 1, givptr ) = c
            givnum( 2, givptr ) = s
*
*           Apply the rotation to the two affected columns of Q and
*           update the corresponding pair of eigenvalues.
*
            CALL csrot( qsiz, q( 1, indxq( indx( jlam ) ) ), 1,
     $                  q( 1, indxq( indx( j ) ) ), 1, c, s )
            t = d( jlam )*c*c + d( j )*s*s
            d( j ) = d( jlam )*s*s + d( j )*c*c
            d( jlam ) = t
*
*           Insert JLAM into the deflated tail INDXP( K2:N ): while
*           D( JLAM ) is smaller than the D value of the next entry,
*           that entry is moved one slot towards K2.
*
            k2 = k2 - 1
            i = 1
   80       CONTINUE
            IF( k2+i.LE.n ) THEN
               IF( d( jlam ).LT.d( indxp( k2+i ) ) ) THEN
                  indxp( k2+i-1 ) = indxp( k2+i )
                  indxp( k2+i ) = jlam
                  i = i + 1
                  GO TO 80
               ELSE
                  indxp( k2+i-1 ) = jlam
               END IF
            ELSE
               indxp( k2+i-1 ) = jlam
            END IF
            jlam = j
         ELSE
*
*           No deflation: JLAM is kept as the next non-deflated
*           value and J becomes the new candidate.
*
            k = k + 1
            w( k ) = z( jlam )
            dlamda( k ) = d( jlam )
            indxp( k ) = jlam
            jlam = j
         END IF
      END IF
      GO TO 70
   90 CONTINUE
*
*     Record the last eigenvalue.
*
      k = k + 1
      w( k ) = z( jlam )
      dlamda( k ) = d( jlam )
      indxp( k ) = jlam
*
  100 CONTINUE
*
*     Sort the eigenvalues and corresponding eigenvectors into DLAMDA
*     and Q2 respectively.  The eigenvalues/vectors which were not
*     deflated go into the first K slots of DLAMDA and Q2 respectively,
*     while those which were deflated go into the last N - K slots.
*
      DO 110 j = 1, n
         jp = indxp( j )
         dlamda( j ) = d( jp )
         perm( j ) = indxq( indx( jp ) )
         CALL ccopy( qsiz, q( 1, perm( j ) ), 1, q2( 1, j ), 1 )
  110 CONTINUE
*
*     The deflated eigenvalues and their corresponding vectors go back
*     into the last N - K slots of D and Q respectively.
*
      IF( k.LT.n ) THEN
         CALL scopy( n-k, dlamda( k+1 ), 1, d( k+1 ), 1 )
         CALL clacpy( 'A', qsiz, n-k, q2( 1, k+1 ), ldq2, q( 1, k+1 ),
     $                ldq )
      END IF
*
      RETURN
*
*     End of CLAED8
*

◆ clals0()

subroutine clals0	(	integer	icompq,
		integer	nl,
		integer	nr,
		integer	sqre,
		integer	nrhs,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldbx, * )	bx,
		integer	ldbx,
		integer, dimension( * )	perm,
		integer	givptr,
		integer, dimension( ldgcol, * )	givcol,
		integer	ldgcol,
		real, dimension( ldgnum, * )	givnum,
		integer	ldgnum,
		real, dimension( ldgnum, * )	poles,
		real, dimension( * )	difl,
		real, dimension( ldgnum, * )	difr,
		real, dimension( * )	z,
		integer	k,
		real	c,
		real	s,
		real, dimension( * )	rwork,
		integer	info )

CLALS0 applies back multiplying factors in solving the least squares problem using divide and conquer SVD approach. Used by cgelsd.

Download CLALS0 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CLALS0 applies back the multiplying factors of either the left or the
!> right singular vector matrix of a diagonal matrix appended by a row
!> to the right hand side matrix B in solving the least squares problem
!> using the divide-and-conquer SVD approach.
!>
!> For the left singular vector matrix, three types of orthogonal
!> matrices are involved:
!>
!> (1L) Givens rotations: the number of such rotations is GIVPTR; the
!>      pairs of columns/rows they were applied to are stored in GIVCOL;
!>      and the C- and S-values of these rotations are stored in GIVNUM.
!>
!> (2L) Permutation. The (NL+1)-st row of B is to be moved to the first
!>      row, and for J=2:N, PERM(J)-th row of B is to be moved to the
!>      J-th row.
!>
!> (3L) The left singular vector matrix of the remaining matrix.
!>
!> For the right singular vector matrix, four types of orthogonal
!> matrices are involved:
!>
!> (1R) The right singular vector matrix of the remaining matrix.
!>
!> (2R) If SQRE = 1, one extra Givens rotation to generate the right
!>      null space.
!>
!> (3R) The inverse transformation of (2L).
!>
!> (4R) The inverse transformation of (1L).
!>

Parameters

[in]	ICOMPQ	!> ICOMPQ is INTEGER !> Specifies whether singular vectors are to be computed in !> factored form: !> = 0: Left singular vector matrix. !> = 1: Right singular vector matrix. !>
[in]	NL	!> NL is INTEGER !> The row dimension of the upper block. NL >= 1. !>
[in]	NR	!> NR is INTEGER !> The row dimension of the lower block. NR >= 1. !>
[in]	SQRE	!> SQRE is INTEGER !> = 0: the lower block is an NR-by-NR square matrix. !> = 1: the lower block is an NR-by-(NR+1) rectangular matrix. !> !> The bidiagonal matrix has row dimension N = NL + NR + 1, !> and column dimension M = N + SQRE. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of columns of B and BX. NRHS must be at least 1. !>
[in,out]	B	!> B is COMPLEX array, dimension ( LDB, NRHS ) !> On input, B contains the right hand sides of the least !> squares problem in rows 1 through M. On output, B contains !> the solution X in rows 1 through N. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of B. LDB must be at least !> max(1,MAX( M, N ) ). !>
[out]	BX	!> BX is COMPLEX array, dimension ( LDBX, NRHS ) !>
[in]	LDBX	!> LDBX is INTEGER !> The leading dimension of BX. !>
[in]	PERM	!> PERM is INTEGER array, dimension ( N ) !> The permutations (from deflation and sorting) applied !> to the two blocks. !>
[in]	GIVPTR	!> GIVPTR is INTEGER !> The number of Givens rotations which took place in this !> subproblem. !>
[in]	GIVCOL	!> GIVCOL is INTEGER array, dimension ( LDGCOL, 2 ) !> Each pair of numbers indicates a pair of rows/columns !> involved in a Givens rotation. !>
[in]	LDGCOL	!> LDGCOL is INTEGER !> The leading dimension of GIVCOL, must be at least N. !>
[in]	GIVNUM	!> GIVNUM is REAL array, dimension ( LDGNUM, 2 ) !> Each number indicates the C or S value used in the !> corresponding Givens rotation. !>
[in]	LDGNUM	!> LDGNUM is INTEGER !> The leading dimension of arrays DIFR, POLES and !> GIVNUM, must be at least K. !>
[in]	POLES	!> POLES is REAL array, dimension ( LDGNUM, 2 ) !> On entry, POLES(1:K, 1) contains the new singular !> values obtained from solving the secular equation, and !> POLES(1:K, 2) is an array containing the poles in the secular !> equation. !>
[in]	DIFL	!> DIFL is REAL array, dimension ( K ). !> On entry, DIFL(I) is the distance between I-th updated !> (undeflated) singular value and the I-th (undeflated) old !> singular value. !>
[in]	DIFR	!> DIFR is REAL array, dimension ( LDGNUM, 2 ). !> On entry, DIFR(I, 1) contains the distances between I-th !> updated (undeflated) singular value and the I+1-th !> (undeflated) old singular value. And DIFR(I, 2) is the !> normalizing factor for the I-th right singular vector. !>
[in]	Z	!> Z is REAL array, dimension ( K ) !> Contain the components of the deflation-adjusted updating row !> vector. !>
[in]	K	!> K is INTEGER !> Contains the dimension of the non-deflated matrix, !> This is the order of the related secular equation. 1 <= K <=N. !>
[in]	C	!> C is REAL !> C contains garbage if SQRE =0 and the C-value of a Givens !> rotation related to the right null space if SQRE = 1. !>
[in]	S	!> S is REAL !> S contains garbage if SQRE =0 and the S-value of a Givens !> rotation related to the right null space if SQRE = 1. !>
[out]	RWORK	!> RWORK is REAL array, dimension !> ( K*(1+NRHS) + 2*NRHS ) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Ming Gu and Ren-Cang Li, Computer Science Division, University of California at Berkeley, USA
Osni Marques, LBNL/NERSC, USA

Definition at line 267 of file clals0.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
!     Body of CLALS0 (the SUBROUTINE statement is not part of this
!     listing).  It applies the stored factors of one subproblem -
!     Givens rotations, a row permutation and the vectors built from
!     POLES / DIFL / DIFR / Z - to the NRHS complex columns of B, with
!     BX and RWORK used as workspace.  ICOMPQ = 0 runs the left-side
!     steps (1L)-(3L); ICOMPQ = 1 runs the right-side steps (1R)-(4R).
!     On both paths the last writes go to B.
*     .. Scalar Arguments ..
      INTEGER            GIVPTR, ICOMPQ, INFO, K, LDB, LDBX, LDGCOL,
     $                   LDGNUM, NL, NR, NRHS, SQRE
      REAL               C, S
*     ..
*     .. Array Arguments ..
      INTEGER            GIVCOL( LDGCOL, * ), PERM( * )
      REAL               DIFL( * ), DIFR( LDGNUM, * ),
     $                   GIVNUM( LDGNUM, * ), POLES( LDGNUM, * ),
     $                   RWORK( * ), Z( * )
      COMPLEX            B( LDB, * ), BX( LDBX, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO, NEGONE
      parameter( one = 1.0e0, zero = 0.0e0, negone = -1.0e0 )
*     ..
*     .. Local Scalars ..
!     I, J, JCOL, JROW : loop counters (I doubles as an RWORK cursor).
!     M, N, NLP1       : N = NL+NR+1, M = N+SQRE, NLP1 = NL+1.
!     DIFLJ .. DSIGJP  : per-J copies of DIFL / DIFR / POLES entries.
!     TEMP             : value returned by SNRM2 for the current J.
      INTEGER            I, J, JCOL, JROW, M, N, NLP1
      REAL               DIFLJ, DIFRJ, DJ, DSIGJ, DSIGJP, TEMP
*     ..
*     .. External Subroutines ..
      EXTERNAL           ccopy, clacpy, clascl, csrot, csscal, sgemv,
     $                   xerbla
*     ..
*     .. External Functions ..
      REAL               SLAMC3, SNRM2
      EXTERNAL           slamc3, snrm2
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          aimag, cmplx, max, real
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
!     N = NL + NR + 1 is the minimum accepted for LDB, LDBX, LDGCOL
!     and LDGNUM in the checks below.
      n = nl + nr + 1
*
!     The tests form a single ELSE IF chain, so only the first failing
!     argument is reported.  The negative codes follow the "INFO = -i"
!     convention described for the INFO parameter.
!     NOTE(review): LDGNUM is compared with N here, whereas the
!     parameter description only asks for LDGNUM to be at least K.
      IF( ( icompq.LT.0 ) .OR. ( icompq.GT.1 ) ) THEN
         info = -1
      ELSE IF( nl.LT.1 ) THEN
         info = -2
      ELSE IF( nr.LT.1 ) THEN
         info = -3
      ELSE IF( ( sqre.LT.0 ) .OR. ( sqre.GT.1 ) ) THEN
         info = -4
      ELSE IF( nrhs.LT.1 ) THEN
         info = -5
      ELSE IF( ldb.LT.n ) THEN
         info = -7
      ELSE IF( ldbx.LT.n ) THEN
         info = -9
      ELSE IF( givptr.LT.0 ) THEN
         info = -11
      ELSE IF( ldgcol.LT.n ) THEN
         info = -13
      ELSE IF( ldgnum.LT.n ) THEN
         info = -15
      ELSE IF( k.LT.1 ) THEN
         info = -20
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CLALS0', -info )
         RETURN
      END IF
*
!     SQRE has passed the 0/1 check, so M is either N or N + 1.
      m = n + sqre
      nlp1 = nl + 1
*
      IF( icompq.EQ.0 ) THEN
*
*        Apply back orthogonal transformations from the left.
*
*        Step (1L): apply back the Givens rotations performed.
*
!        Rotations are replayed in stored order I = 1..GIVPTR.  Each
!        one acts on rows GIVCOL(I,2) and GIVCOL(I,1) of B across all
!        NRHS columns (stride LDB).  GIVNUM(I,2) and GIVNUM(I,1) fill
!        CSROT's last two arguments (presumably C then S - confirm
!        against CSROT).
         DO 10 i = 1, givptr
            CALL csrot( nrhs, b( givcol( i, 2 ), 1 ), ldb,
     $                  b( givcol( i, 1 ), 1 ), ldb, givnum( i, 2 ),
     $                  givnum( i, 1 ) )
   10    CONTINUE
*
*        Step (2L): permute rows of B.
*
!        Row NLP1 of B becomes row 1 of BX; rows 2..N of BX are
!        gathered from B through PERM.  PERM(1) is never read.
         CALL ccopy( nrhs, b( nlp1, 1 ), ldb, bx( 1, 1 ), ldbx )
         DO 20 i = 2, n
            CALL ccopy( nrhs, b( perm( i ), 1 ), ldb, bx( i, 1 ), ldbx )
   20    CONTINUE
*
*        Step (3L): apply the inverse of the left singular vector
*        matrix to BX.
*
         IF( k.EQ.1 ) THEN
!           Single undeflated value: row 1 of BX is copied to row 1 of
!           B and negated when Z(1) is negative.
            CALL ccopy( nrhs, bx, ldbx, b, ldb )
            IF( z( 1 ).LT.zero ) THEN
               CALL csscal( nrhs, negone, b, ldb )
            END IF
         ELSE
!           For each J a real length-K vector is built in RWORK(1:K)
!           and row J of B is formed from it and BX(1:K,1:NRHS).
            DO 100 j = 1, k
               diflj = difl( j )
               dj = poles( j, 1 )
               dsigj = -poles( j, 2 )
!              DIFRJ and DSIGJP are only needed by loop 40, which has
!              zero iterations when J = K, so they are left unset then.
               IF( j.LT.k ) THEN
                  difrj = -difr( j, 1 )
                  dsigjp = -poles( j+1, 2 )
               END IF
!              Component J.  Components with a zero Z or zero pole are
!              set to zero outright, which also avoids the divisions.
               IF( ( z( j ).EQ.zero ) .OR. ( poles( j, 2 ).EQ.zero ) )
     $              THEN
                  rwork( j ) = zero
               ELSE
                  rwork( j ) = -poles( j, 2 )*z( j ) / diflj /
     $                         ( poles( j, 2 )+dj )
               END IF
!              Components I < J.  The sum POLES(I,2) + DSIGJ is formed
!              through the external function SLAMC3 before DIFLJ is
!              subtracted (presumably to pin the evaluation order -
!              confirm against SLAMC3).
               DO 30 i = 1, j - 1
                  IF( ( z( i ).EQ.zero ) .OR.
     $                ( poles( i, 2 ).EQ.zero ) ) THEN
                     rwork( i ) = zero
                  ELSE
                     rwork( i ) = poles( i, 2 )*z( i ) /
     $                            ( slamc3( poles( i, 2 ), dsigj )-
     $                            diflj ) / ( poles( i, 2 )+dj )
                  END IF
   30          CONTINUE
!              Components I > J use DSIGJP and DIFRJ instead.
               DO 40 i = j + 1, k
                  IF( ( z( i ).EQ.zero ) .OR.
     $                ( poles( i, 2 ).EQ.zero ) ) THEN
                     rwork( i ) = zero
                  ELSE
                     rwork( i ) = poles( i, 2 )*z( i ) /
     $                            ( slamc3( poles( i, 2 ), dsigjp )+
     $                            difrj ) / ( poles( i, 2 )+dj )
                  END IF
   40          CONTINUE
!              The first component is overwritten with -1 regardless of
!              what the code above stored, then the norm is taken.
               rwork( 1 ) = negone
               temp = snrm2( k, rwork, 1 )
*
*              Since B and BX are complex, the following call to SGEMV
*              is performed in two steps (real and imaginary parts).
*
*              CALL SGEMV( 'T', K, NRHS, ONE, BX, LDBX, WORK, 1, ZERO,
*    $                     B( J, 1 ), LDB )
*
!              RWORK layout used from here on:
!                1        .. K            the vector built above
!                K+1      .. K+NRHS       real part of the product
!                K+NRHS+1 .. K+2*NRHS     imaginary part of the product
!                K+2*NRHS+1 .. K+2*NRHS+K*NRHS
!                                         real or imaginary part of
!                                         BX(1:K,1:NRHS), packed column
!                                         by column, leading dimension K
               i = k + nrhs*2
               DO 60 jcol = 1, nrhs
                  DO 50 jrow = 1, k
                     i = i + 1
                     rwork( i ) = real( bx( jrow, jcol ) )
   50             CONTINUE
   60          CONTINUE
               CALL sgemv( 'T', k, nrhs, one, rwork( 1+k+nrhs*2 ), k,
     $                     rwork( 1 ), 1, zero, rwork( 1+k ), 1 )
!              Same packed region, now refilled with imaginary parts.
               i = k + nrhs*2
               DO 80 jcol = 1, nrhs
                  DO 70 jrow = 1, k
                     i = i + 1
                     rwork( i ) = aimag( bx( jrow, jcol ) )
   70             CONTINUE
   80          CONTINUE
               CALL sgemv( 'T', k, nrhs, one, rwork( 1+k+nrhs*2 ), k,
     $                     rwork( 1 ), 1, zero, rwork( 1+k+nrhs ), 1 )
!              Recombine the two real results into row J of B.
               DO 90 jcol = 1, nrhs
                  b( j, jcol ) = cmplx( rwork( jcol+k ),
     $                           rwork( jcol+k+nrhs ) )
   90          CONTINUE
!              CLASCL receives TEMP and ONE as its scaling pair for the
!              1-by-NRHS row B(J,:); presumably this divides the row by
!              TEMP - confirm against CLASCL.
!              NOTE(review): INFO is handed to CLASCL as its status
!              argument, so on this path the INFO returned to the
!              caller is whatever the last CLASCL call left in it.
               CALL clascl( 'G', 0, 0, temp, one, 1, nrhs, b( j, 1 ),
     $                      ldb, info )
  100       CONTINUE
         END IF
*
*        Move the deflated rows of BX to B also.
*
!        M = N + SQRE >= N, so MAX( M, N ) equals M here.  The copy
!        covers N-K rows starting at row K+1.
         IF( k.LT.max( m, n ) )
     $      CALL clacpy( 'A', n-k, nrhs, bx( k+1, 1 ), ldbx,
     $                   b( k+1, 1 ), ldb )
      ELSE
*
*        Apply back the right orthogonal transformations.
*
*        Step (1R): apply back the new right singular vector matrix
*        to B.
*
         IF( k.EQ.1 ) THEN
!           Single undeflated value: row 1 of B is copied to BX as is.
            CALL ccopy( nrhs, b, ldb, bx, ldbx )
         ELSE
!           For each J a real length-K vector is built in RWORK(1:K)
!           and row J of BX is formed from it and B(1:K,1:NRHS).  All
!           three branches below are gated on Z(J), the entry for the
!           current J, and every nonzero component is divided by
!           DIFR(.,2).
            DO 180 j = 1, k
               dsigj = poles( j, 2 )
               IF( z( j ).EQ.zero ) THEN
                  rwork( j ) = zero
               ELSE
                  rwork( j ) = -z( j ) / difl( j ) /
     $                         ( dsigj+poles( j, 1 ) ) / difr( j, 2 )
               END IF
!              Components I < J use POLES(I+1,2) and DIFR(I,1).
               DO 110 i = 1, j - 1
                  IF( z( j ).EQ.zero ) THEN
                     rwork( i ) = zero
                  ELSE
                     rwork( i ) = z( j ) / ( slamc3( dsigj, -poles( i+1,
     $                            2 ) )-difr( i, 1 ) ) /
     $                            ( dsigj+poles( i, 1 ) ) / difr( i, 2 )
                  END IF
  110          CONTINUE
!              Components I > J use POLES(I,2) and DIFL(I).
               DO 120 i = j + 1, k
                  IF( z( j ).EQ.zero ) THEN
                     rwork( i ) = zero
                  ELSE
                     rwork( i ) = z( j ) / ( slamc3( dsigj, -poles( i,
     $                            2 ) )-difl( i ) ) /
     $                            ( dsigj+poles( i, 1 ) ) / difr( i, 2 )
                  END IF
  120          CONTINUE
*
*              Since B and BX are complex, the following call to SGEMV
*              is performed in two steps (real and imaginary parts).
*
*              CALL SGEMV( 'T', K, NRHS, ONE, B, LDB, WORK, 1, ZERO,
*    $                     BX( J, 1 ), LDBX )
*
!              Same RWORK layout as on the left-side path: vector in
!              1..K, real result in K+1..K+NRHS, imaginary result in
!              K+NRHS+1..K+2*NRHS, packed K-by-NRHS input after that.
               i = k + nrhs*2
               DO 140 jcol = 1, nrhs
                  DO 130 jrow = 1, k
                     i = i + 1
                     rwork( i ) = real( b( jrow, jcol ) )
  130             CONTINUE
  140          CONTINUE
               CALL sgemv( 'T', k, nrhs, one, rwork( 1+k+nrhs*2 ), k,
     $                     rwork( 1 ), 1, zero, rwork( 1+k ), 1 )
               i = k + nrhs*2
               DO 160 jcol = 1, nrhs
                  DO 150 jrow = 1, k
                     i = i + 1
                     rwork( i ) = aimag( b( jrow, jcol ) )
  150             CONTINUE
  160          CONTINUE
               CALL sgemv( 'T', k, nrhs, one, rwork( 1+k+nrhs*2 ), k,
     $                     rwork( 1 ), 1, zero, rwork( 1+k+nrhs ), 1 )
!              Recombine into row J of BX.  Unlike the left-side path
!              there is no SNRM2 / CLASCL rescaling here.
               DO 170 jcol = 1, nrhs
                  bx( j, jcol ) = cmplx( rwork( jcol+k ),
     $                            rwork( jcol+k+nrhs ) )
  170          CONTINUE
  180       CONTINUE
         END IF
*
*        Step (2R): if SQRE = 1, apply back the rotation that is
*        related to the right null space of the subproblem.
*
!        Row M of B is first copied into BX, then rows 1 and M of BX
!        are rotated with the scalar arguments C and S.
         IF( sqre.EQ.1 ) THEN
            CALL ccopy( nrhs, b( m, 1 ), ldb, bx( m, 1 ), ldbx )
            CALL csrot( nrhs, bx( 1, 1 ), ldbx, bx( m, 1 ), ldbx, c, s )
         END IF
!        Rows K+1..N of B are carried over to BX unchanged.
         IF( k.LT.max( m, n ) )
     $      CALL clacpy( 'A', n-k, nrhs, b( k+1, 1 ), ldb,
     $                   bx( k+1, 1 ), ldbx )
*
*        Step (3R): permute rows of B.
*
!        Scatter of BX back into B: row 1 goes to row NLP1, row M stays
!        at row M when SQRE = 1, and rows 2..N go to rows PERM(2..N).
         CALL ccopy( nrhs, bx( 1, 1 ), ldbx, b( nlp1, 1 ), ldb )
         IF( sqre.EQ.1 ) THEN
            CALL ccopy( nrhs, bx( m, 1 ), ldbx, b( m, 1 ), ldb )
         END IF
         DO 190 i = 2, n
            CALL ccopy( nrhs, bx( i, 1 ), ldbx, b( perm( i ), 1 ), ldb )
  190    CONTINUE
*
*        Step (4R): apply back the Givens rotations performed.
*
!        Compared with step (1L) the rotations run in reverse order
!        (GIVPTR down to 1) and the GIVNUM(I,1) argument is negated.
         DO 200 i = givptr, 1, -1
            CALL csrot( nrhs, b( givcol( i, 2 ), 1 ), ldb,
     $                  b( givcol( i, 1 ), 1 ), ldb, givnum( i, 2 ),
     $                  -givnum( i, 1 ) )
  200    CONTINUE
      END IF
*
      RETURN
*
*     End of CLALS0
*

◆ clalsa()

subroutine clalsa	(	integer	icompq,
		integer	smlsiz,
		integer	n,
		integer	nrhs,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldbx, * )	bx,
		integer	ldbx,
		real, dimension( ldu, * )	u,
		integer	ldu,
		real, dimension( ldu, * )	vt,
		integer, dimension( * )	k,
		real, dimension( ldu, * )	difl,
		real, dimension( ldu, * )	difr,
		real, dimension( ldu, * )	z,
		real, dimension( ldu, * )	poles,
		integer, dimension( * )	givptr,
		integer, dimension( ldgcol, * )	givcol,
		integer	ldgcol,
		integer, dimension( ldgcol, * )	perm,
		real, dimension( ldu, * )	givnum,
		real, dimension( * )	c,
		real, dimension( * )	s,
		real, dimension( * )	rwork,
		integer, dimension( * )	iwork,
		integer	info )

CLALSA computes the SVD of the coefficient matrix in compact form. Used by cgelsd.

Download CLALSA + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CLALSA is an intermediate step in solving the least squares problem
!> by computing the SVD of the coefficient matrix in compact form (The
!> singular vectors are computed as products of simple orthogonal
!> matrices.).
!>
!> If ICOMPQ = 0, CLALSA applies the inverse of the left singular vector
!> matrix of an upper bidiagonal matrix to the right hand side; and if
!> ICOMPQ = 1, CLALSA applies the right singular vector matrix to the
!> right hand side. The singular vector matrices were generated in
!> compact form by CLALSA.
!>

Parameters

[in]	ICOMPQ	!> ICOMPQ is INTEGER !> Specifies whether the left or the right singular vector !> matrix is involved. !> = 0: Left singular vector matrix !> = 1: Right singular vector matrix !>
[in]	SMLSIZ	!> SMLSIZ is INTEGER !> The maximum size of the subproblems at the bottom of the !> computation tree. !>
[in]	N	!> N is INTEGER !> The row and column dimensions of the upper bidiagonal matrix. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of columns of B and BX. NRHS must be at least 1. !>
[in,out]	B	!> B is COMPLEX array, dimension ( LDB, NRHS ) !> On input, B contains the right hand sides of the least !> squares problem in rows 1 through M. !> On output, B contains the solution X in rows 1 through N. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of B in the calling subprogram. !> LDB must be at least max(1,MAX( M, N ) ). !>
[out]	BX	!> BX is COMPLEX array, dimension ( LDBX, NRHS ) !> On exit, the result of applying the left or right singular !> vector matrix to B. !>
[in]	LDBX	!> LDBX is INTEGER !> The leading dimension of BX. !>
[in]	U	!> U is REAL array, dimension ( LDU, SMLSIZ ). !> On entry, U contains the left singular vector matrices of all !> subproblems at the bottom level. !>
[in]	LDU	!> LDU is INTEGER, LDU >= N. !> The leading dimension of arrays U, VT, DIFL, DIFR, !> POLES, GIVNUM, and Z. !>
[in]	VT	!> VT is REAL array, dimension ( LDU, SMLSIZ+1 ). !> On entry, VT**H contains the right singular vector matrices of !> all subproblems at the bottom level. !>
[in]	K	!> K is INTEGER array, dimension ( N ). !>
[in]	DIFL	!> DIFL is REAL array, dimension ( LDU, NLVL ). !> where NLVL = INT(log_2 (N/(SMLSIZ+1))) + 1. !>
[in]	DIFR	!> DIFR is REAL array, dimension ( LDU, 2 * NLVL ). !> On entry, DIFL(*, I) and DIFR(*, 2 * I -1) record !> distances between singular values on the I-th level and !> singular values on the (I -1)-th level, and DIFR(*, 2 * I) !> record the normalizing factors of the right singular vectors !> matrices of subproblems on I-th level. !>
[in]	Z	!> Z is REAL array, dimension ( LDU, NLVL ). !> On entry, Z(1, I) contains the components of the deflation- !> adjusted updating row vector for subproblems on the I-th !> level. !>
[in]	POLES	!> POLES is REAL array, dimension ( LDU, 2 * NLVL ). !> On entry, POLES(*, 2 * I -1: 2 * I) contains the new and old !> singular values involved in the secular equations on the I-th !> level. !>
[in]	GIVPTR	!> GIVPTR is INTEGER array, dimension ( N ). !> On entry, GIVPTR( I ) records the number of Givens !> rotations performed on the I-th problem on the computation !> tree. !>
[in]	GIVCOL	!> GIVCOL is INTEGER array, dimension ( LDGCOL, 2 * NLVL ). !> On entry, for each I, GIVCOL(*, 2 * I - 1: 2 * I) records the !> locations of Givens rotations performed on the I-th level on !> the computation tree. !>
[in]	LDGCOL	!> LDGCOL is INTEGER, LDGCOL >= N. !> The leading dimension of arrays GIVCOL and PERM. !>
[in]	PERM	!> PERM is INTEGER array, dimension ( LDGCOL, NLVL ). !> On entry, PERM(*, I) records permutations done on the I-th !> level of the computation tree. !>
[in]	GIVNUM	!> GIVNUM is REAL array, dimension ( LDU, 2 * NLVL ). !> On entry, GIVNUM(*, 2 * I -1 : 2 * I) records the C- and S- !> values of Givens rotations performed on the I-th level on the !> computation tree. !>
[in]	C	!> C is REAL array, dimension ( N ). !> On entry, if the I-th subproblem is not square, !> C( I ) contains the C-value of a Givens rotation related to !> the right null space of the I-th subproblem. !>
[in]	S	!> S is REAL array, dimension ( N ). !> On entry, if the I-th subproblem is not square, !> S( I ) contains the S-value of a Givens rotation related to !> the right null space of the I-th subproblem. !>
[out]	RWORK	!> RWORK is REAL array, dimension at least !> MAX( (SMLSIZ+1)*NRHS*3, N*(1+NRHS) + 2*NRHS ). !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (3*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Ming Gu and Ren-Cang Li, Computer Science Division, University of California at Berkeley, USA
Osni Marques, LBNL/NERSC, USA

Definition at line 263 of file clalsa.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
!     Body of CLALSA (the SUBROUTINE statement is not part of this
!     listing).  It walks the computation tree described by SLASDT and
!     applies either the left (ICOMPQ = 0) or the right (ICOMPQ = 1)
!     singular vector factors to the complex right-hand sides.  Nodes
!     I = (ND+1)/2 .. ND use the explicit real matrices U / VT through
!     SGEMM; the nodes on levels 1 .. NLVL are handled by CLALS0.
!     On both paths the last writes go to BX.
*     .. Scalar Arguments ..
      INTEGER            ICOMPQ, INFO, LDB, LDBX, LDGCOL, LDU, N, NRHS,
     $                   SMLSIZ
*     ..
*     .. Array Arguments ..
      INTEGER            GIVCOL( LDGCOL, * ), GIVPTR( * ), IWORK( * ),
     $                   K( * ), PERM( LDGCOL, * )
      REAL               C( * ), DIFL( LDU, * ), DIFR( LDU, * ),
     $                   GIVNUM( LDU, * ), POLES( LDU, * ), RWORK( * ),
     $                   S( * ), U( LDU, * ), VT( LDU, * ), Z( LDU, * )
      COMPLEX            B( LDB, * ), BX( LDBX, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE
      parameter( zero = 0.0e0, one = 1.0e0 )
*     ..
*     .. Local Scalars ..
!     INODE, NDIML, NDIMR : start offsets of three sections of IWORK.
!     NLVL, ND            : outputs of SLASDT, used below as the number
!                           of tree levels and the number of nodes.
!     IC, NL, NR          : per-node entries read from those sections.
!     NLF, NRF            : first row of the left / right sub-block.
!     J                   : RWORK cursor in the SGEMM sections, node
!                           counter in the CLALS0 loops.
      INTEGER            I, I1, IC, IM1, INODE, J, JCOL, JIMAG, JREAL,
     $                   JROW, LF, LL, LVL, LVL2, ND, NDB1, NDIML,
     $                   NDIMR, NL, NLF, NLP1, NLVL, NR, NRF, NRP1, SQRE
*     ..
*     .. External Subroutines ..
      EXTERNAL           ccopy, clals0, sgemm, slasdt, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          aimag, cmplx, real
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
!     Single ELSE IF chain: only the first failing argument is
!     reported, as minus its position in the argument list.
      IF( ( icompq.LT.0 ) .OR. ( icompq.GT.1 ) ) THEN
         info = -1
      ELSE IF( smlsiz.LT.3 ) THEN
         info = -2
      ELSE IF( n.LT.smlsiz ) THEN
         info = -3
      ELSE IF( nrhs.LT.1 ) THEN
         info = -4
      ELSE IF( ldb.LT.n ) THEN
         info = -6
      ELSE IF( ldbx.LT.n ) THEN
         info = -8
      ELSE IF( ldu.LT.n ) THEN
         info = -10
      ELSE IF( ldgcol.LT.n ) THEN
         info = -19
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CLALSA', -info )
         RETURN
      END IF
*
*     Book-keeping and  setting up the computation tree.
*
!     IWORK is split into three sections that start N entries apart:
!     IWORK(1:N), IWORK(N+1:2*N) and IWORK(2*N+1:3*N).  They are read
!     below as IC, NL and NR of each node.
      inode = 1
      ndiml = inode + n
      ndimr = ndiml + n
*
      CALL slasdt( n, nlvl, nd, iwork( inode ), iwork( ndiml ),
     $             iwork( ndimr ), smlsiz )
*
*     The following code applies back the left singular vector factors.
*     For applying back the right singular vector factors, go to 170.
*
      IF( icompq.EQ.1 ) THEN
         GO TO 170
      END IF
*
*     The nodes on the bottom level of the tree were solved
*     by SLASDQ. The corresponding left and right singular vector
*     matrices are in explicit form. First apply back the left
*     singular vector matrices.
*
!     Only nodes NDB1 .. ND are visited by this loop.
      ndb1 = ( nd+1 ) / 2
      DO 130 i = ndb1, nd
*
*        IC : center row of each node
*        NL : number of rows of left  subproblem
*        NR : number of rows of right subproblem
*        NLF: starting row of the left   subproblem
*        NRF: starting row of the right  subproblem
*
         i1 = i - 1
         ic = iwork( inode+i1 )
         nl = iwork( ndiml+i1 )
         nr = iwork( ndimr+i1 )
         nlf = ic - nl
         nrf = ic + 1
*
*        Since B and BX are complex, the following call to SGEMM
*        is performed in two steps (real and imaginary parts).
*
*        CALL SGEMM( 'T', 'N', NL, NRHS, NL, ONE, U( NLF, 1 ), LDU,
*     $               B( NLF, 1 ), LDB, ZERO, BX( NLF, 1 ), LDBX )
*
!        RWORK layout for the left sub-block (P = NL*NRHS):
!          1     .. P      real part of the product
!          P+1   .. 2*P    imaginary part of the product
!          2*P+1 .. 3*P    real or imaginary part of B(NLF:NLF+NL-1,:),
!                          packed column by column, leading dimension NL
         j = nl*nrhs*2
         DO 20 jcol = 1, nrhs
            DO 10 jrow = nlf, nlf + nl - 1
               j = j + 1
               rwork( j ) = real( b( jrow, jcol ) )
   10       CONTINUE
   20    CONTINUE
         CALL sgemm( 'T', 'N', nl, nrhs, nl, one, u( nlf, 1 ), ldu,
     $               rwork( 1+nl*nrhs*2 ), nl, zero, rwork( 1 ), nl )
!        Same packed region, refilled with the imaginary parts.
         j = nl*nrhs*2
         DO 40 jcol = 1, nrhs
            DO 30 jrow = nlf, nlf + nl - 1
               j = j + 1
               rwork( j ) = aimag( b( jrow, jcol ) )
   30       CONTINUE
   40    CONTINUE
         CALL sgemm( 'T', 'N', nl, nrhs, nl, one, u( nlf, 1 ), ldu,
     $               rwork( 1+nl*nrhs*2 ), nl, zero, rwork( 1+nl*nrhs ),
     $               nl )
!        JREAL and JIMAG walk the two result regions in step and the
!        pairs are recombined into rows NLF .. NLF+NL-1 of BX.
         jreal = 0
         jimag = nl*nrhs
         DO 60 jcol = 1, nrhs
            DO 50 jrow = nlf, nlf + nl - 1
               jreal = jreal + 1
               jimag = jimag + 1
               bx( jrow, jcol ) = cmplx( rwork( jreal ),
     $                            rwork( jimag ) )
   50       CONTINUE
   60    CONTINUE
*
*        Since B and BX are complex, the following call to SGEMM
*        is performed in two steps (real and imaginary parts).
*
*        CALL SGEMM( 'T', 'N', NR, NRHS, NR, ONE, U( NRF, 1 ), LDU,
*    $               B( NRF, 1 ), LDB, ZERO, BX( NRF, 1 ), LDBX )
*
!        Right sub-block: identical scheme with NR rows starting at
!        row NRF; RWORK is reused from position 1.
         j = nr*nrhs*2
         DO 80 jcol = 1, nrhs
            DO 70 jrow = nrf, nrf + nr - 1
               j = j + 1
               rwork( j ) = real( b( jrow, jcol ) )
   70       CONTINUE
   80    CONTINUE
         CALL sgemm( 'T', 'N', nr, nrhs, nr, one, u( nrf, 1 ), ldu,
     $               rwork( 1+nr*nrhs*2 ), nr, zero, rwork( 1 ), nr )
         j = nr*nrhs*2
         DO 100 jcol = 1, nrhs
            DO 90 jrow = nrf, nrf + nr - 1
               j = j + 1
               rwork( j ) = aimag( b( jrow, jcol ) )
   90       CONTINUE
  100    CONTINUE
         CALL sgemm( 'T', 'N', nr, nrhs, nr, one, u( nrf, 1 ), ldu,
     $               rwork( 1+nr*nrhs*2 ), nr, zero, rwork( 1+nr*nrhs ),
     $               nr )
         jreal = 0
         jimag = nr*nrhs
         DO 120 jcol = 1, nrhs
            DO 110 jrow = nrf, nrf + nr - 1
               jreal = jreal + 1
               jimag = jimag + 1
               bx( jrow, jcol ) = cmplx( rwork( jreal ),
     $                            rwork( jimag ) )
  110       CONTINUE
  120    CONTINUE
*
  130 CONTINUE
*
*     Next copy the rows of B that correspond to unchanged rows
*     in the bidiagonal matrix to BX.
*
!     Row IC of every node 1 .. ND is copied; the SGEMM loop above
!     wrote rows IC-NL..IC-1 and IC+1..IC+NR but never row IC itself.
      DO 140 i = 1, nd
         ic = iwork( inode+i-1 )
         CALL ccopy( nrhs, b( ic, 1 ), ldb, bx( ic, 1 ), ldbx )
  140 CONTINUE
*
*     Finally go through the left singular vector matrices of all
*     the other subproblems bottom-up on the tree.
*
!     J counts down from 2**NLVL - 1 and indexes GIVPTR, K, C and S.
!     SQRE stays 0 for every CLALS0 call on this path.
      j = 2**nlvl
      sqre = 0
*
      DO 160 lvl = nlvl, 1, -1
!        Columns LVL2 and LVL2+1 = 2*LVL of the two-column-per-level
!        arrays (GIVCOL, GIVNUM, POLES, DIFR) belong to level LVL.
         lvl2 = 2*lvl - 1
*
*        find the first node LF and last node LL on
*        the current level LVL
*
         IF( lvl.EQ.1 ) THEN
            lf = 1
            ll = 1
         ELSE
            lf = 2**( lvl-1 )
            ll = 2*lf - 1
         END IF
         DO 150 i = lf, ll
            im1 = i - 1
            ic = iwork( inode+im1 )
            nl = iwork( ndiml+im1 )
            nr = iwork( ndimr+im1 )
            nlf = ic - nl
!           NRF is assigned here but not referenced inside this loop.
            nrf = ic + 1
            j = j - 1
!           The array roles are swapped relative to CLALS0's argument
!           names: BX is passed in the B position and B in the BX
!           position.  LDU is passed in the LDGNUM position.
!           NOTE(review): INFO is overwritten by every call and is not
!           tested afterwards.
            CALL clals0( icompq, nl, nr, sqre, nrhs, bx( nlf, 1 ), ldbx,
     $                   b( nlf, 1 ), ldb, perm( nlf, lvl ),
     $                   givptr( j ), givcol( nlf, lvl2 ), ldgcol,
     $                   givnum( nlf, lvl2 ), ldu, poles( nlf, lvl2 ),
     $                   difl( nlf, lvl ), difr( nlf, lvl2 ),
     $                   z( nlf, lvl ), k( j ), c( j ), s( j ), rwork,
     $                   info )
  150    CONTINUE
  160 CONTINUE
!     Left-side path finished; skip the ICOMPQ = 1 code.
      GO TO 330
*
*     ICOMPQ = 1: applying back the right singular vector factors.
*
  170 CONTINUE
*
*     First now go through the right singular vector matrices of all
*     the tree nodes top-down.
*
!     J counts up from 1 on this path.  Levels run 1 .. NLVL and the
!     nodes of each level are visited from LL down to LF.
      j = 0
      DO 190 lvl = 1, nlvl
         lvl2 = 2*lvl - 1
*
*        Find the first node LF and last node LL on
*        the current level LVL.
*
         IF( lvl.EQ.1 ) THEN
            lf = 1
            ll = 1
         ELSE
            lf = 2**( lvl-1 )
            ll = 2*lf - 1
         END IF
         DO 180 i = ll, lf, -1
            im1 = i - 1
            ic = iwork( inode+im1 )
            nl = iwork( ndiml+im1 )
            nr = iwork( ndimr+im1 )
            nlf = ic - nl
!           NRF is assigned here but not referenced inside this loop.
            nrf = ic + 1
!           Only the last node of a level (I = LL) is passed SQRE = 0;
!           every other node is passed SQRE = 1.
            IF( i.EQ.ll ) THEN
               sqre = 0
            ELSE
               sqre = 1
            END IF
            j = j + 1
!           Here B and BX are passed in CLALS0's own B / BX positions.
!           INFO is again overwritten by each call and not tested.
            CALL clals0( icompq, nl, nr, sqre, nrhs, b( nlf, 1 ), ldb,
     $                   bx( nlf, 1 ), ldbx, perm( nlf, lvl ),
     $                   givptr( j ), givcol( nlf, lvl2 ), ldgcol,
     $                   givnum( nlf, lvl2 ), ldu, poles( nlf, lvl2 ),
     $                   difl( nlf, lvl ), difr( nlf, lvl2 ),
     $                   z( nlf, lvl ), k( j ), c( j ), s( j ), rwork,
     $                   info )
  180    CONTINUE
  190 CONTINUE
*
*     The nodes on the bottom level of the tree were solved
*     by SLASDQ. The corresponding right singular vector
*     matrices are in explicit form. Apply them back.
*
      ndb1 = ( nd+1 ) / 2
      DO 320 i = ndb1, nd
         i1 = i - 1
         ic = iwork( inode+i1 )
         nl = iwork( ndiml+i1 )
         nr = iwork( ndimr+i1 )
!        The left block spans NL+1 rows, NLF .. IC.  The right block
!        spans NR+1 rows except for the last node (I = ND), where it
!        spans NR rows.
         nlp1 = nl + 1
         IF( i.EQ.nd ) THEN
            nrp1 = nr
         ELSE
            nrp1 = nr + 1
         END IF
         nlf = ic - nl
         nrf = ic + 1
*
*        Since B and BX are complex, the following call to SGEMM is
*        performed in two steps (real and imaginary parts).
*
*        CALL SGEMM( 'T', 'N', NLP1, NRHS, NLP1, ONE, VT( NLF, 1 ), LDU,
*    $               B( NLF, 1 ), LDB, ZERO, BX( NLF, 1 ), LDBX )
*
!        RWORK layout (P = NLP1*NRHS): real result in 1..P, imaginary
!        result in P+1..2*P, packed input in 2*P+1..3*P.
         j = nlp1*nrhs*2
         DO 210 jcol = 1, nrhs
            DO 200 jrow = nlf, nlf + nlp1 - 1
               j = j + 1
               rwork( j ) = real( b( jrow, jcol ) )
  200       CONTINUE
  210    CONTINUE
         CALL sgemm( 'T', 'N', nlp1, nrhs, nlp1, one, vt( nlf, 1 ), ldu,
     $               rwork( 1+nlp1*nrhs*2 ), nlp1, zero, rwork( 1 ),
     $               nlp1 )
         j = nlp1*nrhs*2
         DO 230 jcol = 1, nrhs
            DO 220 jrow = nlf, nlf + nlp1 - 1
               j = j + 1
               rwork( j ) = aimag( b( jrow, jcol ) )
  220       CONTINUE
  230    CONTINUE
         CALL sgemm( 'T', 'N', nlp1, nrhs, nlp1, one, vt( nlf, 1 ), ldu,
     $               rwork( 1+nlp1*nrhs*2 ), nlp1, zero,
     $               rwork( 1+nlp1*nrhs ), nlp1 )
!        Recombine into rows NLF .. NLF+NLP1-1 of BX.
         jreal = 0
         jimag = nlp1*nrhs
         DO 250 jcol = 1, nrhs
            DO 240 jrow = nlf, nlf + nlp1 - 1
               jreal = jreal + 1
               jimag = jimag + 1
               bx( jrow, jcol ) = cmplx( rwork( jreal ),
     $                            rwork( jimag ) )
  240       CONTINUE
  250    CONTINUE
*
*        Since B and BX are complex, the following call to SGEMM is
*        performed in two steps (real and imaginary parts).
*
*        CALL SGEMM( 'T', 'N', NRP1, NRHS, NRP1, ONE, VT( NRF, 1 ), LDU,
*    $               B( NRF, 1 ), LDB, ZERO, BX( NRF, 1 ), LDBX )
*
!        Right block: same scheme with NRP1 rows starting at row NRF.
         j = nrp1*nrhs*2
         DO 270 jcol = 1, nrhs
            DO 260 jrow = nrf, nrf + nrp1 - 1
               j = j + 1
               rwork( j ) = real( b( jrow, jcol ) )
  260       CONTINUE
  270    CONTINUE
         CALL sgemm( 'T', 'N', nrp1, nrhs, nrp1, one, vt( nrf, 1 ), ldu,
     $               rwork( 1+nrp1*nrhs*2 ), nrp1, zero, rwork( 1 ),
     $               nrp1 )
         j = nrp1*nrhs*2
         DO 290 jcol = 1, nrhs
            DO 280 jrow = nrf, nrf + nrp1 - 1
               j = j + 1
               rwork( j ) = aimag( b( jrow, jcol ) )
  280       CONTINUE
  290    CONTINUE
         CALL sgemm( 'T', 'N', nrp1, nrhs, nrp1, one, vt( nrf, 1 ), ldu,
     $               rwork( 1+nrp1*nrhs*2 ), nrp1, zero,
     $               rwork( 1+nrp1*nrhs ), nrp1 )
         jreal = 0
         jimag = nrp1*nrhs
         DO 310 jcol = 1, nrhs
            DO 300 jrow = nrf, nrf + nrp1 - 1
               jreal = jreal + 1
               jimag = jimag + 1
               bx( jrow, jcol ) = cmplx( rwork( jreal ),
     $                            rwork( jimag ) )
  300       CONTINUE
  310    CONTINUE
*
  320 CONTINUE
*
!     Common exit label for both paths.
  330 CONTINUE
*
      RETURN
*
*     End of CLALSA
*

◆ clalsd()

subroutine clalsd	(	character	uplo,
		integer	smlsiz,
		integer	n,
		integer	nrhs,
		real, dimension( * )	d,
		real, dimension( * )	e,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		real	rcond,
		integer	rank,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer, dimension( * )	iwork,
		integer	info )

CLALSD uses the singular value decomposition of A to solve the least squares problem.

Download CLALSD + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CLALSD uses the singular value decomposition of A to solve the least
!> squares problem of finding X to minimize the Euclidean norm of each
!> column of A*X-B, where A is N-by-N upper bidiagonal, and X and B
!> are N-by-NRHS. The solution X overwrites B.
!>
!> The singular values of A smaller than RCOND times the largest
!> singular value are treated as zero in solving the least squares
!> problem; in this case a minimum norm solution is returned.
!> The actual singular values are returned in D in ascending order.
!>
!> This code makes very mild assumptions about floating point
!> arithmetic. It will work on machines with a guard digit in
!> add/subtract, or on those binary machines without guard digits
!> which subtract like the Cray XMP, Cray YMP, Cray C 90, or Cray 2.
!> It could conceivably fail on hexadecimal or decimal machines
!> without guard digits, but we know of none.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': D and E define an upper bidiagonal matrix. !> = 'L': D and E define a lower bidiagonal matrix. !>
[in]	SMLSIZ	!> SMLSIZ is INTEGER !> The maximum size of the subproblems at the bottom of the !> computation tree. !>
[in]	N	!> N is INTEGER !> The dimension of the bidiagonal matrix. N >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of columns of B. NRHS must be at least 1. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry D contains the main diagonal of the bidiagonal !> matrix. On exit, if INFO = 0, D contains its singular values. !>
[in,out]	E	!> E is REAL array, dimension (N-1) !> Contains the super-diagonal entries of the bidiagonal matrix. !> On exit, E has been destroyed. !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> On input, B contains the right hand sides of the least !> squares problem. On output, B contains the solution X. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of B in the calling subprogram. !> LDB must be at least max(1,N). !>
[in]	RCOND	!> RCOND is REAL !> The singular values of A less than or equal to RCOND times !> the largest singular value are treated as zero in solving !> the least squares problem. If RCOND is negative, !> machine precision is used instead. !> For example, if diag(S)*X=B were the least squares problem, !> where diag(S) is a diagonal matrix of singular values, the !> solution would be X(i) = B(i) / S(i) if S(i) is greater than !> RCOND*max(S), and X(i) = 0 if S(i) is less than or equal to !> RCOND*max(S). !>
[out]	RANK	!> RANK is INTEGER !> The number of singular values of A greater than RCOND times !> the largest singular value. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (N * NRHS). !>
[out]	RWORK	!> RWORK is REAL array, dimension at least !> ( 9*N + 2*N*SMLSIZ + 8*N*NLVL + 3*SMLSIZ*NRHS + !> MAX( (SMLSIZ+1)**2, N*(1+NRHS) + 2*NRHS ) ), !> where !> NLVL = MAX( 0, INT( LOG_2( MIN( M,N )/(SMLSIZ+1) ) ) + 1 ) !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (3*N*NLVL + 11*N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: The algorithm failed to compute a singular value while !> working on the submatrix lying in rows and columns !> INFO/(N+1) through MOD(INFO,N+1). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Ming Gu and Ren-Cang Li, Computer Science Division, University of California at Berkeley, USA
Osni Marques, LBNL/NERSC, USA

Definition at line 184 of file clalsd.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Summary of this listing: solve the least squares problem for an
*  N-by-N bidiagonal matrix (diagonal D, off-diagonal E) through its
*  singular value decomposition.  B is overwritten by the solution,
*  D by the singular values and RANK by the number of singular values
*  larger than RCND times the largest one.  A problem with
*  N <= SMLSIZ is handed to SLASDQ directly; a larger one is split
*  wherever |E(i)| < EPS and each piece is solved by SLASDQ or by the
*  divide and conquer pair SLASDA / CLALSA.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDB, N, NRHS, RANK, SMLSIZ
      REAL               RCOND
*     ..
*     .. Array Arguments ..
      INTEGER            IWORK( * )
      REAL               D( * ), E( * ), RWORK( * )
      COMPLEX            B( LDB, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE, TWO
      parameter( zero = 0.0e0, one = 1.0e0, two = 2.0e0 )
      COMPLEX            CZERO
      parameter( czero = ( 0.0e0, 0.0e0 ) )
*     ..
*     .. Local Scalars ..
      INTEGER            BX, BXST, C, DIFL, DIFR, GIVCOL, GIVNUM,
     $                   GIVPTR, I, ICMPQ1, ICMPQ2, IRWB, IRWIB, IRWRB,
     $                   IRWU, IRWVT, IRWWRK, IWK, J, JCOL, JIMAG,
     $                   JREAL, JROW, K, NLVL, NM1, NRWORK, NSIZE, NSUB,
     $                   PERM, POLES, S, SIZEI, SMLSZP, SQRE, ST, ST1,
     $                   U, VT, Z
      REAL               CS, EPS, ORGNRM, R, RCND, SN, TOL
*     ..
*     .. External Functions ..
      INTEGER            ISAMAX
      REAL               SLAMCH, SLANST
      EXTERNAL           isamax, slamch, slanst
*     ..
*     .. External Subroutines ..
      EXTERNAL           ccopy, clacpy, clalsa, clascl, claset, csrot,
     $                   sgemm, slartg, slascl, slasda, slasdq, slaset,
     $                   slasrt, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, cmplx, int, log, real, sign
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*     Only N, NRHS and LDB are validated; the negative INFO values
*     follow the "INFO = -i" convention of the INFO documentation.
*     UPLO and SMLSIZ are not checked here.
*
      info = 0
*
      IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( nrhs.LT.1 ) THEN
         info = -4
      ELSE IF( ( ldb.LT.1 ) .OR. ( ldb.LT.n ) ) THEN
         info = -8
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CLALSD', -info )
         RETURN
      END IF
*
      eps = slamch( 'Epsilon' )
*
*     Set up the tolerance.
*     An RCOND outside the open interval (0,1) is replaced by EPS.
*
      IF( ( rcond.LE.zero ) .OR. ( rcond.GE.one ) ) THEN
         rcnd = eps
      ELSE
         rcnd = rcond
      END IF
*
      rank = 0
*
*     Quick return if possible.
*     For N = 1 the row of B is either zeroed (D(1) exactly zero,
*     RANK stays 0) or scaled by ONE/D(1); D(1) is then made
*     non-negative.
*
      IF( n.EQ.0 ) THEN
         RETURN
      ELSE IF( n.EQ.1 ) THEN
         IF( d( 1 ).EQ.zero ) THEN
            CALL claset( 'A', 1, nrhs, czero, czero, b, ldb )
         ELSE
            rank = 1
            CALL clascl( 'G', 0, 0, d( 1 ), one, 1, nrhs, b, ldb, info )
            d( 1 ) = abs( d( 1 ) )
         END IF
         RETURN
      END IF
*
*     Rotate the matrix if it is lower bidiagonal.
*     With a single right hand side every rotation is applied to B
*     at once; otherwise the (CS,SN) pairs are stored in
*     RWORK(1:2*(N-1)) and replayed on each column of B afterwards.
*     NOTE(review): UPLO is compared with the literal 'L' only, so a
*     lower-case 'l' would take the upper bidiagonal path -- confirm
*     that callers always pass an upper-case character.
*
      IF( uplo.EQ.'L' ) THEN
         DO 10 i = 1, n - 1
            CALL slartg( d( i ), e( i ), cs, sn, r )
            d( i ) = r
            e( i ) = sn*d( i+1 )
            d( i+1 ) = cs*d( i+1 )
            IF( nrhs.EQ.1 ) THEN
               CALL csrot( 1, b( i, 1 ), 1, b( i+1, 1 ), 1, cs, sn )
            ELSE
               rwork( i*2-1 ) = cs
               rwork( i*2 ) = sn
            END IF
   10    CONTINUE
         IF( nrhs.GT.1 ) THEN
            DO 30 i = 1, nrhs
               DO 20 j = 1, n - 1
                  cs = rwork( j*2-1 )
                  sn = rwork( j*2 )
                  CALL csrot( 1, b( j, i ), 1, b( j+1, i ), 1, cs, sn )
   20          CONTINUE
   30       CONTINUE
         END IF
      END IF
*
*     Scale.
*     D and E are scaled by ONE/ORGNRM; the scaling is undone on D
*     and on B just before each normal return.  A zero norm means
*     the matrix is zero, so the solution is set to zero.
*
      nm1 = n - 1
      orgnrm = slanst( 'M', n, d, e )
      IF( orgnrm.EQ.zero ) THEN
         CALL claset( 'A', n, nrhs, czero, czero, b, ldb )
         RETURN
      END IF
*
      CALL slascl( 'G', 0, 0, orgnrm, one, n, 1, d, n, info )
      CALL slascl( 'G', 0, 0, orgnrm, one, nm1, 1, e, nm1, info )
*
*     If N is smaller than the minimum divide size SMLSIZ, then solve
*     the problem with another solver.
*
*     RWORK layout for this path: the N*N matrix at IRWU, the N*N
*     matrix at IRWVT, then the real-part result (IRWRB) and the
*     imaginary-part result (IRWIB), N*NRHS entries each, followed by
*     the staging buffer IRWB.  IRWRB starts at the same position as
*     the SLASDQ scratch area IRWWRK.
*
      IF( n.LE.smlsiz ) THEN
         irwu = 1
         irwvt = irwu + n*n
         irwwrk = irwvt + n*n
         irwrb = irwwrk
         irwib = irwrb + n*nrhs
         irwb = irwib + n*nrhs
         CALL slaset( 'A', n, n, zero, one, rwork( irwu ), n )
         CALL slaset( 'A', n, n, zero, one, rwork( irwvt ), n )
         CALL slasdq( 'U', 0, n, n, n, 0, d, e, rwork( irwvt ), n,
     $                rwork( irwu ), n, rwork( irwwrk ), 1,
     $                rwork( irwwrk ), info )
*        A nonzero INFO from SLASDQ is passed back unchanged.
         IF( info.NE.0 ) THEN
            RETURN
         END IF
*
*        In the real version, B is passed to SLASDQ and multiplied
*        internally by Q**H. Here B is complex and that product is
*        computed below in two steps (real and imaginary parts).
*
         j = irwb - 1
         DO 50 jcol = 1, nrhs
            DO 40 jrow = 1, n
               j = j + 1
               rwork( j ) = real( b( jrow, jcol ) )
   40       CONTINUE
   50    CONTINUE
         CALL sgemm( 'T', 'N', n, nrhs, n, one, rwork( irwu ), n,
     $               rwork( irwb ), n, zero, rwork( irwrb ), n )
         j = irwb - 1
         DO 70 jcol = 1, nrhs
            DO 60 jrow = 1, n
               j = j + 1
               rwork( j ) = aimag( b( jrow, jcol ) )
   60       CONTINUE
   70    CONTINUE
         CALL sgemm( 'T', 'N', n, nrhs, n, one, rwork( irwu ), n,
     $               rwork( irwb ), n, zero, rwork( irwib ), n )
         jreal = irwrb - 1
         jimag = irwib - 1
         DO 90 jcol = 1, nrhs
            DO 80 jrow = 1, n
               jreal = jreal + 1
               jimag = jimag + 1
               b( jrow, jcol ) = cmplx( rwork( jreal ), rwork( jimag ) )
   80       CONTINUE
   90    CONTINUE
*
*        Rows of B that belong to singular values not larger than TOL
*        are zeroed; the others are scaled by ONE/D(I) and counted in
*        RANK.
*
         tol = rcnd*abs( d( isamax( n, d, 1 ) ) )
         DO 100 i = 1, n
            IF( d( i ).LE.tol ) THEN
               CALL claset( 'A', 1, nrhs, czero, czero, b( i, 1 ), ldb )
            ELSE
               CALL clascl( 'G', 0, 0, d( i ), one, 1, nrhs, b( i, 1 ),
     $                      ldb, info )
               rank = rank + 1
            END IF
  100    CONTINUE
*
*        Since B is complex, the following call to SGEMM is performed
*        in two steps (real and imaginary parts). That is for V * B
*        (in the real version of the code V**H is stored in WORK).
*
*        CALL SGEMM( 'T', 'N', N, NRHS, N, ONE, WORK, N, B, LDB, ZERO,
*    $               WORK( NWORK ), N )
*
         j = irwb - 1
         DO 120 jcol = 1, nrhs
            DO 110 jrow = 1, n
               j = j + 1
               rwork( j ) = real( b( jrow, jcol ) )
  110       CONTINUE
  120    CONTINUE
         CALL sgemm( 'T', 'N', n, nrhs, n, one, rwork( irwvt ), n,
     $               rwork( irwb ), n, zero, rwork( irwrb ), n )
         j = irwb - 1
         DO 140 jcol = 1, nrhs
            DO 130 jrow = 1, n
               j = j + 1
               rwork( j ) = aimag( b( jrow, jcol ) )
  130       CONTINUE
  140    CONTINUE
         CALL sgemm( 'T', 'N', n, nrhs, n, one, rwork( irwvt ), n,
     $               rwork( irwb ), n, zero, rwork( irwib ), n )
         jreal = irwrb - 1
         jimag = irwib - 1
         DO 160 jcol = 1, nrhs
            DO 150 jrow = 1, n
               jreal = jreal + 1
               jimag = jimag + 1
               b( jrow, jcol ) = cmplx( rwork( jreal ), rwork( jimag ) )
  150       CONTINUE
  160    CONTINUE
*
*        Unscale.
*
         CALL slascl( 'G', 0, 0, one, orgnrm, n, 1, d, n, info )
         CALL slasrt( 'D', n, d, info )
         CALL clascl( 'G', 0, 0, orgnrm, one, n, nrhs, b, ldb, info )
*
         RETURN
      END IF
*
*     Book-keeping and setting up some constants.
*     U ... GIVNUM and NRWORK are offsets into RWORK, SIZEI ... IWK
*     are offsets into IWORK, all for the arrays exchanged with
*     SLASDA and CLALSA.  BX is the start in WORK of the intermediate
*     right hand side, which is addressed with leading dimension N.
*
      nlvl = int( log( real( n ) / real( smlsiz+1 ) ) / log( two ) ) + 1
*
      smlszp = smlsiz + 1
*
      u = 1
      vt = 1 + smlsiz*n
      difl = vt + smlszp*n
      difr = difl + nlvl*n
      z = difr + nlvl*n*2
      c = z + nlvl*n
      s = c + n
      poles = s + n
      givnum = poles + 2*nlvl*n
      nrwork = givnum + 2*nlvl*n
      bx = 1
*
      irwrb = nrwork
      irwib = irwrb + smlsiz*nrhs
      irwb = irwib + smlsiz*nrhs
*
      sizei = 1 + n
      k = sizei + n
      givptr = k + n
      perm = givptr + n
      givcol = perm + nlvl*n
      iwk = givcol + nlvl*n*2
*
      st = 1
      sqre = 0
      icmpq1 = 1
      icmpq2 = 0
      nsub = 0
*
*     Diagonal entries smaller than EPS in magnitude are replaced by
*     EPS carrying the sign of the original entry.
*
      DO 170 i = 1, n
         IF( abs( d( i ) ).LT.eps ) THEN
            d( i ) = sign( eps, d( i ) )
         END IF
  170 CONTINUE
*
*     Split at every |E(I)| < EPS (and at I = NM1).  IWORK(1:NSUB)
*     records the first row of each subproblem and
*     IWORK(SIZEI:SIZEI+NSUB-1) its size; both are read back in
*     loop 320.
*
      DO 240 i = 1, nm1
         IF( ( abs( e( i ) ).LT.eps ) .OR. ( i.EQ.nm1 ) ) THEN
            nsub = nsub + 1
            iwork( nsub ) = st
*
*           Subproblem found. First determine its size and then
*           apply divide and conquer on it.
*
            IF( i.LT.nm1 ) THEN
*
*              A subproblem with E(I) small for I < NM1.
*
               nsize = i - st + 1
               iwork( sizei+nsub-1 ) = nsize
            ELSE IF( abs( e( i ) ).GE.eps ) THEN
*
*              A subproblem with E(NM1) not too small but I = NM1.
*
               nsize = n - st + 1
               iwork( sizei+nsub-1 ) = nsize
            ELSE
*
*              A subproblem with E(NM1) small. This implies an
*              1-by-1 subproblem at D(N), which is not solved
*              explicitly.
*
               nsize = i - st + 1
               iwork( sizei+nsub-1 ) = nsize
               nsub = nsub + 1
               iwork( nsub ) = n
               iwork( sizei+nsub-1 ) = 1
               CALL ccopy( nrhs, b( n, 1 ), ldb, work( bx+nm1 ), n )
            END IF
            st1 = st - 1
            IF( nsize.EQ.1 ) THEN
*
*              This is a 1-by-1 subproblem and is not solved
*              explicitly.
*
               CALL ccopy( nrhs, b( st, 1 ), ldb, work( bx+st1 ), n )
            ELSE IF( nsize.LE.smlsiz ) THEN
*
*              This is a small subproblem and is solved by SLASDQ.
*
               CALL slaset( 'A', nsize, nsize, zero, one,
     $                      rwork( vt+st1 ), n )
               CALL slaset( 'A', nsize, nsize, zero, one,
     $                      rwork( u+st1 ), n )
               CALL slasdq( 'U', 0, nsize, nsize, nsize, 0, d( st ),
     $                      e( st ), rwork( vt+st1 ), n, rwork( u+st1 ),
     $                      n, rwork( nrwork ), 1, rwork( nrwork ),
     $                      info )
               IF( info.NE.0 ) THEN
                  RETURN
               END IF
*
*              In the real version, B is passed to SLASDQ and multiplied
*              internally by Q**H. Here B is complex and that product is
*              computed below in two steps (real and imaginary parts).
*
               j = irwb - 1
               DO 190 jcol = 1, nrhs
                  DO 180 jrow = st, st + nsize - 1
                     j = j + 1
                     rwork( j ) = real( b( jrow, jcol ) )
  180             CONTINUE
  190          CONTINUE
               CALL sgemm( 'T', 'N', nsize, nrhs, nsize, one,
     $                     rwork( u+st1 ), n, rwork( irwb ), nsize,
     $                     zero, rwork( irwrb ), nsize )
               j = irwb - 1
               DO 210 jcol = 1, nrhs
                  DO 200 jrow = st, st + nsize - 1
                     j = j + 1
                     rwork( j ) = aimag( b( jrow, jcol ) )
  200             CONTINUE
  210          CONTINUE
               CALL sgemm( 'T', 'N', nsize, nrhs, nsize, one,
     $                     rwork( u+st1 ), n, rwork( irwb ), nsize,
     $                     zero, rwork( irwib ), nsize )
               jreal = irwrb - 1
               jimag = irwib - 1
               DO 230 jcol = 1, nrhs
                  DO 220 jrow = st, st + nsize - 1
                     jreal = jreal + 1
                     jimag = jimag + 1
                     b( jrow, jcol ) = cmplx( rwork( jreal ),
     $                                 rwork( jimag ) )
  220             CONTINUE
  230          CONTINUE
*
               CALL clacpy( 'A', nsize, nrhs, b( st, 1 ), ldb,
     $                      work( bx+st1 ), n )
            ELSE
*
*              A large problem. Solve it using divide and conquer.
*
               CALL slasda( icmpq1, smlsiz, nsize, sqre, d( st ),
     $                      e( st ), rwork( u+st1 ), n, rwork( vt+st1 ),
     $                      iwork( k+st1 ), rwork( difl+st1 ),
     $                      rwork( difr+st1 ), rwork( z+st1 ),
     $                      rwork( poles+st1 ), iwork( givptr+st1 ),
     $                      iwork( givcol+st1 ), n, iwork( perm+st1 ),
     $                      rwork( givnum+st1 ), rwork( c+st1 ),
     $                      rwork( s+st1 ), rwork( nrwork ),
     $                      iwork( iwk ), info )
               IF( info.NE.0 ) THEN
                  RETURN
               END IF
               bxst = bx + st1
               CALL clalsa( icmpq2, smlsiz, nsize, nrhs, b( st, 1 ),
     $                      ldb, work( bxst ), n, rwork( u+st1 ), n,
     $                      rwork( vt+st1 ), iwork( k+st1 ),
     $                      rwork( difl+st1 ), rwork( difr+st1 ),
     $                      rwork( z+st1 ), rwork( poles+st1 ),
     $                      iwork( givptr+st1 ), iwork( givcol+st1 ), n,
     $                      iwork( perm+st1 ), rwork( givnum+st1 ),
     $                      rwork( c+st1 ), rwork( s+st1 ),
     $                      rwork( nrwork ), iwork( iwk ), info )
               IF( info.NE.0 ) THEN
                  RETURN
               END IF
            END IF
            st = i + 1
         END IF
  240 CONTINUE
*
*     Apply the singular values and treat the tiny ones as zero.
*
      tol = rcnd*abs( d( isamax( n, d, 1 ) ) )
*
      DO 250 i = 1, n
*
*        Some of the elements in D can be negative because 1-by-1
*        subproblems were not solved explicitly.
*
         IF( abs( d( i ) ).LE.tol ) THEN
            CALL claset( 'A', 1, nrhs, czero, czero, work( bx+i-1 ), n )
         ELSE
            rank = rank + 1
            CALL clascl( 'G', 0, 0, d( i ), one, 1, nrhs,
     $                   work( bx+i-1 ), n, info )
         END IF
         d( i ) = abs( d( i ) )
  250 CONTINUE
*
*     Now apply back the right singular vectors.
*     The subproblem list saved in IWORK by loop 240 is replayed;
*     ICMPQ2 = 1 switches CLALSA to its second mode of operation.
*
      icmpq2 = 1
      DO 320 i = 1, nsub
         st = iwork( i )
         st1 = st - 1
         nsize = iwork( sizei+i-1 )
         bxst = bx + st1
         IF( nsize.EQ.1 ) THEN
            CALL ccopy( nrhs, work( bxst ), n, b( st, 1 ), ldb )
         ELSE IF( nsize.LE.smlsiz ) THEN
*
*           Since B and BX are complex, the following call to SGEMM
*           is performed in two steps (real and imaginary parts).
*
*           CALL SGEMM( 'T', 'N', NSIZE, NRHS, NSIZE, ONE,
*    $                  RWORK( VT+ST1 ), N, RWORK( BXST ), N, ZERO,
*    $                  B( ST, 1 ), LDB )
*
            j = bxst - n - 1
            jreal = irwb - 1
            DO 270 jcol = 1, nrhs
               j = j + n
               DO 260 jrow = 1, nsize
                  jreal = jreal + 1
                  rwork( jreal ) = real( work( j+jrow ) )
  260          CONTINUE
  270       CONTINUE
            CALL sgemm( 'T', 'N', nsize, nrhs, nsize, one,
     $                  rwork( vt+st1 ), n, rwork( irwb ), nsize, zero,
     $                  rwork( irwrb ), nsize )
            j = bxst - n - 1
            jimag = irwb - 1
            DO 290 jcol = 1, nrhs
               j = j + n
               DO 280 jrow = 1, nsize
                  jimag = jimag + 1
                  rwork( jimag ) = aimag( work( j+jrow ) )
  280          CONTINUE
  290       CONTINUE
            CALL sgemm( 'T', 'N', nsize, nrhs, nsize, one,
     $                  rwork( vt+st1 ), n, rwork( irwb ), nsize, zero,
     $                  rwork( irwib ), nsize )
            jreal = irwrb - 1
            jimag = irwib - 1
            DO 310 jcol = 1, nrhs
               DO 300 jrow = st, st + nsize - 1
                  jreal = jreal + 1
                  jimag = jimag + 1
                  b( jrow, jcol ) = cmplx( rwork( jreal ),
     $                              rwork( jimag ) )
  300          CONTINUE
  310       CONTINUE
         ELSE
            CALL clalsa( icmpq2, smlsiz, nsize, nrhs, work( bxst ), n,
     $                   b( st, 1 ), ldb, rwork( u+st1 ), n,
     $                   rwork( vt+st1 ), iwork( k+st1 ),
     $                   rwork( difl+st1 ), rwork( difr+st1 ),
     $                   rwork( z+st1 ), rwork( poles+st1 ),
     $                   iwork( givptr+st1 ), iwork( givcol+st1 ), n,
     $                   iwork( perm+st1 ), rwork( givnum+st1 ),
     $                   rwork( c+st1 ), rwork( s+st1 ),
     $                   rwork( nrwork ), iwork( iwk ), info )
            IF( info.NE.0 ) THEN
               RETURN
            END IF
         END IF
  320 CONTINUE
*
*     Unscale and sort the singular values.
*
      CALL slascl( 'G', 0, 0, one, orgnrm, n, 1, d, n, info )
      CALL slasrt( 'D', n, d, info )
      CALL clascl( 'G', 0, 0, orgnrm, one, n, nrhs, b, ldb, info )
*
      RETURN
*
*     End of CLALSD
*

◆ clanhf()

real function clanhf	(	character	norm,
		character	transr,
		character	uplo,
		integer	n,
		complex, dimension( 0: * )	a,
		real, dimension( 0: * )	work )

CLANHF returns the value of the 1-norm, or the Frobenius norm, or the infinity norm, or the element of largest absolute value of a Hermitian matrix in RFP format.

Download CLANHF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CLANHF  returns the value of the one norm,  or the Frobenius norm, or
!> the  infinity norm,  or the  element of  largest absolute value  of a
!> complex Hermitian matrix A in RFP format.
!>

Returns

CLANHF

!>
!>    CLANHF = ( max(abs(A(i,j))), NORM = 'M' or 'm'
!>             (
!>             ( norm1(A),         NORM = '1', 'O' or 'o'
!>             (
!>             ( normI(A),         NORM = 'I' or 'i'
!>             (
!>             ( normF(A),         NORM = 'F', 'f', 'E' or 'e'
!>
!> where  norm1  denotes the  one norm of a matrix (maximum column sum),
!> normI  denotes the  infinity norm  of a matrix  (maximum row sum) and
!> normF  denotes the  Frobenius norm of a matrix (square root of sum of
!> squares).  Note that  max(abs(A(i,j)))  is not a  matrix norm.
!>

Parameters

[in]	NORM	!> NORM is CHARACTER !> Specifies the value to be returned in CLANHF as described !> above. !>
[in]	TRANSR	!> TRANSR is CHARACTER !> Specifies whether the RFP format of A is normal or !> conjugate-transposed format. !> = 'N': RFP format is Normal !> = 'C': RFP format is Conjugate-transposed !>
[in]	UPLO	!> UPLO is CHARACTER !> On entry, UPLO specifies whether the RFP matrix A came from !> an upper or lower triangular matrix as follows: !> !> UPLO = 'U' or 'u' RFP A came from an upper triangular !> matrix !> !> UPLO = 'L' or 'l' RFP A came from a lower triangular !> matrix !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. When N = 0, CLANHF is !> set to zero. !>
[in]	A	!> A is COMPLEX array, dimension ( N*(N+1)/2 ); !> On entry, the matrix A in RFP Format. !> RFP Format is described by TRANSR, UPLO and N as follows: !> If TRANSR='N' then RFP A is (0:N,0:K-1) when N is even; !> K=N/2. RFP A is (0:N-1,0:K) when N is odd; K=N/2. If !> TRANSR = 'C' then RFP is the Conjugate-transpose of RFP A !> as defined when TRANSR = 'N'. The contents of RFP A are !> defined by UPLO as follows: If UPLO = 'U' the RFP A !> contains the ( N*(N+1)/2 ) elements of upper packed A !> either in normal or conjugate-transpose Format. If !> UPLO = 'L' the RFP A contains the ( N*(N+1)/2 ) elements !> of lower packed A either in normal or conjugate-transpose !> Format. The LDA of RFP A is (N+1)/2 when TRANSR = 'C'. When !> TRANSR is 'N' the LDA is N+1 when N is even and is N when !> N is odd. See the Note below for more details. !> Unchanged on exit. !>
[out]	WORK	!> WORK is REAL array, dimension (LWORK), !> where LWORK >= N when NORM = 'I' or '1' or 'O'; otherwise, !> WORK is not referenced. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  We first consider Standard Packed Format when N is even.
!>  We give an example where N = 6.
!>
!>      AP is Upper             AP is Lower
!>
!>   00 01 02 03 04 05       00
!>      11 12 13 14 15       10 11
!>         22 23 24 25       20 21 22
!>            33 34 35       30 31 32 33
!>               44 45       40 41 42 43 44
!>                  55       50 51 52 53 54 55
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:5,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(4:6,0:2) consists of
!>  conjugate-transpose of the first three columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(1:6,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:2,0:2) consists of
!>  conjugate-transpose of the last three columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N even and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                -- -- --
!>        03 04 05                33 43 53
!>                                   -- --
!>        13 14 15                00 44 54
!>                                      --
!>        23 24 25                10 11 55
!>
!>        33 34 35                20 21 22
!>        --
!>        00 44 45                30 31 32
!>        -- --
!>        01 11 55                40 41 42
!>        -- -- --
!>        02 12 22                50 51 52
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- -- --                -- -- -- -- -- --
!>     03 13 23 33 00 01 02    33 00 10 20 30 40 50
!>     -- -- -- -- --                -- -- -- -- --
!>     04 14 24 34 44 11 12    43 44 11 21 31 41 51
!>     -- -- -- -- -- --                -- -- -- --
!>     05 15 25 35 45 55 22    53 54 55 22 32 42 52
!>
!>
!>  We next  consider Standard Packed Format when N is odd.
!>  We give an example where N = 5.
!>
!>     AP is Upper                 AP is Lower
!>
!>   00 01 02 03 04              00
!>      11 12 13 14              10 11
!>         22 23 24              20 21 22
!>            33 34              30 31 32 33
!>               44              40 41 42 43 44
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:4,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(3:4,0:1) consists of
!>  conjugate-transpose of the first two   columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(0:4,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:1,1:2) consists of
!>  conjugate-transpose of the last two   columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N odd  and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                   -- --
!>        02 03 04                00 33 43
!>                                      --
!>        12 13 14                10 11 44
!>
!>        22 23 24                20 21 22
!>        --
!>        00 33 34                30 31 32
!>        -- --
!>        01 11 44                40 41 42
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- --                   -- -- -- -- --
!>     02 12 22 00 01             00 10 20 30 40
!>     -- -- -- --                   -- -- -- --
!>     03 13 23 33 11             33 11 21 31 41
!>     -- -- -- -- --                   -- -- --
!>     04 14 24 34 44             43 44 22 32 42
!>

Definition at line 245 of file clanhf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          NORM, TRANSR, UPLO
      INTEGER            N
*     ..
*     .. Array Arguments ..
      REAL               WORK( 0: * )
      COMPLEX            A( 0: * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      parameter( one = 1.0e+0, zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            I, J, IFM, ILU, NOE, N1, K, L, LDA
      REAL               SCALE, S, VALUE, AA, TEMP
*     ..
*     .. External Functions ..
      LOGICAL            LSAME, SISNAN
      EXTERNAL           lsame, sisnan
*     ..
*     .. External Subroutines ..
      EXTERNAL           classq
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, real, sqrt
*     ..
*     .. Executable Statements ..
*
      IF( n.EQ.0 ) THEN
         clanhf = zero
         RETURN
      ELSE IF( n.EQ.1 ) THEN
         clanhf = abs(real(a(0)))
         RETURN
      END IF
*
*     set noe = 1 if n is odd. if n is even set noe=0
*
      noe = 1
      IF( mod( n, 2 ).EQ.0 )
     $   noe = 0
*
*     set ifm = 0 when form='C' or 'c' and 1 otherwise
*
      ifm = 1
      IF( lsame( transr, 'C' ) )
     $   ifm = 0
*
*     set ilu = 0 when uplo='U or 'u' and 1 otherwise
*
      ilu = 1
      IF( lsame( uplo, 'U' ) )
     $   ilu = 0
*
*     set lda = (n+1)/2 when ifm = 0
*     set lda = n when ifm = 1 and noe = 1
*     set lda = n+1 when ifm = 1 and noe = 0
*
      IF( ifm.EQ.1 ) THEN
         IF( noe.EQ.1 ) THEN
            lda = n
         ELSE
*           noe=0
            lda = n + 1
         END IF
      ELSE
*        ifm=0
         lda = ( n+1 ) / 2
      END IF
*
      IF( lsame( norm, 'M' ) ) THEN
*
*       Find max(abs(A(i,j))).
*
         k = ( n+1 ) / 2
         VALUE = zero
         IF( noe.EQ.1 ) THEN
*           n is odd & n = k + k - 1
            IF( ifm.EQ.1 ) THEN
*              A is n by k
               IF( ilu.EQ.1 ) THEN
*                 uplo ='L'
                  j = 0
*                 -> L(0,0)
                  temp = abs( real( a( j+j*lda ) ) )
                  IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                 VALUE = temp
                  DO i = 1, n - 1
                     temp = abs( a( i+j*lda ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
                  DO j = 1, k - 1
                     DO i = 0, j - 2
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                     i = j - 1
*                    L(k+j,k+j)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     i = j
*                    -> L(j,j)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     DO i = j + 1, n - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                  END DO
               ELSE
*                 uplo = 'U'
                  DO j = 0, k - 2
                     DO i = 0, k + j - 2
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                     i = k + j - 1
*                    -> U(i,i)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     i = i + 1
*                    =k+j; i -> U(j,j)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     DO i = k + j + 1, n - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                  END DO
                  DO i = 0, n - 2
                     temp = abs( a( i+j*lda ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
*                    j=k-1
                  END DO
*                 i=n-1 -> U(n-1,n-1)
                  temp = abs( real( a( i+j*lda ) ) )
                  IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                 VALUE = temp
               END IF
            ELSE
*              xpose case; A is k by n
               IF( ilu.EQ.1 ) THEN
*                 uplo ='L'
                  DO j = 0, k - 2
                     DO i = 0, j - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                     i = j
*                    L(i,i)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     i = j + 1
*                    L(j+k,j+k)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     DO i = j + 2, k - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                  END DO
                  j = k - 1
                  DO i = 0, k - 2
                     temp = abs( a( i+j*lda ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
                  i = k - 1
*                 -> L(i,i) is at A(i,j)
                  temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  DO j = k, n - 1
                     DO i = 0, k - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                  END DO
               ELSE
*                 uplo = 'U'
                  DO j = 0, k - 2
                     DO i = 0, k - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                  END DO
                  j = k - 1
*                 -> U(j,j) is at A(0,j)
                  temp = abs( real( a( 0+j*lda ) ) )
                  IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  DO i = 1, k - 1
                     temp = abs( a( i+j*lda ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
                  DO j = k, n - 1
                     DO i = 0, j - k - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                     i = j - k
*                    -> U(i,i) at A(i,j)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     i = j - k + 1
*                    U(j,j)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     DO i = j - k + 2, k - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                  END DO
               END IF
            END IF
         ELSE
*           n is even & k = n/2
            IF( ifm.EQ.1 ) THEN
*              A is n+1 by k
               IF( ilu.EQ.1 ) THEN
*                 uplo ='L'
                  j = 0
*                 -> L(k,k) & j=1 -> L(0,0)
                  temp = abs( real( a( j+j*lda ) ) )
                  IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                 VALUE = temp
                  temp = abs( real( a( j+1+j*lda ) ) )
                  IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                 VALUE = temp
                  DO i = 2, n
                     temp = abs( a( i+j*lda ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
                  DO j = 1, k - 1
                     DO i = 0, j - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                     i = j
*                    L(k+j,k+j)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     i = j + 1
*                    -> L(j,j)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     DO i = j + 2, n
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                  END DO
               ELSE
*                 uplo = 'U'
                  DO j = 0, k - 2
                     DO i = 0, k + j - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                     i = k + j
*                    -> U(i,i)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     i = i + 1
*                    =k+j+1; i -> U(j,j)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     DO i = k + j + 2, n
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                  END DO
                  DO i = 0, n - 2
                     temp = abs( a( i+j*lda ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
*                 j=k-1
                  END DO
*                 i=n-1 -> U(n-1,n-1)
                  temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  i = n
*                 -> U(k-1,k-1)
                  temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
               END IF
            ELSE
*              xpose case; A is k by n+1
               IF( ilu.EQ.1 ) THEN
*                 uplo ='L'
                  j = 0
*                 -> L(k,k) at A(0,0)
                  temp = abs( real( a( j+j*lda ) ) )
                  IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  DO i = 1, k - 1
                     temp = abs( a( i+j*lda ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
                  DO j = 1, k - 1
                     DO i = 0, j - 2
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                     i = j - 1
*                    L(i,i)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     i = j
*                    L(j+k,j+k)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     DO i = j + 1, k - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                  END DO
                  j = k
                  DO i = 0, k - 2
                     temp = abs( a( i+j*lda ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
                  i = k - 1
*                 -> L(i,i) is at A(i,j)
                  temp = abs( real( a( i+j*lda ) ) )
                  IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                 VALUE = temp
                  DO j = k + 1, n
                     DO i = 0, k - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                  END DO
               ELSE
*                 uplo = 'U'
                  DO j = 0, k - 1
                     DO i = 0, k - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                  END DO
                  j = k
*                 -> U(j,j) is at A(0,j)
                  temp = abs( real( a( 0+j*lda ) ) )
                  IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                 VALUE = temp
                  DO i = 1, k - 1
                     temp = abs( a( i+j*lda ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
                  DO j = k + 1, n - 1
                     DO i = 0, j - k - 2
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                     i = j - k - 1
*                    -> U(i,i) at A(i,j)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     i = j - k
*                    U(j,j)
                     temp = abs( real( a( i+j*lda ) ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                     DO i = j - k + 1, k - 1
                        temp = abs( a( i+j*lda ) )
                        IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                       VALUE = temp
                     END DO
                  END DO
                  j = n
                  DO i = 0, k - 2
                     temp = abs( a( i+j*lda ) )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
                  i = k - 1
*                 U(k,k) at A(i,j)
                  temp = abs( real( a( i+j*lda ) ) )
                  IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                 VALUE = temp
               END IF
            END IF
         END IF
      ELSE IF( ( lsame( norm, 'I' ) ) .OR. ( lsame( norm, 'O' ) ) .OR.
     $         ( norm.EQ.'1' ) ) THEN
*
*       Find normI(A) ( = norm1(A), since A is Hermitian).
*
         IF( ifm.EQ.1 ) THEN
*           A is 'N'
            k = n / 2
            IF( noe.EQ.1 ) THEN
*              n is odd & A is n by (n+1)/2
               IF( ilu.EQ.0 ) THEN
*                 uplo = 'U'
                  DO i = 0, k - 1
                     work( i ) = zero
                  END DO
                  DO j = 0, k
                     s = zero
                     DO i = 0, k + j - 1
                        aa = abs( a( i+j*lda ) )
*                       -> A(i,j+k)
                        s = s + aa
                        work( i ) = work( i ) + aa
                     END DO
                     aa = abs( real( a( i+j*lda ) ) )
*                    -> A(j+k,j+k)
                     work( j+k ) = s + aa
                     IF( i.EQ.k+k )
     $                  GO TO 10
                     i = i + 1
                     aa = abs( real( a( i+j*lda ) ) )
*                    -> A(j,j)
                     work( j ) = work( j ) + aa
                     s = zero
                     DO l = j + 1, k - 1
                        i = i + 1
                        aa = abs( a( i+j*lda ) )
*                       -> A(l,j)
                        s = s + aa
                        work( l ) = work( l ) + aa
                     END DO
                     work( j ) = work( j ) + s
                  END DO
   10             CONTINUE
                  VALUE = work( 0 )
                  DO i = 1, n-1
                     temp = work( i )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
               ELSE
*                 ilu = 1 & uplo = 'L'
                  k = k + 1
*                 k=(n+1)/2 for n odd and ilu=1
                  DO i = k, n - 1
                     work( i ) = zero
                  END DO
                  DO j = k - 1, 0, -1
                     s = zero
                     DO i = 0, j - 2
                        aa = abs( a( i+j*lda ) )
*                       -> A(j+k,i+k)
                        s = s + aa
                        work( i+k ) = work( i+k ) + aa
                     END DO
                     IF( j.GT.0 ) THEN
                        aa = abs( real( a( i+j*lda ) ) )
*                       -> A(j+k,j+k)
                        s = s + aa
                        work( i+k ) = work( i+k ) + s
*                       i=j
                        i = i + 1
                     END IF
                     aa = abs( real( a( i+j*lda ) ) )
*                    -> A(j,j)
                     work( j ) = aa
                     s = zero
                     DO l = j + 1, n - 1
                        i = i + 1
                        aa = abs( a( i+j*lda ) )
*                       -> A(l,j)
                        s = s + aa
                        work( l ) = work( l ) + aa
                     END DO
                     work( j ) = work( j ) + s
                  END DO
                  VALUE = work( 0 )
                  DO i = 1, n-1
                     temp = work( i )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
               END IF
            ELSE
*              n is even & A is n+1 by k = n/2
               IF( ilu.EQ.0 ) THEN
*                 uplo = 'U'
                  DO i = 0, k - 1
                     work( i ) = zero
                  END DO
                  DO j = 0, k - 1
                     s = zero
                     DO i = 0, k + j - 1
                        aa = abs( a( i+j*lda ) )
*                       -> A(i,j+k)
                        s = s + aa
                        work( i ) = work( i ) + aa
                     END DO
                     aa = abs( real( a( i+j*lda ) ) )
*                    -> A(j+k,j+k)
                     work( j+k ) = s + aa
                     i = i + 1
                     aa = abs( real( a( i+j*lda ) ) )
*                    -> A(j,j)
                     work( j ) = work( j ) + aa
                     s = zero
                     DO l = j + 1, k - 1
                        i = i + 1
                        aa = abs( a( i+j*lda ) )
*                       -> A(l,j)
                        s = s + aa
                        work( l ) = work( l ) + aa
                     END DO
                     work( j ) = work( j ) + s
                  END DO
                  VALUE = work( 0 )
                  DO i = 1, n-1
                     temp = work( i )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
               ELSE
*                 ilu = 1 & uplo = 'L'
                  DO i = k, n - 1
                     work( i ) = zero
                  END DO
                  DO j = k - 1, 0, -1
                     s = zero
                     DO i = 0, j - 1
                        aa = abs( a( i+j*lda ) )
*                       -> A(j+k,i+k)
                        s = s + aa
                        work( i+k ) = work( i+k ) + aa
                     END DO
                     aa = abs( real( a( i+j*lda ) ) )
*                    -> A(j+k,j+k)
                     s = s + aa
                     work( i+k ) = work( i+k ) + s
*                    i=j
                     i = i + 1
                     aa = abs( real( a( i+j*lda ) ) )
*                    -> A(j,j)
                     work( j ) = aa
                     s = zero
                     DO l = j + 1, n - 1
                        i = i + 1
                        aa = abs( a( i+j*lda ) )
*                       -> A(l,j)
                        s = s + aa
                        work( l ) = work( l ) + aa
                     END DO
                     work( j ) = work( j ) + s
                  END DO
                  VALUE = work( 0 )
                  DO i = 1, n-1
                     temp = work( i )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
               END IF
            END IF
         ELSE
*           ifm=0
            k = n / 2
            IF( noe.EQ.1 ) THEN
*              n is odd & A is (n+1)/2 by n
               IF( ilu.EQ.0 ) THEN
*                 uplo = 'U'
                  n1 = k
*                 n/2
                  k = k + 1
*                 k is the row size and lda
                  DO i = n1, n - 1
                     work( i ) = zero
                  END DO
                  DO j = 0, n1 - 1
                     s = zero
                     DO i = 0, k - 1
                        aa = abs( a( i+j*lda ) )
*                       A(j,n1+i)
                        work( i+n1 ) = work( i+n1 ) + aa
                        s = s + aa
                     END DO
                     work( j ) = s
                  END DO
*                 j=n1=k-1 is special
                  s = abs( real( a( 0+j*lda ) ) )
*                 A(k-1,k-1)
                  DO i = 1, k - 1
                     aa = abs( a( i+j*lda ) )
*                    A(k-1,i+n1)
                     work( i+n1 ) = work( i+n1 ) + aa
                     s = s + aa
                  END DO
                  work( j ) = work( j ) + s
                  DO j = k, n - 1
                     s = zero
                     DO i = 0, j - k - 1
                        aa = abs( a( i+j*lda ) )
*                       A(i,j-k)
                        work( i ) = work( i ) + aa
                        s = s + aa
                     END DO
*                    i=j-k
                     aa = abs( real( a( i+j*lda ) ) )
*                    A(j-k,j-k)
                     s = s + aa
                     work( j-k ) = work( j-k ) + s
                     i = i + 1
                     s = abs( real( a( i+j*lda ) ) )
*                    A(j,j)
                     DO l = j + 1, n - 1
                        i = i + 1
                        aa = abs( a( i+j*lda ) )
*                       A(j,l)
                        work( l ) = work( l ) + aa
                        s = s + aa
                     END DO
                     work( j ) = work( j ) + s
                  END DO
                  VALUE = work( 0 )
                  DO i = 1, n-1
                     temp = work( i )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
               ELSE
*                 ilu=1 & uplo = 'L'
                  k = k + 1
*                 k=(n+1)/2 for n odd and ilu=1
                  DO i = k, n - 1
                     work( i ) = zero
                  END DO
                  DO j = 0, k - 2
*                    process
                     s = zero
                     DO i = 0, j - 1
                        aa = abs( a( i+j*lda ) )
*                       A(j,i)
                        work( i ) = work( i ) + aa
                        s = s + aa
                     END DO
                     aa = abs( real( a( i+j*lda ) ) )
*                    i=j so process of A(j,j)
                     s = s + aa
                     work( j ) = s
*                    is initialised here
                     i = i + 1
*                    i=j process A(j+k,j+k)
                     aa = abs( real( a( i+j*lda ) ) )
                     s = aa
                     DO l = k + j + 1, n - 1
                        i = i + 1
                        aa = abs( a( i+j*lda ) )
*                       A(l,k+j)
                        s = s + aa
                        work( l ) = work( l ) + aa
                     END DO
                     work( k+j ) = work( k+j ) + s
                  END DO
*                 j=k-1 is special :process col A(k-1,0:k-1)
                  s = zero
                  DO i = 0, k - 2
                     aa = abs( a( i+j*lda ) )
*                    A(k,i)
                     work( i ) = work( i ) + aa
                     s = s + aa
                  END DO
*                 i=k-1
                  aa = abs( real( a( i+j*lda ) ) )
*                 A(k-1,k-1)
                  s = s + aa
                  work( i ) = s
*                 done with col j=k+1
                  DO j = k, n - 1
*                    process col j of A = A(j,0:k-1)
                     s = zero
                     DO i = 0, k - 1
                        aa = abs( a( i+j*lda ) )
*                       A(j,i)
                        work( i ) = work( i ) + aa
                        s = s + aa
                     END DO
                     work( j ) = work( j ) + s
                  END DO
                  VALUE = work( 0 )
                  DO i = 1, n-1
                     temp = work( i )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
               END IF
            ELSE
*              n is even & A is k=n/2 by n+1
               IF( ilu.EQ.0 ) THEN
*                 uplo = 'U'
                  DO i = k, n - 1
                     work( i ) = zero
                  END DO
                  DO j = 0, k - 1
                     s = zero
                     DO i = 0, k - 1
                        aa = abs( a( i+j*lda ) )
*                       A(j,i+k)
                        work( i+k ) = work( i+k ) + aa
                        s = s + aa
                     END DO
                     work( j ) = s
                  END DO
*                 j=k
                  aa = abs( real( a( 0+j*lda ) ) )
*                 A(k,k)
                  s = aa
                  DO i = 1, k - 1
                     aa = abs( a( i+j*lda ) )
*                    A(k,k+i)
                     work( i+k ) = work( i+k ) + aa
                     s = s + aa
                  END DO
                  work( j ) = work( j ) + s
                  DO j = k + 1, n - 1
                     s = zero
                     DO i = 0, j - 2 - k
                        aa = abs( a( i+j*lda ) )
*                       A(i,j-k-1)
                        work( i ) = work( i ) + aa
                        s = s + aa
                     END DO
*                    i=j-1-k
                     aa = abs( real( a( i+j*lda ) ) )
*                    A(j-k-1,j-k-1)
                     s = s + aa
                     work( j-k-1 ) = work( j-k-1 ) + s
                     i = i + 1
                     aa = abs( real( a( i+j*lda ) ) )
*                    A(j,j)
                     s = aa
                     DO l = j + 1, n - 1
                        i = i + 1
                        aa = abs( a( i+j*lda ) )
*                       A(j,l)
                        work( l ) = work( l ) + aa
                        s = s + aa
                     END DO
                     work( j ) = work( j ) + s
                  END DO
*                 j=n
                  s = zero
                  DO i = 0, k - 2
                     aa = abs( a( i+j*lda ) )
*                    A(i,k-1)
                     work( i ) = work( i ) + aa
                     s = s + aa
                  END DO
*                 i=k-1
                  aa = abs( real( a( i+j*lda ) ) )
*                 A(k-1,k-1)
                  s = s + aa
                  work( i ) = work( i ) + s
                  VALUE = work( 0 )
                  DO i = 1, n-1
                     temp = work( i )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
               ELSE
*                 ilu=1 & uplo = 'L'
                  DO i = k, n - 1
                     work( i ) = zero
                  END DO
*                 j=0 is special :process col A(k:n-1,k)
                  s = abs( real( a( 0 ) ) )
*                 A(k,k)
                  DO i = 1, k - 1
                     aa = abs( a( i ) )
*                    A(k+i,k)
                     work( i+k ) = work( i+k ) + aa
                     s = s + aa
                  END DO
                  work( k ) = work( k ) + s
                  DO j = 1, k - 1
*                    process
                     s = zero
                     DO i = 0, j - 2
                        aa = abs( a( i+j*lda ) )
*                       A(j-1,i)
                        work( i ) = work( i ) + aa
                        s = s + aa
                     END DO
                     aa = abs( real( a( i+j*lda ) ) )
*                    i=j-1 so process of A(j-1,j-1)
                     s = s + aa
                     work( j-1 ) = s
*                    is initialised here
                     i = i + 1
*                    i=j process A(j+k,j+k)
                     aa = abs( real( a( i+j*lda ) ) )
                     s = aa
                     DO l = k + j + 1, n - 1
                        i = i + 1
                        aa = abs( a( i+j*lda ) )
*                       A(l,k+j)
                        s = s + aa
                        work( l ) = work( l ) + aa
                     END DO
                     work( k+j ) = work( k+j ) + s
                  END DO
*                 j=k is special :process col A(k,0:k-1)
                  s = zero
                  DO i = 0, k - 2
                     aa = abs( a( i+j*lda ) )
*                    A(k,i)
                     work( i ) = work( i ) + aa
                     s = s + aa
                  END DO
*
*                 i=k-1
                  aa = abs( real( a( i+j*lda ) ) )
*                 A(k-1,k-1)
                  s = s + aa
                  work( i ) = s
*                 done with col j=k+1
                  DO j = k + 1, n
*
*                    process col j-1 of A = A(j-1,0:k-1)
                     s = zero
                     DO i = 0, k - 1
                        aa = abs( a( i+j*lda ) )
*                       A(j-1,i)
                        work( i ) = work( i ) + aa
                        s = s + aa
                     END DO
                     work( j-1 ) = work( j-1 ) + s
                  END DO
                  VALUE = work( 0 )
                  DO i = 1, n-1
                     temp = work( i )
                     IF( VALUE .LT. temp .OR. sisnan( temp ) )
     $                    VALUE = temp
                  END DO
               END IF
            END IF
         END IF
      ELSE IF( ( lsame( norm, 'F' ) ) .OR. ( lsame( norm, 'E' ) ) ) THEN
*
*       Find normF(A).
*
         k = ( n+1 ) / 2
         scale = zero
         s = one
         IF( noe.EQ.1 ) THEN
*           n is odd
            IF( ifm.EQ.1 ) THEN
*              A is normal & A is n by k
               IF( ilu.EQ.0 ) THEN
*                 A is upper
                  DO j = 0, k - 3
                     CALL classq( k-j-2, a( k+j+1+j*lda ), 1, scale, s )
*                    L at A(k,0)
                  END DO
                  DO j = 0, k - 1
                     CALL classq( k+j-1, a( 0+j*lda ), 1, scale, s )
*                    trap U at A(0,0)
                  END DO
                  s = s + s
*                 double s for the off diagonal elements
                  l = k - 1
*                 -> U(k,k) at A(k-1,0)
                  DO i = 0, k - 2
                     aa = real( a( l ) )
*                    U(k+i,k+i)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     aa = real( a( l+1 ) )
*                    U(i,i)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     l = l + lda + 1
                  END DO
                  aa = real( a( l ) )
*                 U(n-1,n-1)
                  IF( aa.NE.zero ) THEN
                     IF( scale.LT.aa ) THEN
                        s = one + s*( scale / aa )**2
                        scale = aa
                     ELSE
                        s = s + ( aa / scale )**2
                     END IF
                  END IF
               ELSE
*                 ilu=1 & A is lower
                  DO j = 0, k - 1
                     CALL classq( n-j-1, a( j+1+j*lda ), 1, scale, s )
*                    trap L at A(0,0)
                  END DO
                  DO j = 1, k - 2
                     CALL classq( j, a( 0+( 1+j )*lda ), 1, scale, s )
*                    U at A(0,1)
                  END DO
                  s = s + s
*                 double s for the off diagonal elements
                  aa = real( a( 0 ) )
*                 L(0,0) at A(0,0)
                  IF( aa.NE.zero ) THEN
                     IF( scale.LT.aa ) THEN
                        s = one + s*( scale / aa )**2
                        scale = aa
                     ELSE
                        s = s + ( aa / scale )**2
                     END IF
                  END IF
                  l = lda
*                 -> L(k,k) at A(0,1)
                  DO i = 1, k - 1
                     aa = real( a( l ) )
*                    L(k-1+i,k-1+i)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     aa = real( a( l+1 ) )
*                    L(i,i)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     l = l + lda + 1
                  END DO
               END IF
            ELSE
*              A is xpose & A is k by n
               IF( ilu.EQ.0 ) THEN
*                 A**H is upper
                  DO j = 1, k - 2
                     CALL classq( j, a( 0+( k+j )*lda ), 1, scale, s )
*                    U at A(0,k)
                  END DO
                  DO j = 0, k - 2
                     CALL classq( k, a( 0+j*lda ), 1, scale, s )
*                    k by k-1 rect. at A(0,0)
                  END DO
                  DO j = 0, k - 2
                     CALL classq( k-j-1, a( j+1+( j+k-1 )*lda ), 1,
     $                            scale, s )
*                    L at A(0,k-1)
                  END DO
                  s = s + s
*                 double s for the off diagonal elements
                  l = 0 + k*lda - lda
*                 -> U(k-1,k-1) at A(0,k-1)
                  aa = real( a( l ) )
*                 U(k-1,k-1)
                  IF( aa.NE.zero ) THEN
                     IF( scale.LT.aa ) THEN
                        s = one + s*( scale / aa )**2
                        scale = aa
                     ELSE
                        s = s + ( aa / scale )**2
                     END IF
                  END IF
                  l = l + lda
*                 -> U(0,0) at A(0,k)
                  DO j = k, n - 1
                     aa = real( a( l ) )
*                    -> U(j-k,j-k)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     aa = real( a( l+1 ) )
*                    -> U(j,j)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     l = l + lda + 1
                  END DO
               ELSE
*                 A**H is lower
                  DO j = 1, k - 1
                     CALL classq( j, a( 0+j*lda ), 1, scale, s )
*                    U at A(0,0)
                  END DO
                  DO j = k, n - 1
                     CALL classq( k, a( 0+j*lda ), 1, scale, s )
*                    k by k-1 rect. at A(0,k)
                  END DO
                  DO j = 0, k - 3
                     CALL classq( k-j-2, a( j+2+j*lda ), 1, scale, s )
*                    L at A(1,0)
                  END DO
                  s = s + s
*                 double s for the off diagonal elements
                  l = 0
*                 -> L(0,0) at A(0,0)
                  DO i = 0, k - 2
                     aa = real( a( l ) )
*                    L(i,i)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     aa = real( a( l+1 ) )
*                    L(k+i,k+i)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     l = l + lda + 1
                  END DO
*                 L-> k-1 + (k-1)*lda or L(k-1,k-1) at A(k-1,k-1)
                  aa = real( a( l ) )
*                 L(k-1,k-1) at A(k-1,k-1)
                  IF( aa.NE.zero ) THEN
                     IF( scale.LT.aa ) THEN
                        s = one + s*( scale / aa )**2
                        scale = aa
                     ELSE
                        s = s + ( aa / scale )**2
                     END IF
                  END IF
               END IF
            END IF
         ELSE
*           n is even
            IF( ifm.EQ.1 ) THEN
*              A is normal
               IF( ilu.EQ.0 ) THEN
*                 A is upper
                  DO j = 0, k - 2
                     CALL classq( k-j-1, a( k+j+2+j*lda ), 1, scale, s )
*                 L at A(k+1,0)
                  END DO
                  DO j = 0, k - 1
                     CALL classq( k+j, a( 0+j*lda ), 1, scale, s )
*                 trap U at A(0,0)
                  END DO
                  s = s + s
*                 double s for the off diagonal elements
                  l = k
*                 -> U(k,k) at A(k,0)
                  DO i = 0, k - 1
                     aa = real( a( l ) )
*                    U(k+i,k+i)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     aa = real( a( l+1 ) )
*                    U(i,i)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     l = l + lda + 1
                  END DO
               ELSE
*                 ilu=1 & A is lower
                  DO j = 0, k - 1
                     CALL classq( n-j-1, a( j+2+j*lda ), 1, scale, s )
*                    trap L at A(1,0)
                  END DO
                  DO j = 1, k - 1
                     CALL classq( j, a( 0+j*lda ), 1, scale, s )
*                    U at A(0,0)
                  END DO
                  s = s + s
*                 double s for the off diagonal elements
                  l = 0
*                 -> L(k,k) at A(0,0)
                  DO i = 0, k - 1
                     aa = real( a( l ) )
*                    L(k-1+i,k-1+i)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     aa = real( a( l+1 ) )
*                    L(i,i)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     l = l + lda + 1
                  END DO
               END IF
            ELSE
*              A is xpose
               IF( ilu.EQ.0 ) THEN
*                 A**H is upper
                  DO j = 1, k - 1
                     CALL classq( j, a( 0+( k+1+j )*lda ), 1, scale, s )
*                 U at A(0,k+1)
                  END DO
                  DO j = 0, k - 1
                     CALL classq( k, a( 0+j*lda ), 1, scale, s )
*                 k by k rect. at A(0,0)
                  END DO
                  DO j = 0, k - 2
                     CALL classq( k-j-1, a( j+1+( j+k )*lda ), 1, scale,
     $                            s )
*                 L at A(0,k)
                  END DO
                  s = s + s
*                 double s for the off diagonal elements
                  l = 0 + k*lda
*                 -> U(k,k) at A(0,k)
                  aa = real( a( l ) )
*                 U(k,k)
                  IF( aa.NE.zero ) THEN
                     IF( scale.LT.aa ) THEN
                        s = one + s*( scale / aa )**2
                        scale = aa
                     ELSE
                        s = s + ( aa / scale )**2
                     END IF
                  END IF
                  l = l + lda
*                 -> U(0,0) at A(0,k+1)
                  DO j = k + 1, n - 1
                     aa = real( a( l ) )
*                    -> U(j-k-1,j-k-1)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     aa = real( a( l+1 ) )
*                    -> U(j,j)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     l = l + lda + 1
                  END DO
*                 L=k-1+n*lda
*                 -> U(k-1,k-1) at A(k-1,n)
                  aa = real( a( l ) )
*                 U(k,k)
                  IF( aa.NE.zero ) THEN
                     IF( scale.LT.aa ) THEN
                        s = one + s*( scale / aa )**2
                        scale = aa
                     ELSE
                        s = s + ( aa / scale )**2
                     END IF
                  END IF
               ELSE
*                 A**H is lower
                  DO j = 1, k - 1
                     CALL classq( j, a( 0+( j+1 )*lda ), 1, scale, s )
*                 U at A(0,1)
                  END DO
                  DO j = k + 1, n
                     CALL classq( k, a( 0+j*lda ), 1, scale, s )
*                 k by k rect. at A(0,k+1)
                  END DO
                  DO j = 0, k - 2
                     CALL classq( k-j-1, a( j+1+j*lda ), 1, scale, s )
*                 L at A(0,0)
                  END DO
                  s = s + s
*                 double s for the off diagonal elements
                  l = 0
*                 -> L(k,k) at A(0,0)
                  aa = real( a( l ) )
*                 L(k,k) at A(0,0)
                  IF( aa.NE.zero ) THEN
                     IF( scale.LT.aa ) THEN
                        s = one + s*( scale / aa )**2
                        scale = aa
                     ELSE
                        s = s + ( aa / scale )**2
                     END IF
                  END IF
                  l = lda
*                 -> L(0,0) at A(0,1)
                  DO i = 0, k - 2
                     aa = real( a( l ) )
*                    L(i,i)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     aa = real( a( l+1 ) )
*                    L(k+i+1,k+i+1)
                     IF( aa.NE.zero ) THEN
                        IF( scale.LT.aa ) THEN
                           s = one + s*( scale / aa )**2
                           scale = aa
                        ELSE
                           s = s + ( aa / scale )**2
                        END IF
                     END IF
                     l = l + lda + 1
                  END DO
*                 L-> k - 1 + k*lda or L(k-1,k-1) at A(k-1,k)
                  aa = real( a( l ) )
*                 L(k-1,k-1) at A(k-1,k)
                  IF( aa.NE.zero ) THEN
                     IF( scale.LT.aa ) THEN
                        s = one + s*( scale / aa )**2
                        scale = aa
                     ELSE
                        s = s + ( aa / scale )**2
                     END IF
                  END IF
               END IF
            END IF
         END IF
         VALUE = scale*sqrt( s )
      END IF
*
      clanhf = VALUE
      RETURN
*
*     End of CLANHF
*

◆ clarscl2()

subroutine clarscl2	(	integer	m,
		integer	n,
		real, dimension( * )	d,
		complex, dimension( ldx, * )	x,
		integer	ldx )

CLARSCL2 performs reciprocal diagonal scaling on a vector.

Download CLARSCL2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CLARSCL2 performs a reciprocal diagonal scaling on a vector:
!>   x <-- inv(D) * x
!> where the REAL diagonal matrix D is stored as a vector.
!>
!> Eventually to be replaced by BLAS_cge_diag_scale in the new BLAS
!> standard.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of D and X. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of X. N >= 0. !>
[in]	D	!> D is REAL array, length M !> Diagonal matrix D, stored as a vector of length M. !>
[in,out]	X	!> X is COMPLEX array, dimension (LDX,N) !> On entry, the vector X to be scaled by D. !> On exit, the scaled vector. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the vector X. LDX >= M. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 90 of file clarscl2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Reciprocal row scaling of X by the real vector D:
*        X( i, j ) <- X( i, j ) / D( i ),   i = 1..M,  j = 1..N.
*     The entries of D are used as divisors exactly as supplied; no
*     test for zero entries is made here.
*
*     .. Scalar Arguments ..
      INTEGER            M, N, LDX
*     ..
*     .. Array Arguments ..
      COMPLEX            X( LDX, * )
      REAL               D( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            JCOL
*     ..
*     .. Executable Statements ..
*
*     Walk the columns of X; each column is divided element by element
*     by the leading M entries of D in a single section assignment.
*
      DO jcol = 1, n
         x( 1:m, jcol ) = x( 1:m, jcol ) / d( 1:m )
      END DO
*
      RETURN

◆ clarz()

subroutine clarz	(	character	side,
		integer	m,
		integer	n,
		integer	l,
		complex, dimension( * )	v,
		integer	incv,
		complex	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work )

CLARZ applies an elementary reflector (as returned by ctzrzf) to a general matrix.

Download CLARZ + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CLARZ applies a complex elementary reflector H to a complex
!> M-by-N matrix C, from either the left or the right. H is represented
!> in the form
!>
!>       H = I - tau * v * v**H
!>
!> where tau is a complex scalar and v is a complex vector.
!>
!> If tau = 0, then H is taken to be the unit matrix.
!>
!> To apply H**H (the conjugate transpose of H), supply conjg(tau) instead
!> of tau.
!>
!> H is a product of k elementary reflectors as returned by CTZRZF.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': form H * C !> = 'R': form C * H !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. !>
[in]	L	!> L is INTEGER !> The number of entries of the vector V containing !> the meaningful part of the Householder vectors. !> If SIDE = 'L', M >= L >= 0, if SIDE = 'R', N >= L >= 0. !>
[in]	V	!> V is COMPLEX array, dimension (1+(L-1)*abs(INCV)) !> The vector v in the representation of H as returned by !> CTZRZF. V is not used if TAU = 0. !>
[in]	INCV	!> INCV is INTEGER !> The increment between elements of v. INCV <> 0. !>
[in]	TAU	!> TAU is COMPLEX !> The value tau in the representation of H. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by the matrix H * C if SIDE = 'L', !> or C * H if SIDE = 'R'. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension !> (N) if SIDE = 'L' !> or (M) if SIDE = 'R' !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: A. Petitet, Computer Science Dept., Univ. of Tenn., Knoxville, USA

Further Details:

!>

Definition at line 146 of file clarz.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Applies the reflector H = I - tau * u * u**H to C in place, where
*     the code below treats u as having a unit entry in position 1 and
*     the vector v in its last L positions: only row (or column) 1 and
*     the last L rows (or columns) of C are read and updated.
*     WORK holds the intermediate vector w (length N for SIDE = 'L',
*     length M otherwise).
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE
      INTEGER            INCV, L, LDC, M, N
      COMPLEX            TAU
*     ..
*     .. Array Arguments ..
      COMPLEX            C( LDC, * ), V( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE, ZERO
      parameter( one = ( 1.0e+0, 0.0e+0 ),
     $                   zero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. External Subroutines ..
      EXTERNAL           caxpy, ccopy, cgemv, cgerc, cgeru, clacgv
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. Executable Statements ..
*
*     Any SIDE other than 'L' falls through to the C * H branch; SIDE
*     is not validated here.  In both branches tau = 0 means H = I and
*     C is left untouched.
*
      IF( lsame( side, 'L' ) ) THEN
*
*        Form  H * C
*
         IF( tau.NE.zero ) THEN
*
*           w( 1:n ) = conjg( C( 1, 1:n ) )
*           (row 1 of C is copied with stride ldc, then conjugated)
*
            CALL ccopy( n, c, ldc, work, 1 )
            CALL clacgv( n, work, 1 )
*
*           w( 1:n ) = conjg( w( 1:n ) + C( m-l+1:m, 1:n )**H * v( 1:l ) )
*
            CALL cgemv( 'Conjugate transpose', l, n, one, c( m-l+1, 1 ),
     $                  ldc, v, incv, one, work, 1 )
            CALL clacgv( n, work, 1 )
*
*           C( 1, 1:n ) = C( 1, 1:n ) - tau * w( 1:n )
*
            CALL caxpy( n, -tau, work, 1, c, ldc )
*
*           C( m-l+1:m, 1:n ) = C( m-l+1:m, 1:n ) - ...
*                               tau * v( 1:l ) * w( 1:n )**T
*           (CGERU is the unconjugated rank-1 update; w already holds
*           the conjugated quantity from the step above)
*
            CALL cgeru( l, n, -tau, v, incv, work, 1, c( m-l+1, 1 ),
     $                  ldc )
         END IF
*
      ELSE
*
*        Form  C * H
*
         IF( tau.NE.zero ) THEN
*
*           w( 1:m ) = C( 1:m, 1 )
*
            CALL ccopy( m, c, 1, work, 1 )
*
*           w( 1:m ) = w( 1:m ) + C( 1:m, n-l+1:n ) * v( 1:l )
*
            CALL cgemv( 'No transpose', m, l, one, c( 1, n-l+1 ), ldc,
     $                  v, incv, one, work, 1 )
*
*           C( 1:m, 1 ) = C( 1:m, 1 ) - tau * w( 1:m )
*
            CALL caxpy( m, -tau, work, 1, c, 1 )
*
*           C( 1:m, n-l+1:n ) = C( 1:m, n-l+1:n ) - ...
*                               tau * w( 1:m ) * v( 1:l )**H
*           (CGERC is the conjugated rank-1 update)
*
            CALL cgerc( m, l, -tau, work, 1, v, incv, c( 1, n-l+1 ),
     $                  ldc )
*
         END IF
*
      END IF
*
      RETURN
*
*     End of CLARZ
*

◆ clarzb()

subroutine clarzb	(	character	side,
		character	trans,
		character	direct,
		character	storev,
		integer	m,
		integer	n,
		integer	k,
		integer	l,
		complex, dimension( ldv, * )	v,
		integer	ldv,
		complex, dimension( ldt, * )	t,
		integer	ldt,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( ldwork, * )	work,
		integer	ldwork )

CLARZB applies a block reflector or its conjugate-transpose to a general matrix.

Download CLARZB + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CLARZB applies a complex block reflector H or its conjugate transpose
!> H**H to a complex M-by-N matrix C from the left or the right.
!>
!> Currently, only STOREV = 'R' and DIRECT = 'B' are supported.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply H or H**H from the Left !> = 'R': apply H or H**H from the Right !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': apply H (No transpose) !> = 'C': apply H**H (Conjugate transpose) !>
[in]	DIRECT	!> DIRECT is CHARACTER*1 !> Indicates how H is formed from a product of elementary !> reflectors !> = 'F': H = H(1) H(2) . . . H(k) (Forward, not supported yet) !> = 'B': H = H(k) . . . H(2) H(1) (Backward) !>
[in]	STOREV	!> STOREV is CHARACTER*1 !> Indicates how the vectors which define the elementary !> reflectors are stored: !> = 'C': Columnwise (not supported yet) !> = 'R': Rowwise !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. !>
[in]	K	!> K is INTEGER !> The order of the matrix T (= the number of elementary !> reflectors whose product defines the block reflector). !>
[in]	L	!> L is INTEGER !> The number of columns of the matrix V containing the !> meaningful part of the Householder reflectors. !> If SIDE = 'L', M >= L >= 0, if SIDE = 'R', N >= L >= 0. !>
[in]	V	!> V is COMPLEX array, dimension (LDV,NV). !> If STOREV = 'C', NV = K; if STOREV = 'R', NV = L. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of the array V. !> If STOREV = 'C', LDV >= L; if STOREV = 'R', LDV >= K. !>
[in]	T	!> T is COMPLEX array, dimension (LDT,K) !> The triangular K-by-K matrix T in the representation of the !> block reflector. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= K. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by H*C or H**H*C or C*H or C*H**H. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (LDWORK,K) !>
[in]	LDWORK	!> LDWORK is INTEGER !> The leading dimension of the array WORK. !> If SIDE = 'L', LDWORK >= max(1,N); !> if SIDE = 'R', LDWORK >= max(1,M). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: A. Petitet, Computer Science Dept., Univ. of Tenn., Knoxville, USA

Further Details:

!>

Definition at line 181 of file clarzb.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Applies a block reflector, given by the rowwise vectors V and the
*     lower triangular factor T, to C in place.  Only the first K and
*     the last L rows (SIDE = 'L') or columns (SIDE = 'R') of C are
*     touched.  WORK is used as an N-by-K (left) or M-by-K (right)
*     scratch matrix W.  The comments below describe each BLAS call
*     exactly as it is issued.
*
*     .. Scalar Arguments ..
      CHARACTER          DIRECT, SIDE, STOREV, TRANS
      INTEGER            K, L, LDC, LDT, LDV, LDWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            C( LDC, * ), T( LDT, * ), V( LDV, * ),
     $                   WORK( LDWORK, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE
      parameter( one = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      CHARACTER          TRANST
      INTEGER            I, INFO, J
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           ccopy, cgemm, clacgv, ctrmm, xerbla
*     ..
*     .. Executable Statements ..
*
*     Quick return if possible
*     (this happens before the option checks, so unsupported DIRECT or
*     STOREV values are not reported when m <= 0 or n <= 0)
*
      IF( m.LE.0 .OR. n.LE.0 )
     $   RETURN
*
*     Check for currently supported options
*     (INFO is a local variable: errors are signalled through XERBLA
*     only, with the positions of DIRECT (3) and STOREV (4))
*
      info = 0
      IF( .NOT.lsame( direct, 'B' ) ) THEN
         info = -3
      ELSE IF( .NOT.lsame( storev, 'R' ) ) THEN
         info = -4
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CLARZB', -info )
         RETURN
      END IF
*
*     TRANST is the opposite of TRANS; it is used only in the left-side
*     triangular multiply below.
*
      IF( lsame( trans, 'N' ) ) THEN
         transt = 'C'
      ELSE
         transt = 'N'
      END IF
*
      IF( lsame( side, 'L' ) ) THEN
*
*        Form  H * C  or  H**H * C
*
*        W( 1:n, 1:k ) = C( 1:k, 1:n )**T
*        (row j of C is copied into column j of W, no conjugation)
*
         DO 10 j = 1, k
            CALL ccopy( n, c( j, 1 ), ldc, work( 1, j ), 1 )
   10    CONTINUE
*
*        W( 1:n, 1:k ) = W( 1:n, 1:k ) + ...
*                        C( m-l+1:m, 1:n )**T * V( 1:k, 1:l )**H
*
         IF( l.GT.0 )
     $      CALL cgemm( 'Transpose', 'Conjugate transpose', n, k, l,
     $                  one, c( m-l+1, 1 ), ldc, v, ldv, one, work,
     $                  ldwork )
*
*        W( 1:n, 1:k ) = W( 1:n, 1:k ) * T**H  (TRANS = 'N')  or
*                        W( 1:n, 1:k ) * T     (otherwise)
*
         CALL ctrmm( 'Right', 'Lower', transt, 'Non-unit', n, k, one, t,
     $               ldt, work, ldwork )
*
*        C( 1:k, 1:n ) = C( 1:k, 1:n ) - W( 1:n, 1:k )**T
*
         DO 30 j = 1, n
            DO 20 i = 1, k
               c( i, j ) = c( i, j ) - work( j, i )
   20       CONTINUE
   30    CONTINUE
*
*        C( m-l+1:m, 1:n ) = C( m-l+1:m, 1:n ) - ...
*                            V( 1:k, 1:l )**T * W( 1:n, 1:k )**T
*
         IF( l.GT.0 )
     $      CALL cgemm( 'Transpose', 'Transpose', l, n, k, -one, v, ldv,
     $                  work, ldwork, one, c( m-l+1, 1 ), ldc )
*
      ELSE IF( lsame( side, 'R' ) ) THEN
*
*        Form  C * H  or  C * H**H
*
*        W( 1:m, 1:k ) = C( 1:m, 1:k )
*
         DO 40 j = 1, k
            CALL ccopy( m, c( 1, j ), 1, work( 1, j ), 1 )
   40    CONTINUE
*
*        W( 1:m, 1:k ) = W( 1:m, 1:k ) + ...
*                        C( 1:m, n-l+1:n ) * V( 1:k, 1:l )**T
*
         IF( l.GT.0 )
     $      CALL cgemm( 'No transpose', 'Transpose', m, k, l, one,
     $                  c( 1, n-l+1 ), ldc, v, ldv, one, work, ldwork )
*
*        W( 1:m, 1:k ) = W( 1:m, 1:k ) * conjg( T )  (TRANS = 'N')  or
*                        W( 1:m, 1:k ) * T**T        (TRANS = 'C')
*        The lower triangle of T is conjugated in place column by
*        column, used in the multiply, then conjugated back so T is
*        unchanged on exit.
*
         DO 50 j = 1, k
            CALL clacgv( k-j+1, t( j, j ), 1 )
   50    CONTINUE
         CALL ctrmm( 'Right', 'Lower', trans, 'Non-unit', m, k, one, t,
     $               ldt, work, ldwork )
         DO 60 j = 1, k
            CALL clacgv( k-j+1, t( j, j ), 1 )
   60    CONTINUE
*
*        C( 1:m, 1:k ) = C( 1:m, 1:k ) - W( 1:m, 1:k )
*
         DO 80 j = 1, k
            DO 70 i = 1, m
               c( i, j ) = c( i, j ) - work( i, j )
   70       CONTINUE
   80    CONTINUE
*
*        C( 1:m, n-l+1:n ) = C( 1:m, n-l+1:n ) - ...
*                            W( 1:m, 1:k ) * conjg( V( 1:k, 1:l ) )
*        V is conjugated in place for the product and restored after.
*
         DO 90 j = 1, l
            CALL clacgv( k, v( 1, j ), 1 )
   90    CONTINUE
         IF( l.GT.0 )
     $      CALL cgemm( 'No transpose', 'No transpose', m, l, k, -one,
     $                  work, ldwork, v, ldv, one, c( 1, n-l+1 ), ldc )
         DO 100 j = 1, l
            CALL clacgv( k, v( 1, j ), 1 )
  100    CONTINUE
*
      END IF
*
*     A SIDE that is neither 'L' nor 'R' reaches this point with C
*     unchanged and no error reported.
*
      RETURN
*
*     End of CLARZB
*

◆ clarzt()

subroutine clarzt	(	character	direct,
		character	storev,
		integer	n,
		integer	k,
		complex, dimension( ldv, * )	v,
		integer	ldv,
		complex, dimension( * )	tau,
		complex, dimension( ldt, * )	t,
		integer	ldt )

CLARZT forms the triangular factor T of a block reflector H = I - V*T*V**H.

Download CLARZT + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CLARZT forms the triangular factor T of a complex block reflector
!> H of order > n, which is defined as a product of k elementary
!> reflectors.
!>
!> If DIRECT = 'F', H = H(1) H(2) . . . H(k) and T is upper triangular;
!>
!> If DIRECT = 'B', H = H(k) . . . H(2) H(1) and T is lower triangular.
!>
!> If STOREV = 'C', the vector which defines the elementary reflector
!> H(i) is stored in the i-th column of the array V, and
!>
!>    H  =  I - V * T * V**H
!>
!> If STOREV = 'R', the vector which defines the elementary reflector
!> H(i) is stored in the i-th row of the array V, and
!>
!>    H  =  I - V**H * T * V
!>
!> Currently, only STOREV = 'R' and DIRECT = 'B' are supported.
!>

Parameters

[in]	DIRECT	!> DIRECT is CHARACTER*1 !> Specifies the order in which the elementary reflectors are !> multiplied to form the block reflector: !> = 'F': H = H(1) H(2) . . . H(k) (Forward, not supported yet) !> = 'B': H = H(k) . . . H(2) H(1) (Backward) !>
[in]	STOREV	!> STOREV is CHARACTER*1 !> Specifies how the vectors which define the elementary !> reflectors are stored (see also Further Details): !> = 'C': columnwise (not supported yet) !> = 'R': rowwise !>
[in]	N	!> N is INTEGER !> The order of the block reflector H. N >= 0. !>
[in]	K	!> K is INTEGER !> The order of the triangular factor T (= the number of !> elementary reflectors). K >= 1. !>
[in,out]	V	!> V is COMPLEX array, dimension !> (LDV,K) if STOREV = 'C' !> (LDV,N) if STOREV = 'R' !> The matrix V. See further details. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of the array V. !> If STOREV = 'C', LDV >= max(1,N); if STOREV = 'R', LDV >= K. !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i). !>
[out]	T	!> T is COMPLEX array, dimension (LDT,K) !> The k by k triangular factor T of the block reflector. !> If DIRECT = 'F', T is upper triangular; if DIRECT = 'B', T is !> lower triangular. The rest of the array is not used. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= K. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: A. Petitet, Computer Science Dept., Univ. of Tenn., Knoxville, USA

Further Details:

!>
!>  The shape of the matrix V and the storage of the vectors which define
!>  the H(i) is best illustrated by the following example with n = 5 and
!>  k = 3. The elements equal to 1 are not stored; the corresponding
!>  array elements are modified but restored on exit. The rest of the
!>  array is not used.
!>
!>  DIRECT = 'F' and STOREV = 'C':         DIRECT = 'F' and STOREV = 'R':
!>
!>                                              ______V_____
!>         ( v1 v2 v3 )                        /            \
!>         ( v1 v2 v3 )                      ( v1 v1 v1 v1 v1 . . . . 1 )
!>     V = ( v1 v2 v3 )                      ( v2 v2 v2 v2 v2 . . . 1   )
!>         ( v1 v2 v3 )                      ( v3 v3 v3 v3 v3 . . 1     )
!>         ( v1 v2 v3 )
!>            .  .  .
!>            .  .  .
!>            1  .  .
!>               1  .
!>                  1
!>
!>  DIRECT = 'B' and STOREV = 'C':         DIRECT = 'B' and STOREV = 'R':
!>
!>                                                        ______V_____
!>            1                                          /            \
!>            .  1                           ( 1 . . . . v1 v1 v1 v1 v1 )
!>            .  .  1                        ( . 1 . . . v2 v2 v2 v2 v2 )
!>            .  .  .                        ( . . 1 . . v3 v3 v3 v3 v3 )
!>            .  .  .
!>         ( v1 v2 v3 )
!>         ( v1 v2 v3 )
!>     V = ( v1 v2 v3 )
!>         ( v1 v2 v3 )
!>         ( v1 v2 v3 )
!>

Definition at line 184 of file clarzt.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Builds the lower triangular K-by-K factor T column by column,
*     from column K back to column 1, using the rows of V and the
*     scalars TAU.  Only DIRECT = 'B' with STOREV = 'R' is accepted.
*
*     .. Scalar Arguments ..
      CHARACTER          DIRECT, STOREV
      INTEGER            K, LDT, LDV, N
*     ..
*     .. Array Arguments ..
      COMPLEX            T( LDT, * ), TAU( * ), V( LDV, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ZERO
      parameter( zero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      INTEGER            I, INFO, J
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgemv, clacgv, ctrmv, xerbla
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. Executable Statements ..
*
*     Check for currently supported options
*     (INFO is local; a bad option is reported through XERBLA with the
*     argument position, 1 for DIRECT or 2 for STOREV, and the routine
*     returns without touching T)
*
      info = 0
      IF( .NOT.lsame( direct, 'B' ) ) THEN
         info = -1
      ELSE IF( .NOT.lsame( storev, 'R' ) ) THEN
         info = -2
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CLARZT', -info )
         RETURN
      END IF
*
*     Columns are processed from last to first because column i needs
*     the already finished trailing block T(i+1:k,i+1:k).
*
      DO 20 i = k, 1, -1
         IF( tau( i ).EQ.zero ) THEN
*
*           H(i)  =  I
*           (column i of T is zeroed from the diagonal down)
*
            DO 10 j = i, k
               t( j, i ) = zero
   10       CONTINUE
         ELSE
*
*           general case
*
            IF( i.LT.k ) THEN
*
*              T(i+1:k,i) = - tau(i) * V(i+1:k,1:n) * V(i,1:n)**H
*              (row i of V is conjugated in place for the product and
*              restored by the second CLACGV call)
*
               CALL clacgv( n, v( i, 1 ), ldv )
               CALL cgemv( 'No transpose', k-i, n, -tau( i ),
     $                     v( i+1, 1 ), ldv, v( i, 1 ), ldv, zero,
     $                     t( i+1, i ), 1 )
               CALL clacgv( n, v( i, 1 ), ldv )
*
*              T(i+1:k,i) = T(i+1:k,i+1:k) * T(i+1:k,i)
*
               CALL ctrmv( 'Lower', 'No transpose', 'Non-unit', k-i,
     $                     t( i+1, i+1 ), ldt, t( i+1, i ), 1 )
            END IF
*
*           The diagonal entry of column i is tau(i) itself.
*
            t( i, i ) = tau( i )
         END IF
   20 CONTINUE
      RETURN
*
*     End of CLARZT
*

◆ clascl2()

subroutine clascl2	(	integer	m,
		integer	n,
		real, dimension( * )	d,
		complex, dimension( ldx, * )	x,
		integer	ldx )

CLASCL2 performs diagonal scaling on a vector.

Download CLASCL2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CLASCL2 performs a diagonal scaling on a vector:
!>   x <-- D * x
!> where the diagonal REAL matrix D is stored as a vector.
!>
!> Eventually to be replaced by BLAS_cge_diag_scale in the new BLAS
!> standard.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of D and X. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of X. N >= 0. !>
[in]	D	!> D is REAL array, length M !> Diagonal matrix D, stored as a vector of length M. !>
[in,out]	X	!> X is COMPLEX array, dimension (LDX,N) !> On entry, the vector X to be scaled by D. !> On exit, the scaled vector. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the vector X. LDX >= M. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 90 of file clascl2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Row scaling of X by the real vector D:
*        X( i, j ) <- X( i, j ) * D( i ),   i = 1..M,  j = 1..N.
*
*     .. Scalar Arguments ..
      INTEGER            M, N, LDX
*     ..
*     .. Array Arguments ..
      REAL               D( * )
      COMPLEX            X( LDX, * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            JCOL
*     ..
*     .. Executable Statements ..
*
*     Walk the columns of X; each column is multiplied element by
*     element by the leading M entries of D in one section assignment.
*
      DO jcol = 1, n
         x( 1:m, jcol ) = x( 1:m, jcol ) * d( 1:m )
      END DO
*
      RETURN

◆ clatrz()

subroutine clatrz	(	integer	m,
		integer	n,
		integer	l,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( * )	work )

CLATRZ factors an upper trapezoidal matrix by means of unitary transformations.

Download CLATRZ + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CLATRZ factors the M-by-(M+L) complex upper trapezoidal matrix
!> [ A1 A2 ] = [ A(1:M,1:M) A(1:M,N-L+1:N) ] as ( R  0 ) * Z by means
!> of unitary transformations, where  Z is an (M+L)-by-(M+L) unitary
!> matrix and, R and A1 are M-by-M upper triangular matrices.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in]	L	!> L is INTEGER !> The number of columns of the matrix A containing the !> meaningful part of the Householder vectors. N-M >= L >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the leading M-by-N upper trapezoidal part of the !> array A must contain the matrix to be factorized. !> On exit, the leading M-by-M upper triangular part of A !> contains the upper triangular matrix R, and elements N-L+1 to !> N of the first M rows of A, with the array TAU, represent the !> unitary matrix Z as a product of M elementary reflectors. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	TAU	!> TAU is COMPLEX array, dimension (M) !> The scalar factors of the elementary reflectors. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (M) !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: A. Petitet, Computer Science Dept., Univ. of Tenn., Knoxville, USA

Further Details:

!>
!>  The factorization is obtained by Householder's method.  The kth
!>  transformation matrix, Z( k ), which is used to introduce zeros into
!>  the ( m - k + 1 )th row of A, is given in the form
!>
!>     Z( k ) = ( I     0   ),
!>              ( 0  T( k ) )
!>
!>  where
!>
!>     T( k ) = I - tau*u( k )*u( k )**H,   u( k ) = (   1    ),
!>                                                 (   0    )
!>                                                 ( z( k ) )
!>
!>  tau is a scalar and z( k ) is an l element vector. tau and z( k )
!>  are chosen to annihilate the elements of the kth row of A2.
!>
!>  The scalar tau is returned in the kth element of TAU and the vector
!>  u( k ) in the kth row of A2, such that the elements of z( k ) are
!>  in a( k, n - l + 1 ), ..., a( k, n ). The elements of R are returned in
!>  the upper triangular part of A1.
!>
!>  Z is given by
!>
!>     Z =  Z( 1 ) * Z( 2 ) * ... * Z( m ).
!>

Definition at line 139 of file clatrz.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Row-by-row reduction of the trapezoidal matrix [ A1 A2 ] to
*     ( R 0 ): for each row, bottom to top, one reflector is generated
*     with CLARFG and applied to the rows above it with CLARZ.
*
*     .. Scalar Arguments ..
      INTEGER            L, LDA, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ZERO
      PARAMETER          ( ZERO = ( 0.0E+0, 0.0E+0 ) )
*     ..
*     .. Local Scalars ..
      INTEGER            JZ, K
      COMPLEX            ALPHA
*     ..
*     .. External Subroutines ..
      EXTERNAL           CLACGV, CLARFG, CLARZ
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          CONJG
*     ..
*     .. Executable Statements ..
*
*     Nothing to do when A has no rows.
*
      IF( M.EQ.0 ) RETURN
*
*     Square case: no reflector is generated, only TAU(1:N) is
*     cleared (tau = 0 makes T(k) = I - tau*u*u**H the identity).
*
      IF( M.EQ.N ) THEN
         TAU( 1:N ) = ZERO
         RETURN
      END IF
*
*     JZ is the first column of the trailing L-column block
*     A(:,N-L+1:N) that holds the vectors z(k).
*
      JZ = N - L + 1
*
*     Process the rows from the last one up to the first.
*
      DO K = M, 1, -1
*
*        Generate elementary reflector H(K) to annihilate
*        [ A(K,K) A(K,N-L+1:N) ].  The row segment is passed through
*        CLACGV and A(K,K) is conjugated before CLARFG is called;
*        the TAU(K) returned by CLARFG is stored conjugated.
*
         CALL CLACGV( L, A( K, JZ ), LDA )
         ALPHA = CONJG( A( K, K ) )
         CALL CLARFG( L+1, ALPHA, A( K, JZ ), LDA, TAU( K ) )
         TAU( K ) = CONJG( TAU( K ) )
*
*        Apply H(K) to A(1:K-1,K:N) from the right.  CLARZ receives
*        the conjugate of the stored TAU(K), i.e. the value CLARFG
*        produced.
*
         CALL CLARZ( 'Right', K-1, N-K+1, L, A( K, JZ ), LDA,
     $               CONJG( TAU( K ) ), A( 1, K ), LDA, WORK )
*
*        Write the conjugate of ALPHA (as updated by CLARFG) back
*        to the diagonal.
*
         A( K, K ) = CONJG( ALPHA )
*
      END DO
*
      RETURN
*
*     End of CLATRZ
*

◆ clatzm()

subroutine clatzm	(	character	side,
		integer	m,
		integer	n,
		complex, dimension( * )	v,
		integer	incv,
		complex	tau,
		complex, dimension( ldc, * )	c1,
		complex, dimension( ldc, * )	c2,
		integer	ldc,
		complex, dimension( * )	work )

CLATZM

Download CLATZM + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> This routine is deprecated and has been replaced by routine CUNMRZ.
!>
!> CLATZM applies a Householder matrix generated by CTZRQF to a matrix.
!>
!> Let P = I - tau*u*u**H,   u = ( 1 ),
!>                               ( v )
!> where v is an (m-1) vector if SIDE = 'L', or a (n-1) vector if
!> SIDE = 'R'.
!>
!> If SIDE equals 'L', let
!>        C = [ C1 ] 1
!>            [ C2 ] m-1
!>              n
!> Then C is overwritten by P*C.
!>
!> If SIDE equals 'R', let
!>        C = [ C1, C2 ] m
!>               1  n-1
!> Then C is overwritten by C*P.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': form P * C !> = 'R': form C * P !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. !>
[in]	V	!> V is COMPLEX array, dimension !> (1 + (M-1)*abs(INCV)) if SIDE = 'L' !> (1 + (N-1)*abs(INCV)) if SIDE = 'R' !> The vector v in the representation of P. V is not used !> if TAU = 0. !>
[in]	INCV	!> INCV is INTEGER !> The increment between elements of v. INCV <> 0 !>
[in]	TAU	!> TAU is COMPLEX !> The value tau in the representation of P. !>
[in,out]	C1	!> C1 is COMPLEX array, dimension !> (LDC,N) if SIDE = 'L' !> (M,1) if SIDE = 'R' !> On entry, the n-vector C1 if SIDE = 'L', or the m-vector C1 !> if SIDE = 'R'. !> !> On exit, the first row of P*C if SIDE = 'L', or the first !> column of C*P if SIDE = 'R'. !>
[in,out]	C2	!> C2 is COMPLEX array, dimension !> (LDC, N) if SIDE = 'L' !> (LDC, N-1) if SIDE = 'R' !> On entry, the (m - 1) x n matrix C2 if SIDE = 'L', or the !> m x (n - 1) matrix C2 if SIDE = 'R'. !> !> On exit, rows 2:m of P*C if SIDE = 'L', or columns 2:n of C*P !> if SIDE = 'R'. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the arrays C1 and C2. !> LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension !> (N) if SIDE = 'L' !> (M) if SIDE = 'R' !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 151 of file clatzm.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Applies P = I - tau*u*u**H, u = ( 1, v ), to the matrix that is
*     split into C1 and C2: from the left when SIDE = 'L', from the
*     right when SIDE = 'R'.  Any other SIDE leaves C1 and C2 alone.
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE
      INTEGER            INCV, LDC, M, N
      COMPLEX            TAU
*     ..
*     .. Array Arguments ..
      COMPLEX            C1( LDC, * ), C2( LDC, * ), V( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE, ZERO
      PARAMETER          ( ONE = ( 1.0E+0, 0.0E+0 ),
     $                   ZERO = ( 0.0E+0, 0.0E+0 ) )
*     ..
*     .. Local Scalars ..
      COMPLEX            NEGTAU
*     ..
*     .. External Subroutines ..
      EXTERNAL           CAXPY, CCOPY, CGEMV, CGERC, CGERU, CLACGV
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           LSAME
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MIN
*     ..
*     .. Executable Statements ..
*
*     Quick returns: an empty matrix, or tau = 0 (P is the identity).
*
      IF( MIN( M, N ).EQ.0 ) RETURN
      IF( TAU.EQ.ZERO ) RETURN
*
*     Every update below is scaled by -tau.
*
      NEGTAU = -TAU
*
      IF( LSAME( SIDE, 'L' ) ) THEN
*
*        Left application.  Build w := ( C1 + v**H * C2 )**H in WORK:
*        copy the row C1, pass it through CLACGV, then accumulate
*        C2**H * v on top of it.
*
         CALL CCOPY( N, C1, LDC, WORK, 1 )
         CALL CLACGV( N, WORK, 1 )
         CALL CGEMV( 'Conjugate transpose', M-1, N, ONE, C2, LDC, V,
     $               INCV, ONE, WORK, 1 )
*
*        [ C1 ] := [ C1 ] - tau* [ 1 ] * w**H
*        [ C2 ]    [ C2 ]        [ v ]
*
*        WORK is passed through CLACGV once more so that it holds
*        w**H, which allows the unconjugated rank-1 update CGERU.
*
         CALL CLACGV( N, WORK, 1 )
         CALL CAXPY( N, NEGTAU, WORK, 1, C1, LDC )
         CALL CGERU( M-1, N, NEGTAU, V, INCV, WORK, 1, C2, LDC )
*
      ELSE IF( LSAME( SIDE, 'R' ) ) THEN
*
*        Right application.  w := C1 + C2 * v
*
         CALL CCOPY( M, C1, 1, WORK, 1 )
         CALL CGEMV( 'No transpose', M, N-1, ONE, C2, LDC, V, INCV, ONE,
     $               WORK, 1 )
*
*        [ C1, C2 ] := [ C1, C2 ] - tau* w * [ 1 , v**H]
*
         CALL CAXPY( M, NEGTAU, WORK, 1, C1, 1 )
         CALL CGERC( M, N-1, NEGTAU, WORK, 1, V, INCV, C2, LDC )
      END IF
*
      RETURN
*
*     End of CLATZM
*

◆ cpbcon()

subroutine cpbcon	(	character	uplo,
		integer	n,
		integer	kd,
		complex, dimension( ldab, * )	ab,
		integer	ldab,
		real	anorm,
		real	rcond,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CPBCON

Download CPBCON + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPBCON estimates the reciprocal of the condition number (in the
!> 1-norm) of a complex Hermitian positive definite band matrix using
!> the Cholesky factorization A = U**H*U or A = L*L**H computed by
!> CPBTRF.
!>
!> An estimate is obtained for norm(inv(A)), and the reciprocal of the
!> condition number is computed as RCOND = 1 / (ANORM * norm(inv(A))).
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangular factor stored in AB; !> = 'L': Lower triangular factor stored in AB. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of superdiagonals of the matrix A if UPLO = 'U', !> or the number of sub-diagonals if UPLO = 'L'. KD >= 0. !>
[in]	AB	!> AB is COMPLEX array, dimension (LDAB,N) !> The triangular factor U or L from the Cholesky factorization !> A = U**H*U or A = L*L**H of the band matrix A, stored in the !> first KD+1 rows of the array. The j-th column of U or L is !> stored in the j-th column of the array AB as follows: !> if UPLO ='U', AB(kd+1+i-j,j) = U(i,j) for max(1,j-kd)<=i<=j; !> if UPLO ='L', AB(1+i-j,j) = L(i,j) for j<=i<=min(n,j+kd). !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[in]	ANORM	!> ANORM is REAL !> The 1-norm (or infinity-norm) of the Hermitian band matrix A. !>
[out]	RCOND	!> RCOND is REAL !> The reciprocal of the condition number of the matrix A, !> computed as RCOND = 1/(ANORM * AINVNM), where AINVNM is an !> estimate of the 1-norm of inv(A) computed in this routine. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 131 of file cpbcon.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Reciprocal condition number estimate for a factored Hermitian
*     positive definite band matrix: norm(inv(A)) is estimated through
*     the reverse-communication routine CLACN2, each request being
*     answered by two scaled triangular band solves (CLATBS).
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, KD, LDAB, N
      REAL               ANORM, RCOND
*     ..
*     .. Array Arguments ..
      REAL               RWORK( * )
      COMPLEX            AB( LDAB, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      PARAMETER          ( ONE = 1.0E+0, ZERO = 0.0E+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      CHARACTER          NORMIN
      INTEGER            IMAX, KASE
      REAL               AINVNM, SCALE1, SCALE2, SCLTOT, SMLNUM
      COMPLEX            ZDUM
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ICAMAX
      REAL               SLAMCH
      EXTERNAL           LSAME, ICAMAX, SLAMCH
*     ..
*     .. External Subroutines ..
      EXTERNAL           CLACN2, CLATBS, CSRSCL, XERBLA
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          ABS, AIMAG, REAL
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
*     CABS1 is the cheap modulus |Re(z)| + |Im(z)|.
      CABS1( ZDUM ) = ABS( REAL( ZDUM ) ) + ABS( AIMAG( ZDUM ) )
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; the first offending one (in argument
*     order) determines INFO.
*
      INFO = 0
      UPPER = LSAME( UPLO, 'U' )
      IF( .NOT.( UPPER .OR. LSAME( UPLO, 'L' ) ) ) THEN
         INFO = -1
      ELSE IF( N.LT.0 ) THEN
         INFO = -2
      ELSE IF( KD.LT.0 ) THEN
         INFO = -3
      ELSE IF( LDAB.LT.KD+1 ) THEN
         INFO = -5
      ELSE IF( ANORM.LT.ZERO ) THEN
         INFO = -6
      END IF
      IF( INFO.NE.0 ) THEN
         CALL XERBLA( 'CPBCON', -INFO )
         RETURN
      END IF
*
*     Quick returns: RCOND = 1 for an empty matrix, RCOND = 0 when
*     ANORM is zero.  RCOND also stays 0 on the bail-out path below.
*
      RCOND = ZERO
      IF( N.EQ.0 ) THEN
         RCOND = ONE
         RETURN
      END IF
      IF( ANORM.EQ.ZERO ) RETURN
*
      SMLNUM = SLAMCH( 'Safe minimum' )
*
*     Estimate the 1-norm of the inverse.  CLACN2 is called until it
*     reports KASE = 0; for every other KASE the vector in WORK(1:N)
*     is overwritten by inv(A) times itself via two band solves.
*
      KASE = 0
      NORMIN = 'N'
      DO
         CALL CLACN2( N, WORK( N+1 ), WORK, AINVNM, KASE, ISAVE )
         IF( KASE.EQ.0 ) EXIT
*
         IF( UPPER ) THEN
*
*           Multiply by inv(U**H).
*
            CALL CLATBS( 'Upper', 'Conjugate transpose', 'Non-unit',
     $                   NORMIN, N, KD, AB, LDAB, WORK, SCALE1, RWORK,
     $                   INFO )
            NORMIN = 'Y'
*
*           Multiply by inv(U).
*
            CALL CLATBS( 'Upper', 'No transpose', 'Non-unit', NORMIN,
     $                   N, KD, AB, LDAB, WORK, SCALE2, RWORK, INFO )
         ELSE
*
*           Multiply by inv(L).
*
            CALL CLATBS( 'Lower', 'No transpose', 'Non-unit', NORMIN,
     $                   N, KD, AB, LDAB, WORK, SCALE1, RWORK, INFO )
            NORMIN = 'Y'
*
*           Multiply by inv(L**H).
*
            CALL CLATBS( 'Lower', 'Conjugate transpose', 'Non-unit',
     $                   NORMIN, N, KD, AB, LDAB, WORK, SCALE2, RWORK,
     $                   INFO )
         END IF
*
*        Multiply by 1/SCALE if doing so will not cause overflow.
*        Otherwise give up and return with RCOND still zero.
*
         SCLTOT = SCALE1*SCALE2
         IF( SCLTOT.NE.ONE ) THEN
            IMAX = ICAMAX( N, WORK, 1 )
            IF( SCLTOT.LT.CABS1( WORK( IMAX ) )*SMLNUM .OR.
     $          SCLTOT.EQ.ZERO ) RETURN
            CALL CSRSCL( N, SCLTOT, WORK, 1 )
         END IF
      END DO
*
*     Compute the estimate of the reciprocal condition number.
*
      IF( AINVNM.NE.ZERO ) RCOND = ( ONE / AINVNM ) / ANORM
*
      RETURN
*
*     End of CPBCON
*

◆ cpbequ()

subroutine cpbequ	(	character	uplo,
		integer	n,
		integer	kd,
		complex, dimension( ldab, * )	ab,
		integer	ldab,
		real, dimension( * )	s,
		real	scond,
		real	amax,
		integer	info )

CPBEQU

Download CPBEQU + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPBEQU computes row and column scalings intended to equilibrate a
!> Hermitian positive definite band matrix A and reduce its condition
!> number (with respect to the two-norm).  S contains the scale factors,
!> S(i) = 1/sqrt(A(i,i)), chosen so that the scaled matrix B with
!> elements B(i,j) = S(i)*A(i,j)*S(j) has ones on the diagonal.  This
!> choice of S puts the condition number of B within a factor N of the
!> smallest possible condition number over all possible diagonal
!> scalings.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangular of A is stored; !> = 'L': Lower triangular of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of superdiagonals of the matrix A if UPLO = 'U', !> or the number of subdiagonals if UPLO = 'L'. KD >= 0. !>
[in]	AB	!> AB is COMPLEX array, dimension (LDAB,N) !> The upper or lower triangle of the Hermitian band matrix A, !> stored in the first KD+1 rows of the array. The j-th column !> of A is stored in the j-th column of the array AB as follows: !> if UPLO = 'U', AB(kd+1+i-j,j) = A(i,j) for max(1,j-kd)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+kd). !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[out]	S	!> S is REAL array, dimension (N) !> If INFO = 0, S contains the scale factors for A. !>
[out]	SCOND	!> SCOND is REAL !> If INFO = 0, SCOND contains the ratio of the smallest S(i) to !> the largest S(i). If SCOND >= 0.1 and AMAX is neither too !> large nor too small, it is not worth scaling by S. !>
[out]	AMAX	!> AMAX is REAL !> Absolute value of largest matrix element. If AMAX is very !> close to overflow or very close to underflow, the matrix !> should be scaled. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: if INFO = i, the i-th diagonal element is nonpositive. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 129 of file cpbequ.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Derives the scale factors S(i) = 1/sqrt(A(i,i)) from the
*     diagonal of the band matrix held in AB and reports SCOND and
*     AMAX; a non-positive diagonal entry is flagged through INFO.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, KD, LDAB, N
      REAL               AMAX, SCOND
*     ..
*     .. Array Arguments ..
      REAL               S( * )
      COMPLEX            AB( LDAB, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE
      PARAMETER          ( ZERO = 0.0E+0, ONE = 1.0E+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            I, JD
      REAL               SMIN
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           LSAME
*     ..
*     .. External Subroutines ..
      EXTERNAL           XERBLA
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX, MIN, REAL, SQRT
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; the first offending one (in argument
*     order) determines INFO.
*
      INFO = 0
      UPPER = LSAME( UPLO, 'U' )
      IF( .NOT.( UPPER .OR. LSAME( UPLO, 'L' ) ) ) THEN
         INFO = -1
      ELSE IF( N.LT.0 ) THEN
         INFO = -2
      ELSE IF( KD.LT.0 ) THEN
         INFO = -3
      ELSE IF( LDAB.LT.KD+1 ) THEN
         INFO = -5
      END IF
      IF( INFO.NE.0 ) THEN
         CALL XERBLA( 'CPBEQU', -INFO )
         RETURN
      END IF
*
*     Empty matrix: nothing to scale.
*
      IF( N.EQ.0 ) THEN
         SCOND = ONE
         AMAX = ZERO
         RETURN
      END IF
*
*     JD is the row of AB that stores the diagonal of A: row KD+1 for
*     upper storage, row 1 for lower storage.
*
      IF( UPPER ) THEN
         JD = KD + 1
      ELSE
         JD = 1
      END IF
*
*     Copy the (real parts of the) diagonal into S, then scan it for
*     its smallest and largest entries.
*
      S( 1:N ) = REAL( AB( JD, 1:N ) )
      SMIN = S( 1 )
      AMAX = S( 1 )
      DO I = 2, N
         SMIN = MIN( SMIN, S( I ) )
         AMAX = MAX( AMAX, S( I ) )
      END DO
*
      IF( SMIN.LE.ZERO ) THEN
*
*        Report the index of the first non-positive diagonal element.
*        S keeps the raw diagonal and SCOND is not set on this path.
*
         DO I = 1, N
            IF( S( I ).LE.ZERO ) THEN
               INFO = I
               RETURN
            END IF
         END DO
         RETURN
      END IF
*
*     All diagonal entries are positive: replace them by their
*     reciprocal square roots.
*
      S( 1:N ) = ONE / SQRT( S( 1:N ) )
*
*     Compute SCOND = min(S(I)) / max(S(I))
*
      SCOND = SQRT( SMIN ) / SQRT( AMAX )
      RETURN
*
*     End of CPBEQU
*

◆ cpbrfs()

subroutine cpbrfs	(	character	uplo,
		integer	n,
		integer	kd,
		integer	nrhs,
		complex, dimension( ldab, * )	ab,
		integer	ldab,
		complex, dimension( ldafb, * )	afb,
		integer	ldafb,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldx, * )	x,
		integer	ldx,
		real, dimension( * )	ferr,
		real, dimension( * )	berr,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CPBRFS

Download CPBRFS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPBRFS improves the computed solution to a system of linear
!> equations when the coefficient matrix is Hermitian positive definite
!> and banded, and provides error bounds and backward error estimates
!> for the solution.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of superdiagonals of the matrix A if UPLO = 'U', !> or the number of subdiagonals if UPLO = 'L'. KD >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrices B and X. NRHS >= 0. !>
[in]	AB	!> AB is COMPLEX array, dimension (LDAB,N) !> The upper or lower triangle of the Hermitian band matrix A, !> stored in the first KD+1 rows of the array. The j-th column !> of A is stored in the j-th column of the array AB as follows: !> if UPLO = 'U', AB(kd+1+i-j,j) = A(i,j) for max(1,j-kd)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+kd). !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[in]	AFB	!> AFB is COMPLEX array, dimension (LDAFB,N) !> The triangular factor U or L from the Cholesky factorization !> A = U**H*U or A = L*L**H of the band matrix A as computed by !> CPBTRF, in the same storage format as A (see AB). !>
[in]	LDAFB	!> LDAFB is INTEGER !> The leading dimension of the array AFB. LDAFB >= KD+1. !>
[in]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> The right hand side matrix B. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[in,out]	X	!> X is COMPLEX array, dimension (LDX,NRHS) !> On entry, the solution matrix X, as computed by CPBTRS. !> On exit, the improved solution matrix X. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the array X. LDX >= max(1,N). !>
[out]	FERR	!> FERR is REAL array, dimension (NRHS) !> The estimated forward error bound for each solution vector !> X(j) (the j-th column of the solution matrix X). !> If XTRUE is the true solution corresponding to X(j), FERR(j) !> is an estimated upper bound for the magnitude of the largest !> element in (X(j) - XTRUE) divided by the magnitude of the !> largest element in X(j). The estimate is as reliable as !> the estimate for RCOND, and is almost always a slight !> overestimate of the true error. !>
[out]	BERR	!> BERR is REAL array, dimension (NRHS) !> The componentwise relative backward error of each solution !> vector X(j) (i.e., the smallest relative change in !> any element of A or B that makes X(j) an exact solution). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Internal Parameters:

!>  ITMAX is the maximum number of steps of iterative refinement.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 187 of file cpbrfs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Iterative refinement with error bounds for a Hermitian positive
*     definite band system.  For every right-hand side J the routine
*       1) forms the residual R = B - A*X in WORK(1:N),
*       2) computes the componentwise backward error BERR(J),
*       3) while the stopping test allows, solves A*dx = R with
*          CPBTRS, adds dx to X(:,J) and repeats from 1),
*       4) estimates the forward error bound FERR(J) with CLACN2.
*     Workspace use: WORK(1:N) holds the residual / CLACN2 vector,
*     WORK(N+1:2*N) is handed to CLACN2 as its second array argument,
*     RWORK(1:N) holds abs(A)*abs(X)+abs(B) and later the weights W.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, KD, LDAB, LDAFB, LDB, LDX, N, NRHS
*     ..
*     .. Array Arguments ..
      REAL               BERR( * ), FERR( * ), RWORK( * )
      COMPLEX            AB( LDAB, * ), AFB( LDAFB, * ), B( LDB, * ),
     $                   WORK( * ), X( LDX, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     ITMAX bounds the number of refinement steps per right-hand side.
      INTEGER            ITMAX
      parameter( itmax = 5 )
      REAL               ZERO
      parameter( zero = 0.0e+0 )
*     ONE is COMPLEX because it is passed as a scalar to CHBMV/CAXPY.
      COMPLEX            ONE
      parameter( one = ( 1.0e+0, 0.0e+0 ) )
      REAL               TWO
      parameter( two = 2.0e+0 )
*     THREE is only used as the initial value of LSTRES.
      REAL               THREE
      parameter( three = 3.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            COUNT, I, J, K, KASE, L, NZ
      REAL               EPS, LSTRES, S, SAFE1, SAFE2, SAFMIN, XK
      COMPLEX            ZDUM
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           caxpy, ccopy, chbmv, clacn2, cpbtrs, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, min, real
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SLAMCH
      EXTERNAL           lsame, slamch
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
*     CABS1 is the cheap modulus |Re(z)| + |Im(z)|.
      cabs1( zdum ) = abs( real( zdum ) ) + abs( aimag( zdum ) )
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.  The first offending argument (in
*     argument order) determines INFO.
*
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( kd.LT.0 ) THEN
         info = -3
      ELSE IF( nrhs.LT.0 ) THEN
         info = -4
      ELSE IF( ldab.LT.kd+1 ) THEN
         info = -6
      ELSE IF( ldafb.LT.kd+1 ) THEN
         info = -8
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -10
      ELSE IF( ldx.LT.max( 1, n ) ) THEN
         info = -12
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPBRFS', -info )
         RETURN
      END IF
*
*     Quick return if possible.  With N = 0 there is nothing to
*     refine, so all NRHS error bounds are reported as zero.
*
      IF( n.EQ.0 .OR. nrhs.EQ.0 ) THEN
         DO 10 j = 1, nrhs
            ferr( j ) = zero
            berr( j ) = zero
   10    CONTINUE
         RETURN
      END IF
*
*     NZ = maximum number of nonzero elements in each row of A, plus 1
*
*     SAFE1 and SAFE2 are the thresholds used below to guard the
*     backward-error quotient against tiny denominators.
*
      nz = min( n+1, 2*kd+2 )
      eps = slamch( 'Epsilon' )
      safmin = slamch( 'Safe minimum' )
      safe1 = nz*safmin
      safe2 = safe1 / eps
*
*     Do for each right hand side
*
      DO 140 j = 1, nrhs
*
*        COUNT numbers the current refinement pass.  LSTRES holds the
*        backward error of the previous pass; it starts at THREE so
*        that the "decreased by a factor of 2" test cannot fail on
*        the first pass unless BERR(J) exceeds 1.5.
*
         count = 1
         lstres = three
   20    CONTINUE
*
*        Loop until stopping criterion is satisfied.
*
*        Compute residual R = B - A * X
*
*        WORK(1:N) is loaded with B(:,J) and then updated in place by
*        the Hermitian band product CHBMV.
*
         CALL ccopy( n, b( 1, j ), 1, work, 1 )
         CALL chbmv( uplo, n, kd, -one, ab, ldab, x( 1, j ), 1, one,
     $               work, 1 )
*
*        Compute componentwise relative backward error from formula
*
*        max(i) ( abs(R(i)) / ( abs(A)*abs(X) + abs(B) )(i) )
*
*        where abs(Z) is the componentwise absolute value of the matrix
*        or vector Z.  If the i-th component of the denominator is less
*        than SAFE2, then SAFE1 is added to the i-th components of the
*        numerator and denominator before dividing.
*
         DO 30 i = 1, n
            rwork( i ) = cabs1( b( i, j ) )
   30    CONTINUE
*
*        Compute abs(A)*abs(X) + abs(B).
*
*        Only one triangle of A is stored, so each stored off-diagonal
*        entry A(i,k) contributes twice: to row i (times |x(k)|) and,
*        through the accumulator S, to row k (times |x(i)|).  L maps
*        the matrix row index i to the band-storage row L+i of
*        column K.
*
         IF( upper ) THEN
            DO 50 k = 1, n
               s = zero
               xk = cabs1( x( k, j ) )
               l = kd + 1 - k
               DO 40 i = max( 1, k-kd ), k - 1
                  rwork( i ) = rwork( i ) + cabs1( ab( l+i, k ) )*xk
                  s = s + cabs1( ab( l+i, k ) )*cabs1( x( i, j ) )
   40          CONTINUE
*              Diagonal entry: only its real part is used.
               rwork( k ) = rwork( k ) + abs( real( ab( kd+1, k ) ) )*
     $                      xk + s
   50       CONTINUE
         ELSE
            DO 70 k = 1, n
               s = zero
               xk = cabs1( x( k, j ) )
*              Diagonal entry: only its real part is used.
               rwork( k ) = rwork( k ) + abs( real( ab( 1, k ) ) )*xk
               l = 1 - k
               DO 60 i = k + 1, min( n, k+kd )
                  rwork( i ) = rwork( i ) + cabs1( ab( l+i, k ) )*xk
                  s = s + cabs1( ab( l+i, k ) )*cabs1( x( i, j ) )
   60          CONTINUE
               rwork( k ) = rwork( k ) + s
   70       CONTINUE
         END IF
*
*        S is reused here as the running maximum of the quotient.
*
         s = zero
         DO 80 i = 1, n
            IF( rwork( i ).GT.safe2 ) THEN
               s = max( s, cabs1( work( i ) ) / rwork( i ) )
            ELSE
               s = max( s, ( cabs1( work( i ) )+safe1 ) /
     $             ( rwork( i )+safe1 ) )
            END IF
   80    CONTINUE
         berr( j ) = s
*
*        Test stopping criterion. Continue iterating if
*           1) The residual BERR(J) is larger than machine epsilon, and
*           2) BERR(J) decreased by at least a factor of 2 during the
*              last iteration, and
*           3) At most ITMAX iterations tried.
*
         IF( berr( j ).GT.eps .AND. two*berr( j ).LE.lstres .AND.
     $       count.LE.itmax ) THEN
*
*           Update solution and try again.
*
*           CPBTRS overwrites the residual in WORK(1:N) with the
*           correction, which CAXPY then adds to X(:,J).  INFO is
*           overwritten by CPBTRS and is not inspected here.
*
            CALL cpbtrs( uplo, n, kd, 1, afb, ldafb, work, n, info )
            CALL caxpy( n, one, work, 1, x( 1, j ), 1 )
            lstres = berr( j )
            count = count + 1
            GO TO 20
         END IF
*
*        Bound error from formula
*
*        norm(X - XTRUE) / norm(X) .le. FERR =
*        norm( abs(inv(A))*
*           ( abs(R) + NZ*EPS*( abs(A)*abs(X)+abs(B) ))) / norm(X)
*
*        where
*          norm(Z) is the magnitude of the largest component of Z
*          inv(A) is the inverse of A
*          abs(Z) is the componentwise absolute value of the matrix or
*             vector Z
*          NZ is the maximum number of nonzeros in any row of A, plus 1
*          EPS is machine epsilon
*
*        The i-th component of abs(R)+NZ*EPS*(abs(A)*abs(X)+abs(B))
*        is incremented by SAFE1 if the i-th component of
*        abs(A)*abs(X) + abs(B) is less than SAFE2.
*
*        Use CLACN2 to estimate the infinity-norm of the matrix
*           inv(A) * diag(W),
*        where W = abs(R) + NZ*EPS*( abs(A)*abs(X)+abs(B) )))
*
*        RWORK is overwritten in place with the weight vector W.
*
         DO 90 i = 1, n
            IF( rwork( i ).GT.safe2 ) THEN
               rwork( i ) = cabs1( work( i ) ) + nz*eps*rwork( i )
            ELSE
               rwork( i ) = cabs1( work( i ) ) + nz*eps*rwork( i ) +
     $                      safe1
            END IF
   90    CONTINUE
*
*        Reverse-communication loop: CLACN2 is called until it sets
*        KASE = 0.  KASE = 1 and KASE = 2 select which of the two
*        operators below is applied to WORK(1:N).  The same CPBTRS
*        solve serves both cases because A is Hermitian.
*
         kase = 0
  100    CONTINUE
         CALL clacn2( n, work( n+1 ), work, ferr( j ), kase, isave )
         IF( kase.NE.0 ) THEN
            IF( kase.EQ.1 ) THEN
*
*              Multiply by diag(W)*inv(A**H).
*
               CALL cpbtrs( uplo, n, kd, 1, afb, ldafb, work, n, info )
               DO 110 i = 1, n
                  work( i ) = rwork( i )*work( i )
  110          CONTINUE
            ELSE IF( kase.EQ.2 ) THEN
*
*              Multiply by inv(A)*diag(W).
*
               DO 120 i = 1, n
                  work( i ) = rwork( i )*work( i )
  120          CONTINUE
               CALL cpbtrs( uplo, n, kd, 1, afb, ldafb, work, n, info )
            END IF
            GO TO 100
         END IF
*
*        Normalize error.
*
*        LSTRES is reused as the largest CABS1 magnitude in X(:,J);
*        the division is skipped when X(:,J) is identically zero.
*
         lstres = zero
         DO 130 i = 1, n
            lstres = max( lstres, cabs1( x( i, j ) ) )
  130    CONTINUE
         IF( lstres.NE.zero )
     $      ferr( j ) = ferr( j ) / lstres
*
  140 CONTINUE
*
      RETURN
*
*     End of CPBRFS
*

◆ cpbstf()

subroutine cpbstf	(	character	uplo,
		integer	n,
		integer	kd,
		complex, dimension( ldab, * )	ab,
		integer	ldab,
		integer	info )

CPBSTF

Download CPBSTF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPBSTF computes a split Cholesky factorization of a complex
!> Hermitian positive definite band matrix A.
!>
!> This routine is designed to be used in conjunction with CHBGST.
!>
!> The factorization has the form  A = S**H*S  where S is a band matrix
!> of the same bandwidth as A and the following structure:
!>
!>   S = ( U    )
!>       ( M  L )
!>
!> where U is upper triangular of order m = (n+kd)/2, and L is lower
!> triangular of order n-m.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of superdiagonals of the matrix A if UPLO = 'U', !> or the number of subdiagonals if UPLO = 'L'. KD >= 0. !>
[in,out]	AB	!> AB is COMPLEX array, dimension (LDAB,N) !> On entry, the upper or lower triangle of the Hermitian band !> matrix A, stored in the first kd+1 rows of the array. The !> j-th column of A is stored in the j-th column of the array AB !> as follows: !> if UPLO = 'U', AB(kd+1+i-j,j) = A(i,j) for max(1,j-kd)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+kd). !> !> On exit, if INFO = 0, the factor S from the split Cholesky !> factorization A = S**H*S. See Further Details. !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, the factorization could not be completed, !> because the updated element a(i,i) was negative; the !> matrix A is not positive definite. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The band storage scheme is illustrated by the following example, when
!>  N = 7, KD = 2:
!>
!>  S = ( s11  s12  s13                     )
!>      (      s22  s23  s24                )
!>      (           s33  s34                )
!>      (                s44                )
!>      (           s53  s54  s55           )
!>      (                s64  s65  s66      )
!>      (                     s75  s76  s77 )
!>
!>  If UPLO = 'U', the array AB holds:
!>
!>  on entry:                          on exit:
!>
!>   *    *   a13  a24  a35  a46  a57   *    *   s13  s24  s53**H s64**H s75**H
!>   *   a12  a23  a34  a45  a56  a67   *   s12  s23  s34  s54**H s65**H s76**H
!>  a11  a22  a33  a44  a55  a66  a77  s11  s22  s33  s44  s55    s66    s77
!>
!>  If UPLO = 'L', the array AB holds:
!>
!>  on entry:                          on exit:
!>
!>  a11  a22  a33  a44  a55  a66  a77  s11    s22    s33    s44  s55  s66  s77
!>  a21  a32  a43  a54  a65  a76   *   s12**H s23**H s34**H s54  s65  s76   *
!>  a31  a42  a53  a64  a75   *    *   s13**H s24**H s53    s64  s75   *    *
!>
!>  Array elements marked * are not used by the routine; s12**H denotes
!>  conjg(s12); the diagonal elements of S are real.
!>

Definition at line 152 of file cpbstf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CPBSTF.  The band array AB is overwritten in place by the
*     split Cholesky factor: the trailing block A(m+1:n,m+1:n) is
*     factorized first, sweeping from column n down to column m+1, and
*     the leading block A(1:m,1:m) is factorized afterwards, sweeping
*     from column 1 up to column m.  On return INFO is 0 on success,
*     -k when argument k failed validation, or the index j of the
*     first diagonal entry whose real part was found to be <= 0.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, KD, LDAB, N
*     ..
*     .. Array Arguments ..
      COMPLEX            AB( LDAB, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      parameter( one = 1.0e+0, zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
*     J   - column being processed; copied to INFO on failure
*     KLD - increment between consecutive elements of one row of A
*           inside AB, also passed to CHER as the leading dimension
*     KM  - number of off-diagonal band elements handled at step J
*     M   - splitting point between the two factorization sweeps
*     AJJ - real part of the diagonal element, then its square root
      LOGICAL            UPPER
      INTEGER            J, KLD, KM, M
      REAL               AJJ
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cher, clacgv, csscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min, real, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.  Only the first failing test sets
*     INFO; argument 4 (AB) has no test, so -4 is never returned.
*
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( kd.LT.0 ) THEN
         info = -3
      ELSE IF( ldab.LT.kd+1 ) THEN
         info = -5
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPBSTF', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Moving one column to the right along a row of A moves LDAB-1
*     positions through AB.  The lower bound of 1 keeps the increment
*     non-zero when LDAB = 1 (presumably because the BLAS routines
*     reject a zero increment or leading dimension -- TODO confirm).
*
      kld = max( 1, ldab-1 )
*
*     Set the splitting point m.
*
      m = ( n+kd ) / 2
*
      IF( upper ) THEN
*
*        Factorize A(m+1:n,m+1:n) as L**H*L, and update A(1:m,1:m).
*
         DO 10 j = n, m + 1, -1
*
*           Compute s(j,j) and test for non-positive-definiteness.
*           On failure the real part is stored back (dropping any
*           imaginary part) before jumping to the error exit.
*
            ajj = real( ab( kd+1, j ) )
            IF( ajj.LE.zero ) THEN
               ab( kd+1, j ) = ajj
               GO TO 50
            END IF
            ajj = sqrt( ajj )
            ab( kd+1, j ) = ajj
            km = min( j-1, kd )
*
*           Compute elements j-km:j-1 of the j-th column and update
*           the leading submatrix within the band.  No KM > 0 guard
*           is used here; the calls are made even when KM = 0.
*
            CALL csscal( km, one / ajj, ab( kd+1-km, j ), 1 )
            CALL cher( 'Upper', km, -one, ab( kd+1-km, j ), 1,
     $                 ab( kd+1, j-km ), kld )
   10    CONTINUE
*
*        Factorize the updated submatrix A(1:m,1:m) as U**H*U.
*
         DO 20 j = 1, m
*
*           Compute s(j,j) and test for non-positive-definiteness.
*
            ajj = real( ab( kd+1, j ) )
            IF( ajj.LE.zero ) THEN
               ab( kd+1, j ) = ajj
               GO TO 50
            END IF
            ajj = sqrt( ajj )
            ab( kd+1, j ) = ajj
            km = min( kd, m-j )
*
*           Compute elements j+1:j+km of the j-th row and update the
*           trailing submatrix within the band.  The row is passed
*           through CLACGV before the rank-1 update and again after
*           it (presumably conjugating it for CHER and then restoring
*           the stored values -- CLACGV itself is not shown here).
*
            IF( km.GT.0 ) THEN
               CALL csscal( km, one / ajj, ab( kd, j+1 ), kld )
               CALL clacgv( km, ab( kd, j+1 ), kld )
               CALL cher( 'Upper', km, -one, ab( kd, j+1 ), kld,
     $                    ab( kd+1, j+1 ), kld )
               CALL clacgv( km, ab( kd, j+1 ), kld )
            END IF
   20    CONTINUE
      ELSE
*
*        Factorize A(m+1:n,m+1:n) as L**H*L, and update A(1:m,1:m).
*
         DO 30 j = n, m + 1, -1
*
*           Compute s(j,j) and test for non-positive-definiteness.
*
            ajj = real( ab( 1, j ) )
            IF( ajj.LE.zero ) THEN
               ab( 1, j ) = ajj
               GO TO 50
            END IF
            ajj = sqrt( ajj )
            ab( 1, j ) = ajj
            km = min( j-1, kd )
*
*           Compute elements j-km:j-1 of the j-th row and update the
*           leading submatrix within the band (the CHER call targets
*           the block whose first diagonal element is AB(1,j-km)).
*           As in the upper case, the row goes through CLACGV before
*           and after the update, and there is no KM > 0 guard.
*
            CALL csscal( km, one / ajj, ab( km+1, j-km ), kld )
            CALL clacgv( km, ab( km+1, j-km ), kld )
            CALL cher( 'Lower', km, -one, ab( km+1, j-km ), kld,
     $                 ab( 1, j-km ), kld )
            CALL clacgv( km, ab( km+1, j-km ), kld )
   30    CONTINUE
*
*        Factorize the updated submatrix A(1:m,1:m) as U**H*U.
*
         DO 40 j = 1, m
*
*           Compute s(j,j) and test for non-positive-definiteness.
*
            ajj = real( ab( 1, j ) )
            IF( ajj.LE.zero ) THEN
               ab( 1, j ) = ajj
               GO TO 50
            END IF
            ajj = sqrt( ajj )
            ab( 1, j ) = ajj
            km = min( kd, m-j )
*
*           Compute elements j+1:j+km of the j-th column and update the
*           trailing submatrix within the band.
*
            IF( km.GT.0 ) THEN
               CALL csscal( km, one / ajj, ab( 2, j ), 1 )
               CALL cher( 'Lower', km, -one, ab( 2, j ), 1,
     $                    ab( 1, j+1 ), kld )
            END IF
   40    CONTINUE
      END IF
      RETURN
*
*     Error exit shared by all four loops: J still holds the column
*     at which the non-positive diagonal element was met.
*
   50 CONTINUE
      info = j
      RETURN
*
*     End of CPBSTF
*

◆ cpbtf2()

subroutine cpbtf2	(	character	uplo,
		integer	n,
		integer	kd,
		complex, dimension( ldab, * )	ab,
		integer	ldab,
		integer	info )

CPBTF2 computes the Cholesky factorization of a symmetric/Hermitian positive definite band matrix (unblocked algorithm).

Download CPBTF2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPBTF2 computes the Cholesky factorization of a complex Hermitian
!> positive definite band matrix A.
!>
!> The factorization has the form
!>    A = U**H * U ,  if UPLO = 'U', or
!>    A = L  * L**H,  if UPLO = 'L',
!> where U is an upper triangular matrix, U**H is the conjugate transpose
!> of U, and L is lower triangular.
!>
!> This is the unblocked version of the algorithm, calling Level 2 BLAS.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the upper or lower triangular part of the !> Hermitian matrix A is stored: !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of super-diagonals of the matrix A if UPLO = 'U', !> or the number of sub-diagonals if UPLO = 'L'. KD >= 0. !>
[in,out]	AB	!> AB is COMPLEX array, dimension (LDAB,N) !> On entry, the upper or lower triangle of the Hermitian band !> matrix A, stored in the first KD+1 rows of the array. The !> j-th column of A is stored in the j-th column of the array AB !> as follows: !> if UPLO = 'U', AB(kd+1+i-j,j) = A(i,j) for max(1,j-kd)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+kd). !> !> On exit, if INFO = 0, the triangular factor U or L from the !> Cholesky factorization A = U**H*U or A = L*L**H of the band !> matrix A, in the same storage format as A. !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -k, the k-th argument had an illegal value !> > 0: if INFO = k, the leading minor of order k is not !> positive definite, and the factorization could not be !> completed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The band storage scheme is illustrated by the following example, when
!>  N = 6, KD = 2, and UPLO = 'U':
!>
!>  On entry:                       On exit:
!>
!>      *    *   a13  a24  a35  a46      *    *   u13  u24  u35  u46
!>      *   a12  a23  a34  a45  a56      *   u12  u23  u34  u45  u56
!>     a11  a22  a33  a44  a55  a66     u11  u22  u33  u44  u55  u66
!>
!>  Similarly, if UPLO = 'L' the format of A is as follows:
!>
!>  On entry:                       On exit:
!>
!>     a11  a22  a33  a44  a55  a66     l11  l22  l33  l44  l55  l66
!>     a21  a32  a43  a54  a65   *      l21  l32  l43  l54  l65   *
!>     a31  a42  a53  a64   *    *      l31  l42  l53  l64   *    *
!>
!>  Array elements marked * are not used by the routine.
!>

Definition at line 141 of file cpbtf2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CPBTF2: unblocked Cholesky factorization of a Hermitian
*     positive definite band matrix, carried out in place on the band
*     array AB one column at a time.  INFO is 0 on success, -k when
*     argument k failed validation, or the index of the first column
*     whose diagonal element had a real part <= 0.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, KD, LDAB, N
*     ..
*     .. Array Arguments ..
      COMPLEX            AB( LDAB, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      parameter( one = 1.0e+0, zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
*     COL    - column currently being eliminated
*     DROW   - row of AB that stores the diagonal of A
*     NOFF   - number of off-diagonal band elements in this step
*     ROWINC - increment between consecutive elements of a row of A
*     PIVOT  - real part of the diagonal element, then its square root
      LOGICAL            UPPER
      INTEGER            COL, DROW, NOFF, ROWINC
      REAL               PIVOT
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cher, clacgv, csscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min, real, sqrt
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  The tests run from the last argument to
*     the first, each overwriting INFO, so that when several arguments
*     are invalid INFO names the lowest-numbered one.
*
      upper = lsame( uplo, 'U' )
      info = 0
      IF( ldab.LT.kd+1 ) info = -5
      IF( kd.LT.0 ) info = -3
      IF( n.LT.0 ) info = -2
      IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) ) info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPBTF2', -info )
         RETURN
      END IF
*
*     An empty matrix needs no work.
*
      IF( n.EQ.0 ) RETURN
*
*     Stepping one column to the right along a row of A moves LDAB-1
*     positions through AB; the increment is kept at least 1.
*
      rowinc = max( 1, ldab-1 )
*
*     The diagonal sits in row KD+1 of AB for upper storage and in
*     row 1 for lower storage.
*
      IF( upper ) THEN
         drow = kd + 1
      ELSE
         drow = 1
      END IF
*
*     Eliminate one column per pass:  A = U**H * U  when UPPER,
*     A = L * L**H  otherwise.
*
      DO col = 1, n
*
*        Form the diagonal entry of the factor.  A non-positive real
*        part means A is not positive definite: store the real part
*        back, report the column in INFO and stop.
*
         pivot = real( ab( drow, col ) )
         IF( pivot.LE.zero ) THEN
            ab( drow, col ) = pivot
            info = col
            RETURN
         END IF
         pivot = sqrt( pivot )
         ab( drow, col ) = pivot
*
*        Scale the NOFF off-diagonal band elements of this step and
*        apply the rank-1 update to the trailing submatrix within the
*        band.
*
         noff = min( kd, n-col )
         IF( noff.GT.0 ) THEN
            IF( upper ) THEN
*
*              Row COL of U, elements COL+1:COL+NOFF.  The row is
*              passed through CLACGV before and after the update.
*
               CALL csscal( noff, one / pivot, ab( kd, col+1 ),
     $                      rowinc )
               CALL clacgv( noff, ab( kd, col+1 ), rowinc )
               CALL cher( 'Upper', noff, -one, ab( kd, col+1 ),
     $                    rowinc, ab( kd+1, col+1 ), rowinc )
               CALL clacgv( noff, ab( kd, col+1 ), rowinc )
            ELSE
*
*              Column COL of L, elements COL+1:COL+NOFF.
*
               CALL csscal( noff, one / pivot, ab( 2, col ), 1 )
               CALL cher( 'Lower', noff, -one, ab( 2, col ), 1,
     $                    ab( 1, col+1 ), rowinc )
            END IF
         END IF
      END DO
      RETURN
*
*     End of CPBTF2
*

◆ cpbtrf()

subroutine cpbtrf	(	character	uplo,
		integer	n,
		integer	kd,
		complex, dimension( ldab, * )	ab,
		integer	ldab,
		integer	info )

CPBTRF

Download CPBTRF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPBTRF computes the Cholesky factorization of a complex Hermitian
!> positive definite band matrix A.
!>
!> The factorization has the form
!>    A = U**H * U,  if UPLO = 'U', or
!>    A = L  * L**H,  if UPLO = 'L',
!> where U is an upper triangular matrix and L is lower triangular.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of superdiagonals of the matrix A if UPLO = 'U', !> or the number of subdiagonals if UPLO = 'L'. KD >= 0. !>
[in,out]	AB	!> AB is COMPLEX array, dimension (LDAB,N) !> On entry, the upper or lower triangle of the Hermitian band !> matrix A, stored in the first KD+1 rows of the array. The !> j-th column of A is stored in the j-th column of the array AB !> as follows: !> if UPLO = 'U', AB(kd+1+i-j,j) = A(i,j) for max(1,j-kd)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+kd). !> !> On exit, if INFO = 0, the triangular factor U or L from the !> Cholesky factorization A = U**H*U or A = L*L**H of the band !> matrix A, in the same storage format as A. !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, the leading minor of order i is not !> positive definite, and the factorization could not be !> completed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The band storage scheme is illustrated by the following example, when
!>  N = 6, KD = 2, and UPLO = 'U':
!>
!>  On entry:                       On exit:
!>
!>      *    *   a13  a24  a35  a46      *    *   u13  u24  u35  u46
!>      *   a12  a23  a34  a45  a56      *   u12  u23  u34  u45  u56
!>     a11  a22  a33  a44  a55  a66     u11  u22  u33  u44  u55  u66
!>
!>  Similarly, if UPLO = 'L' the format of A is as follows:
!>
!>  On entry:                       On exit:
!>
!>     a11  a22  a33  a44  a55  a66     l11  l22  l33  l44  l55  l66
!>     a21  a32  a43  a54  a65   *      l21  l32  l43  l54  l65   *
!>     a31  a42  a53  a64   *    *      l31  l42  l53  l64   *    *
!>
!>  Array elements marked * are not used by the routine.
!>

Contributors: Peter Mayes and Giuseppe Radicati, IBM ECSEC, Rome, March 23, 1989

Definition at line 141 of file cpbtrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CPBTRF: Cholesky factorization of a Hermitian band
*     matrix held in AB.  After argument checking the routine either
*     hands the whole problem to the unblocked routine CPBTF2 or runs
*     a blocked sweep over diagonal blocks of order at most NB, using
*     CPOTF2 on each diagonal block and CTRSM / CHERK / CGEMM for the
*     updates.  INFO is 0 on success, -k when argument k failed
*     validation, or a positive index when a factorization step
*     reported failure.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, KD, LDAB, N
*     ..
*     .. Array Arguments ..
      COMPLEX            AB( LDAB, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     NBMAX caps the block size; LDWORK is the leading dimension of
*     the fixed-size local work array declared below.
      REAL               ONE, ZERO
      parameter( one = 1.0e+0, zero = 0.0e+0 )
      COMPLEX            CONE
      parameter( cone = ( 1.0e+0, 0.0e+0 ) )
      INTEGER            NBMAX, LDWORK
      parameter( nbmax = 32, ldwork = nbmax+1 )
*     ..
*     .. Local Scalars ..
*     I      - first row/column of the current diagonal block
*     IB     - order of the current diagonal block
*     I2, I3 - sizes of the second and third block rows/columns
*     II     - used both as the status returned by CPOTF2 and as a
*              loop index in the copy loops
*     J, JJ  - loop indices
*     NB     - block size in use
      INTEGER            I, I2, I3, IB, II, J, JJ, NB
*     ..
*     .. Local Arrays ..
*     Scratch copy of the corner block (A13 or A31) that is only
*     partly inside the band.
      COMPLEX            WORK( LDWORK, NBMAX )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      EXTERNAL           lsame, ilaenv
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgemm, cherk, cpbtf2, cpotf2, ctrsm, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          min
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.  Only the first failing test sets
*     INFO; argument 4 (AB) has no test, so -4 is never returned.
*
      info = 0
      IF( ( .NOT.lsame( uplo, 'U' ) ) .AND.
     $    ( .NOT.lsame( uplo, 'L' ) ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( kd.LT.0 ) THEN
         info = -3
      ELSE IF( ldab.LT.kd+1 ) THEN
         info = -5
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPBTRF', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Determine the block size for this environment
*
      nb = ilaenv( 1, 'CPBTRF', uplo, n, kd, -1, -1 )
*
*     The block size must not exceed the semi-bandwidth KD, and must not
*     exceed the limit set by the size of the local array WORK.
*     The WORK limit is applied here; the KD limit is enforced by the
*     test below, which falls back to unblocked code when NB > KD.
*
      nb = min( nb, nbmax )
*
      IF( nb.LE.1 .OR. nb.GT.kd ) THEN
*
*        Use unblocked code
*
         CALL cpbtf2( uplo, n, kd, ab, ldab, info )
      ELSE
*
*        Use blocked code
*
         IF( lsame( uplo, 'U' ) ) THEN
*
*           Compute the Cholesky factorization of a Hermitian band
*           matrix, given the upper triangle of the matrix in band
*           storage.
*
*           Zero the strictly upper triangle of the leading NB-by-NB
*           part of the work array.  Only the lower triangle is
*           loaded from A13 below, while the full block is handed to
*           CTRSM, CGEMM and CHERK.
*
            DO 20 j = 1, nb
               DO 10 i = 1, j - 1
                  work( i, j ) = zero
   10          CONTINUE
   20       CONTINUE
*
*           Process the band matrix one diagonal block at a time.
*
            DO 70 i = 1, n, nb
               ib = min( nb, n-i+1 )
*
*              Factorize the diagonal block.  Passing AB(KD+1,I) with
*              leading dimension LDAB-1 makes the band-stored block
*              addressable as an ordinary IB-by-IB matrix.
*
               CALL cpotf2( uplo, ib, ab( kd+1, i ), ldab-1, ii )
*
*              A non-zero status is relative to the block; shift it
*              by I-1 to number it within the full matrix.
*
               IF( ii.NE.0 ) THEN
                  info = i + ii - 1
                  GO TO 150
               END IF
               IF( i+ib.LE.n ) THEN
*
*                 Update the relevant part of the trailing submatrix.
*                 If A11 denotes the diagonal block which has just been
*                 factorized, then we need to update the remaining
*                 blocks in the diagram:
*
*                    A11   A12   A13
*                          A22   A23
*                                A33
*
*                 The numbers of rows and columns in the partitioning
*                 are IB, I2, I3 respectively. The blocks A12, A22 and
*                 A23 are empty if IB = KD. The upper triangle of A13
*                 lies outside the band.
*
*                 Both sizes are also limited by the matrix order N
*                 and can be zero or negative near the end of the
*                 matrix, hence the guards on I2 and I3 below.
*
                  i2 = min( kd-ib, n-i-ib+1 )
                  i3 = min( ib, n-i-kd+1 )
*
                  IF( i2.GT.0 ) THEN
*
*                    Update A12
*
                     CALL ctrsm( 'Left', 'Upper', 'Conjugate transpose',
     $                           'Non-unit', ib, i2, cone,
     $                           ab( kd+1, i ), ldab-1,
     $                           ab( kd+1-ib, i+ib ), ldab-1 )
*
*                    Update A22
*
                     CALL cherk( 'Upper', 'Conjugate transpose', i2, ib,
     $                           -one, ab( kd+1-ib, i+ib ), ldab-1, one,
     $                           ab( kd+1, i+ib ), ldab-1 )
                  END IF
*
                  IF( i3.GT.0 ) THEN
*
*                    Copy the lower triangle of A13 into the work array.
*                    (II is reused as a loop index from here on; its
*                    CPOTF2 status has already been tested.)
*
                     DO 40 jj = 1, i3
                        DO 30 ii = jj, ib
                           work( ii, jj ) = ab( ii-jj+1, jj+i+kd-1 )
   30                   CONTINUE
   40                CONTINUE
*
*                    Update A13 (in the work array).
*
                     CALL ctrsm( 'Left', 'Upper', 'Conjugate transpose',
     $                           'Non-unit', ib, i3, cone,
     $                           ab( kd+1, i ), ldab-1, work, ldwork )
*
*                    Update A23
*
                     IF( i2.GT.0 )
     $                  CALL cgemm( 'Conjugate transpose',
     $                              'No transpose', i2, i3, ib, -cone,
     $                              ab( kd+1-ib, i+ib ), ldab-1, work,
     $                              ldwork, cone, ab( 1+ib, i+kd ),
     $                              ldab-1 )
*
*                    Update A33
*
                     CALL cherk( 'Upper', 'Conjugate transpose', i3, ib,
     $                           -one, work, ldwork, one,
     $                           ab( kd+1, i+kd ), ldab-1 )
*
*                    Copy the lower triangle of A13 back into place.
*
                     DO 60 jj = 1, i3
                        DO 50 ii = jj, ib
                           ab( ii-jj+1, jj+i+kd-1 ) = work( ii, jj )
   50                   CONTINUE
   60                CONTINUE
                  END IF
               END IF
   70       CONTINUE
         ELSE
*
*           Compute the Cholesky factorization of a Hermitian band
*           matrix, given the lower triangle of the matrix in band
*           storage.
*
*           Zero the strictly lower triangle of the leading NB-by-NB
*           part of the work array.  Only the upper triangle is
*           loaded from A31 below, while the full block is handed to
*           CTRSM, CGEMM and CHERK.
*
            DO 90 j = 1, nb
               DO 80 i = j + 1, nb
                  work( i, j ) = zero
   80          CONTINUE
   90       CONTINUE
*
*           Process the band matrix one diagonal block at a time.
*
            DO 140 i = 1, n, nb
               ib = min( nb, n-i+1 )
*
*              Factorize the diagonal block.  Passing AB(1,I) with
*              leading dimension LDAB-1 makes the band-stored block
*              addressable as an ordinary IB-by-IB matrix.
*
               CALL cpotf2( uplo, ib, ab( 1, i ), ldab-1, ii )
*
*              A non-zero status is relative to the block; shift it
*              by I-1 to number it within the full matrix.
*
               IF( ii.NE.0 ) THEN
                  info = i + ii - 1
                  GO TO 150
               END IF
               IF( i+ib.LE.n ) THEN
*
*                 Update the relevant part of the trailing submatrix.
*                 If A11 denotes the diagonal block which has just been
*                 factorized, then we need to update the remaining
*                 blocks in the diagram:
*
*                    A11
*                    A21   A22
*                    A31   A32   A33
*
*                 The numbers of rows and columns in the partitioning
*                 are IB, I2, I3 respectively. The blocks A21, A22 and
*                 A32 are empty if IB = KD. The lower triangle of A31
*                 lies outside the band.
*
*                 Both sizes are also limited by the matrix order N
*                 and can be zero or negative near the end of the
*                 matrix, hence the guards on I2 and I3 below.
*
                  i2 = min( kd-ib, n-i-ib+1 )
                  i3 = min( ib, n-i-kd+1 )
*
                  IF( i2.GT.0 ) THEN
*
*                    Update A21
*
                     CALL ctrsm( 'Right', 'Lower',
     $                           'Conjugate transpose', 'Non-unit', i2,
     $                           ib, cone, ab( 1, i ), ldab-1,
     $                           ab( 1+ib, i ), ldab-1 )
*
*                    Update A22
*
                     CALL cherk( 'Lower', 'No transpose', i2, ib, -one,
     $                           ab( 1+ib, i ), ldab-1, one,
     $                           ab( 1, i+ib ), ldab-1 )
                  END IF
*
                  IF( i3.GT.0 ) THEN
*
*                    Copy the upper triangle of A31 into the work array.
*                    (II is reused as a loop index from here on; its
*                    CPOTF2 status has already been tested.)
*
                     DO 110 jj = 1, ib
                        DO 100 ii = 1, min( jj, i3 )
                           work( ii, jj ) = ab( kd+1-jj+ii, jj+i-1 )
  100                   CONTINUE
  110                CONTINUE
*
*                    Update A31 (in the work array).
*
                     CALL ctrsm( 'Right', 'Lower',
     $                           'Conjugate transpose', 'Non-unit', i3,
     $                           ib, cone, ab( 1, i ), ldab-1, work,
     $                           ldwork )
*
*                    Update A32
*
                     IF( i2.GT.0 )
     $                  CALL cgemm( 'No transpose',
     $                              'Conjugate transpose', i3, i2, ib,
     $                              -cone, work, ldwork, ab( 1+ib, i ),
     $                              ldab-1, cone, ab( 1+kd-ib, i+ib ),
     $                              ldab-1 )
*
*                    Update A33
*
                     CALL cherk( 'Lower', 'No transpose', i3, ib, -one,
     $                           work, ldwork, one, ab( 1, i+kd ),
     $                           ldab-1 )
*
*                    Copy the upper triangle of A31 back into place.
*
                     DO 130 jj = 1, ib
                        DO 120 ii = 1, min( jj, i3 )
                           ab( kd+1-jj+ii, jj+i-1 ) = work( ii, jj )
  120                   CONTINUE
  130                CONTINUE
                  END IF
               END IF
  140       CONTINUE
         END IF
      END IF
      RETURN
*
*     Early exit from the blocked sweeps; INFO has already been set
*     from the CPOTF2 status.
*
  150 CONTINUE
      RETURN
*
*     End of CPBTRF
*

◆ cpbtrs()

subroutine cpbtrs	(	character	uplo,
		integer	n,
		integer	kd,
		integer	nrhs,
		complex, dimension( ldab, * )	ab,
		integer	ldab,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		integer	info )

CPBTRS

Download CPBTRS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPBTRS solves a system of linear equations A*X = B with a Hermitian
!> positive definite band matrix A using the Cholesky factorization
!> A = U**H*U or A = L*L**H computed by CPBTRF.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangular factor stored in AB; !> = 'L': Lower triangular factor stored in AB. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of superdiagonals of the matrix A if UPLO = 'U', !> or the number of subdiagonals if UPLO = 'L'. KD >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrix B. NRHS >= 0. !>
[in]	AB	!> AB is COMPLEX array, dimension (LDAB,N) !> The triangular factor U or L from the Cholesky factorization !> A = U**H*U or A = L*L**H of the band matrix A, stored in the !> first KD+1 rows of the array. The j-th column of U or L is !> stored in the j-th column of the array AB as follows: !> if UPLO ='U', AB(kd+1+i-j,j) = U(i,j) for max(1,j-kd)<=i<=j; !> if UPLO ='L', AB(1+i-j,j) = L(i,j) for j<=i<=min(n,j+kd). !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> On entry, the right hand side matrix B. !> On exit, the solution matrix X. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 120 of file cpbtrs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CPBTRS: overwrites each column of B with the solution of
*     A*X = B by performing two triangular band solves with the factor
*     stored in AB.  INFO is 0 on success or -k when argument k failed
*     validation.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, KD, LDAB, LDB, N, NRHS
*     ..
*     .. Array Arguments ..
      COMPLEX            AB( LDAB, * ), B( LDB, * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
*     JRHS - index of the right hand side column being solved
      LOGICAL            UPPER
      INTEGER            JRHS
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           ctbsv, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  The tests run from the last argument to
*     the first, each overwriting INFO, so that when several arguments
*     are invalid INFO names the lowest-numbered one.
*
      upper = lsame( uplo, 'U' )
      info = 0
      IF( ldb.LT.max( 1, n ) ) info = -8
      IF( ldab.LT.kd+1 ) info = -6
      IF( nrhs.LT.0 ) info = -4
      IF( kd.LT.0 ) info = -3
      IF( n.LT.0 ) info = -2
      IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) ) info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPBTRS', -info )
         RETURN
      END IF
*
*     Nothing to solve for an empty system or no right hand sides.
*
      IF( n.EQ.0 .OR. nrhs.EQ.0 ) RETURN
*
*     Handle the right hand sides one column at a time; each column
*     of B is overwritten by the corresponding column of X.
*
      DO jrhs = 1, nrhs
         IF( upper ) THEN
*
*           A = U**H *U:  solve U**H *Y = B, then U*X = Y.
*
            CALL ctbsv( 'Upper', 'Conjugate transpose', 'Non-unit',
     $                  n, kd, ab, ldab, b( 1, jrhs ), 1 )
            CALL ctbsv( 'Upper', 'No transpose', 'Non-unit',
     $                  n, kd, ab, ldab, b( 1, jrhs ), 1 )
         ELSE
*
*           A = L*L**H:  solve L*Y = B, then L**H *X = Y.
*
            CALL ctbsv( 'Lower', 'No transpose', 'Non-unit',
     $                  n, kd, ab, ldab, b( 1, jrhs ), 1 )
            CALL ctbsv( 'Lower', 'Conjugate transpose', 'Non-unit',
     $                  n, kd, ab, ldab, b( 1, jrhs ), 1 )
         END IF
      END DO
*
      RETURN
*
*     End of CPBTRS
*

◆ cpftrf()

subroutine cpftrf	(	character	transr,
		character	uplo,
		integer	n,
		complex, dimension( 0: * )	a,
		integer	info )

CPFTRF

Download CPFTRF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPFTRF computes the Cholesky factorization of a complex Hermitian
!> positive definite matrix A.
!>
!> The factorization has the form
!>    A = U**H * U,  if UPLO = 'U', or
!>    A = L  * L**H,  if UPLO = 'L',
!> where U is an upper triangular matrix and L is lower triangular.
!>
!> This is the block version of the algorithm, calling Level 3 BLAS.
!>

Parameters

[in]	TRANSR	!> TRANSR is CHARACTER*1 !> = 'N': The Normal TRANSR of RFP A is stored; !> = 'C': The Conjugate-transpose TRANSR of RFP A is stored. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of RFP A is stored; !> = 'L': Lower triangle of RFP A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension ( N(N+1)/2 ); !> On entry, the Hermitian matrix A in RFP format. RFP format is !> described by TRANSR, UPLO, and N as follows: If TRANSR = 'N' !> then RFP A is (0:N,0:k-1) when N is even; k=N/2. RFP A is !> (0:N-1,0:k) when N is odd; k=N/2. IF TRANSR = 'C' then RFP is !> the Conjugate-transpose of RFP A as defined when !> TRANSR = 'N'. The contents of RFP A are defined by UPLO as !> follows: If UPLO = 'U' the RFP A contains the nt elements of !> upper packed A. If UPLO = 'L' the RFP A contains the elements !> of lower packed A. The LDA of RFP A is (N+1)/2 when TRANSR = !> 'C'. When TRANSR is 'N' the LDA is N+1 when N is even and N !> when N is odd. See the Note below for more details. !> !> On exit, if INFO = 0, the factor U or L from the Cholesky !> factorization RFP A = U**H*U or RFP A = L*L**H. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, the leading minor of order i is not !> positive definite, and the factorization could not be !> completed. !>

Further Notes on RFP Format:

!>
!>  We first consider Standard Packed Format when N is even.
!>  We give an example where N = 6.
!>
!>      AP is Upper             AP is Lower
!>
!>   00 01 02 03 04 05       00
!>      11 12 13 14 15       10 11
!>         22 23 24 25       20 21 22
!>            33 34 35       30 31 32 33
!>               44 45       40 41 42 43 44
!>                  55       50 51 52 53 54 55
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:5,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(4:6,0:2) consists of
!>  conjugate-transpose of the first three columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(1:6,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:2,0:2) consists of
!>  conjugate-transpose of the last three columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N even and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                -- -- --
!>        03 04 05                33 43 53
!>                                   -- --
!>        13 14 15                00 44 54
!>                                      --
!>        23 24 25                10 11 55
!>
!>        33 34 35                20 21 22
!>        --
!>        00 44 45                30 31 32
!>        -- --
!>        01 11 55                40 41 42
!>        -- -- --
!>        02 12 22                50 51 52
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- -- --                -- -- -- -- -- --
!>     03 13 23 33 00 01 02    33 00 10 20 30 40 50
!>     -- -- -- -- --                -- -- -- -- --
!>     04 14 24 34 44 11 12    43 44 11 21 31 41 51
!>     -- -- -- -- -- --                -- -- -- --
!>     05 15 25 35 45 55 22    53 54 55 22 32 42 52
!>
!>
!>  We next consider Standard Packed Format when N is odd.
!>  We give an example where N = 5.
!>
!>     AP is Upper                 AP is Lower
!>
!>   00 01 02 03 04              00
!>      11 12 13 14              10 11
!>         22 23 24              20 21 22
!>            33 34              30 31 32 33
!>               44              40 41 42 43 44
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:4,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(3:4,0:1) consists of
!>  conjugate-transpose of the first two columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(0:4,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:1,1:2) consists of
!>  conjugate-transpose of the last two columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N odd and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                   -- --
!>        02 03 04                00 33 43
!>                                      --
!>        12 13 14                10 11 44
!>
!>        22 23 24                20 21 22
!>        --
!>        00 33 34                30 31 32
!>        -- --
!>        01 11 44                40 41 42
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- --                   -- -- -- -- --
!>     02 12 22 00 01             00 10 20 30 40
!>     -- -- -- --                   -- -- -- --
!>     03 13 23 33 11             33 11 21 31 41
!>     -- -- -- -- --                   -- -- --
!>     04 14 24 34 44             43 44 22 32 42
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 210 of file cpftrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  CPFTRF body: in-place Cholesky factorization of a Hermitian matrix
*  held in Rectangular Full Packed (RFP) storage in the linear array A.
*
*  Arguments as used below:
*     TRANSR  'N' or 'C', selects the RFP layout (else INFO = -1).
*     UPLO    'L' or 'U', selects the stored triangle (else INFO = -2).
*     N       order of the matrix; N < 0 gives INFO = -3 and N = 0
*             returns immediately.
*     A       zero-based linear array with the RFP data; updated in
*             place by the CPOTRF / CTRSM / CHERK calls.
*     INFO    0 on success; -i when the i-th argument is illegal
*             (XERBLA is called); > 0 when a CPOTRF call fails.
*
*  Each of the eight cases applies the same four steps to the three
*  sub-blocks T1, T2 (triangular) and S (rectangular) located in A:
*     1. CPOTRF factorizes T1; a positive INFO is returned unchanged.
*     2. CTRSM overwrites S by a triangular solve with the T1 factor.
*     3. CHERK updates T2 using alpha = -ONE and beta = ONE.
*     4. CPOTRF factorizes the updated T2; a positive INFO is shifted
*        by the order of T1 (N1 when N is odd, K when N is even).
*
*     .. Scalar Arguments ..
      CHARACTER          TRANSR, UPLO
      INTEGER            N, INFO
*     ..
*     .. Array Arguments ..
      COMPLEX            A( 0: * )
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE
      COMPLEX            CONE
      parameter( one = 1.0e+0, cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
*     LOWER and NORMALTRANSR cache the LSAME tests on UPLO and TRANSR;
*     N1 and N2 are the orders of the two triangular blocks; K = N/2
*     is set (and used) only when N is even.
      LOGICAL            LOWER, NISODD, NORMALTRANSR
      INTEGER            N1, N2, K
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla, cherk, cpotrf, ctrsm
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          mod
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      normaltransr = lsame( transr, 'N' )
      lower = lsame( uplo, 'L' )
      IF( .NOT.normaltransr .AND. .NOT.lsame( transr, 'C' ) ) THEN
         info = -1
      ELSE IF( .NOT.lower .AND. .NOT.lsame( uplo, 'U' ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPFTRF', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     If N is odd, set NISODD = .TRUE.
*     If N is even, set K = N/2 and NISODD = .FALSE.
*
      IF( mod( n, 2 ).EQ.0 ) THEN
         k = n / 2
         nisodd = .false.
      ELSE
         nisodd = .true.
      END IF
*
*     Set N1 and N2 depending on LOWER.
*     N1 + N2 = N always; when N is odd the larger half goes to N1
*     for LOWER and to N2 for UPPER.
*
      IF( lower ) THEN
         n2 = n / 2
         n1 = n - n2
      ELSE
         n1 = n / 2
         n2 = n - n1
      END IF
*
*     start execution: there are eight cases
*     (N odd/even) x (TRANSR = 'N'/'C') x (UPLO = 'L'/'U')
*
      IF( nisodd ) THEN
*
*        N is odd
*
         IF( normaltransr ) THEN
*
*           N is odd and TRANSR = 'N'
*
            IF( lower ) THEN
*
*             SRPA for LOWER, NORMAL and N is odd ( a(0:n-1,0:n1-1) )
*             T1 -> a(0,0), T2 -> a(0,1), S -> a(n1,0)
*             T1 -> a(0), T2 -> a(n), S -> a(n1)
*
               CALL cpotrf( 'L', n1, a( 0 ), n, info )
               IF( info.GT.0 )
     $            RETURN
               CALL ctrsm( 'R', 'L', 'C', 'N', n2, n1, cone, a( 0 ), n,
     $                     a( n1 ), n )
               CALL cherk( 'U', 'N', n2, n1, -one, a( n1 ), n, one,
     $                     a( n ), n )
               CALL cpotrf( 'U', n2, a( n ), n, info )
*              Shift a failure index of T2 past the N1 rows of T1.
               IF( info.GT.0 )
     $            info = info + n1
*
            ELSE
*
*             SRPA for UPPER, NORMAL and N is odd ( a(0:n-1,0:n2-1)
*             T1 -> a(n1+1,0), T2 -> a(n1,0), S -> a(0,0)
*             T1 -> a(n2), T2 -> a(n1), S -> a(0)
*
               CALL cpotrf( 'L', n1, a( n2 ), n, info )
               IF( info.GT.0 )
     $            RETURN
               CALL ctrsm( 'L', 'L', 'N', 'N', n1, n2, cone, a( n2 ), n,
     $                     a( 0 ), n )
               CALL cherk( 'U', 'C', n2, n1, -one, a( 0 ), n, one,
     $                     a( n1 ), n )
               CALL cpotrf( 'U', n2, a( n1 ), n, info )
               IF( info.GT.0 )
     $            info = info + n1
*
            END IF
*
         ELSE
*
*           N is odd and TRANSR = 'C'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, TRANSPOSE and N is odd
*              T1 -> A(0,0) , T2 -> A(1,0) , S -> A(0,n1)
*              T1 -> a(0+0) , T2 -> a(1+0) , S -> a(0+n1*n1); lda=n1
*
               CALL cpotrf( 'U', n1, a( 0 ), n1, info )
               IF( info.GT.0 )
     $            RETURN
               CALL ctrsm( 'L', 'U', 'C', 'N', n1, n2, cone, a( 0 ), n1,
     $                     a( n1*n1 ), n1 )
               CALL cherk( 'L', 'C', n2, n1, -one, a( n1*n1 ), n1, one,
     $                     a( 1 ), n1 )
               CALL cpotrf( 'L', n2, a( 1 ), n1, info )
               IF( info.GT.0 )
     $            info = info + n1
*
            ELSE
*
*              SRPA for UPPER, TRANSPOSE and N is odd
*              T1 -> A(0,n1+1), T2 -> A(0,n1), S -> A(0,0)
*              T1 -> a(n2*n2), T2 -> a(n1*n2), S -> a(0); lda = n2
*
               CALL cpotrf( 'U', n1, a( n2*n2 ), n2, info )
               IF( info.GT.0 )
     $            RETURN
               CALL ctrsm( 'R', 'U', 'N', 'N', n2, n1, cone, a( n2*n2 ),
     $                     n2, a( 0 ), n2 )
               CALL cherk( 'L', 'N', n2, n1, -one, a( 0 ), n2, one,
     $                     a( n1*n2 ), n2 )
               CALL cpotrf( 'L', n2, a( n1*n2 ), n2, info )
               IF( info.GT.0 )
     $            info = info + n1
*
            END IF
*
         END IF
*
      ELSE
*
*        N is even
*
         IF( normaltransr ) THEN
*
*           N is even and TRANSR = 'N'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, NORMAL, and N is even ( a(0:n,0:k-1) )
*              T1 -> a(1,0), T2 -> a(0,0), S -> a(k+1,0)
*              T1 -> a(1), T2 -> a(0), S -> a(k+1)
*
               CALL cpotrf( 'L', k, a( 1 ), n+1, info )
               IF( info.GT.0 )
     $            RETURN
               CALL ctrsm( 'R', 'L', 'C', 'N', k, k, cone, a( 1 ), n+1,
     $                     a( k+1 ), n+1 )
               CALL cherk( 'U', 'N', k, k, -one, a( k+1 ), n+1, one,
     $                     a( 0 ), n+1 )
               CALL cpotrf( 'U', k, a( 0 ), n+1, info )
*              Shift a failure index of T2 past the K rows of T1.
               IF( info.GT.0 )
     $            info = info + k
*
            ELSE
*
*              SRPA for UPPER, NORMAL, and N is even ( a(0:n,0:k-1) )
*              T1 -> a(k+1,0) ,  T2 -> a(k,0),   S -> a(0,0)
*              T1 -> a(k+1), T2 -> a(k), S -> a(0)
*
               CALL cpotrf( 'L', k, a( k+1 ), n+1, info )
               IF( info.GT.0 )
     $            RETURN
               CALL ctrsm( 'L', 'L', 'N', 'N', k, k, cone, a( k+1 ),
     $                     n+1, a( 0 ), n+1 )
               CALL cherk( 'U', 'C', k, k, -one, a( 0 ), n+1, one,
     $                     a( k ), n+1 )
               CALL cpotrf( 'U', k, a( k ), n+1, info )
               IF( info.GT.0 )
     $            info = info + k
*
            END IF
*
         ELSE
*
*           N is even and TRANSR = 'C'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, TRANSPOSE and N is even (see paper)
*              T1 -> B(0,1), T2 -> B(0,0), S -> B(0,k+1)
*              T1 -> a(0+k), T2 -> a(0+0), S -> a(0+k*(k+1)); lda=k
*
               CALL cpotrf( 'U', k, a( 0+k ), k, info )
               IF( info.GT.0 )
     $            RETURN
*              T1 is passed with leading dimension K, matching the
*              CPOTRF call above and the lda=k layout of this case
*              (N1 equals K here, since N is even and UPLO = 'L').
               CALL ctrsm( 'L', 'U', 'C', 'N', k, k, cone, a( k ), k,
     $                     a( k*( k+1 ) ), k )
               CALL cherk( 'L', 'C', k, k, -one, a( k*( k+1 ) ), k, one,
     $                     a( 0 ), k )
               CALL cpotrf( 'L', k, a( 0 ), k, info )
               IF( info.GT.0 )
     $            info = info + k
*
            ELSE
*
*              SRPA for UPPER, TRANSPOSE and N is even (see paper)
*              T1 -> B(0,k+1),     T2 -> B(0,k),   S -> B(0,0)
*              T1 -> a(0+k*(k+1)), T2 -> a(0+k*k), S -> a(0+0)); lda=k
*
               CALL cpotrf( 'U', k, a( k*( k+1 ) ), k, info )
               IF( info.GT.0 )
     $            RETURN
               CALL ctrsm( 'R', 'U', 'N', 'N', k, k, cone,
     $                     a( k*( k+1 ) ), k, a( 0 ), k )
               CALL cherk( 'L', 'N', k, k, -one, a( 0 ), k, one,
     $                     a( k*k ), k )
               CALL cpotrf( 'L', k, a( k*k ), k, info )
               IF( info.GT.0 )
     $            info = info + k
*
            END IF
*
         END IF
*
      END IF
*
      RETURN
*
*     End of CPFTRF
*

◆ cpftri()

subroutine cpftri	(	character	transr,
		character	uplo,
		integer	n,
		complex, dimension( 0: * )	a,
		integer	info )

CPFTRI

Download CPFTRI + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPFTRI computes the inverse of a complex Hermitian positive definite
!> matrix A using the Cholesky factorization A = U**H*U or A = L*L**H
!> computed by CPFTRF.
!>

Parameters

[in]	TRANSR	!> TRANSR is CHARACTER*1 !> = 'N': The Normal TRANSR of RFP A is stored; !> = 'C': The Conjugate-transpose TRANSR of RFP A is stored. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension ( N*(N+1)/2 ); !> On entry, the Hermitian matrix A in RFP format. RFP format is !> described by TRANSR, UPLO, and N as follows: If TRANSR = 'N' !> then RFP A is (0:N,0:k-1) when N is even; k=N/2. RFP A is !> (0:N-1,0:k) when N is odd; k=N/2. IF TRANSR = 'C' then RFP is !> the Conjugate-transpose of RFP A as defined when !> TRANSR = 'N'. The contents of RFP A are defined by UPLO as !> follows: If UPLO = 'U' the RFP A contains the nt elements of !> upper packed A. If UPLO = 'L' the RFP A contains the elements !> of lower packed A. The LDA of RFP A is (N+1)/2 when TRANSR = !> 'C'. When TRANSR is 'N' the LDA is N+1 when N is even and N !> is odd. See the Note below for more details. !> !> On exit, the Hermitian inverse of the original matrix, in the !> same storage format. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, the (i,i) element of the factor U or L is !> zero, and the inverse could not be computed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  We first consider Standard Packed Format when N is even.
!>  We give an example where N = 6.
!>
!>      AP is Upper             AP is Lower
!>
!>   00 01 02 03 04 05       00
!>      11 12 13 14 15       10 11
!>         22 23 24 25       20 21 22
!>            33 34 35       30 31 32 33
!>               44 45       40 41 42 43 44
!>                  55       50 51 52 53 54 55
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:5,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(4:6,0:2) consists of
!>  conjugate-transpose of the first three columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(1:6,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:2,0:2) consists of
!>  conjugate-transpose of the last three columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N even and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                -- -- --
!>        03 04 05                33 43 53
!>                                   -- --
!>        13 14 15                00 44 54
!>                                      --
!>        23 24 25                10 11 55
!>
!>        33 34 35                20 21 22
!>        --
!>        00 44 45                30 31 32
!>        -- --
!>        01 11 55                40 41 42
!>        -- -- --
!>        02 12 22                50 51 52
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- -- --                -- -- -- -- -- --
!>     03 13 23 33 00 01 02    33 00 10 20 30 40 50
!>     -- -- -- -- --                -- -- -- -- --
!>     04 14 24 34 44 11 12    43 44 11 21 31 41 51
!>     -- -- -- -- -- --                -- -- -- --
!>     05 15 25 35 45 55 22    53 54 55 22 32 42 52
!>
!>
!>  We next  consider Standard Packed Format when N is odd.
!>  We give an example where N = 5.
!>
!>     AP is Upper                 AP is Lower
!>
!>   00 01 02 03 04              00
!>      11 12 13 14              10 11
!>         22 23 24              20 21 22
!>            33 34              30 31 32 33
!>               44              40 41 42 43 44
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:4,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(3:4,0:1) consists of
!>  conjugate-transpose of the first two   columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(0:4,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:1,1:2) consists of
!>  conjugate-transpose of the last two   columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N odd  and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                   -- --
!>        02 03 04                00 33 43
!>                                      --
!>        12 13 14                10 11 44
!>
!>        22 23 24                20 21 22
!>        --
!>        00 33 34                30 31 32
!>        -- --
!>        01 11 44                40 41 42
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- --                   -- -- -- -- --
!>     02 12 22 00 01             00 10 20 30 40
!>     -- -- -- --                   -- -- -- --
!>     03 13 23 33 11             33 11 21 31 41
!>     -- -- -- -- --                   -- -- --
!>     04 14 24 34 44             43 44 22 32 42
!>

Definition at line 211 of file cpftri.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  CPFTRI body: the triangular factor stored in RFP format in A is
*  first inverted by CTFTRI, then the triangular product
*  inv(U)*inv(U)^C or inv(L)^C*inv(L) is formed in place.
*
*  The product is built from the three RFP sub-blocks T1, T2
*  (triangular) and S (rectangular) in four steps per case:
*     1. CLAUUM on T1,
*     2. CHERK adding the S contribution to T1 (alpha = beta = ONE),
*     3. CTRMM overwriting S with its product with T2,
*     4. CLAUUM on T2.
*
*     .. Scalar Arguments ..
      CHARACTER          TRANSR, UPLO
      INTEGER            INFO, N
*     .. Array Arguments ..
      COMPLEX            A( 0: * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE
      COMPLEX            CONE
      parameter( one = 1.0e+0, cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LOWER, NISODD, NORMALTRANSR
      INTEGER            N1, N2, K
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla, ctftri, clauum, ctrmm, cherk
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          mod
*     ..
*     .. Executable Statements ..
*
*     Validate TRANSR, UPLO and N; the first offending argument
*     determines INFO.
*
      normaltransr = lsame( transr, 'N' )
      lower = lsame( uplo, 'L' )
      info = 0
      IF( .NOT.( normaltransr .OR. lsame( transr, 'C' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( lower .OR. lsame( uplo, 'U' ) ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPFTRI', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty matrix.
*
      IF( n.EQ.0 ) RETURN
*
*     Invert the triangular Cholesky factor U or L; a positive INFO
*     from CTFTRI is handed back to the caller unchanged.
*
      CALL ctftri( transr, uplo, 'N', n, a, info )
      IF( info.GT.0 ) RETURN
*
*     Parity of N; K = N/2 is needed only when N is even.
*
      nisodd = mod( n, 2 ).NE.0
      IF( .NOT.nisodd ) k = n / 2
*
*     Orders of the two triangular blocks (N1 + N2 = N).
*
      IF( lower ) THEN
         n2 = n / 2
         n1 = n - n2
      ELSE
         n1 = n / 2
         n2 = n - n1
      END IF
*
*     Triangular matrix multiply: one flat dispatch over the eight
*     (parity of N, TRANSR, UPLO) combinations.
*
      IF( nisodd .AND. normaltransr .AND. lower ) THEN
*
*        N odd, TRANSR = 'N', UPLO = 'L'  ( a(0:n-1,0:N1-1) )
*        T1 -> a(0), T2 -> a(n), S -> a(N1)
*
         CALL clauum( 'L', n1, a( 0 ), n, info )
         CALL cherk( 'L', 'C', n1, n2, one, a( n1 ), n, one,
     $               a( 0 ), n )
         CALL ctrmm( 'L', 'U', 'N', 'N', n2, n1, cone, a( n ), n,
     $               a( n1 ), n )
         CALL clauum( 'U', n2, a( n ), n, info )
*
      ELSE IF( nisodd .AND. normaltransr ) THEN
*
*        N odd, TRANSR = 'N', UPLO = 'U'  ( a(0:n-1,0:N2-1) )
*        T1 -> a(N2), T2 -> a(N1), S -> a(0)
*
         CALL clauum( 'L', n1, a( n2 ), n, info )
         CALL cherk( 'L', 'N', n1, n2, one, a( 0 ), n, one,
     $               a( n2 ), n )
         CALL ctrmm( 'R', 'U', 'C', 'N', n1, n2, cone, a( n1 ), n,
     $               a( 0 ), n )
         CALL clauum( 'U', n2, a( n1 ), n, info )
*
      ELSE IF( nisodd .AND. lower ) THEN
*
*        N odd, TRANSR = 'C', UPLO = 'L'
*        T1 -> a(0), T2 -> a(1), S -> a(0+N1*N1)
*
         CALL clauum( 'U', n1, a( 0 ), n1, info )
         CALL cherk( 'U', 'N', n1, n2, one, a( n1*n1 ), n1, one,
     $               a( 0 ), n1 )
         CALL ctrmm( 'R', 'L', 'N', 'N', n1, n2, cone, a( 1 ), n1,
     $               a( n1*n1 ), n1 )
         CALL clauum( 'L', n2, a( 1 ), n1, info )
*
      ELSE IF( nisodd ) THEN
*
*        N odd, TRANSR = 'C', UPLO = 'U'
*        T1 -> a(0+N2*N2), T2 -> a(0+N1*N2), S -> a(0)
*
         CALL clauum( 'U', n1, a( n2*n2 ), n2, info )
         CALL cherk( 'U', 'C', n1, n2, one, a( 0 ), n2, one,
     $               a( n2*n2 ), n2 )
         CALL ctrmm( 'L', 'L', 'C', 'N', n2, n1, cone, a( n1*n2 ),
     $               n2, a( 0 ), n2 )
         CALL clauum( 'L', n2, a( n1*n2 ), n2, info )
*
      ELSE IF( normaltransr .AND. lower ) THEN
*
*        N even, TRANSR = 'N', UPLO = 'L'  ( a(0:n,0:k-1) )
*        T1 -> a(1), T2 -> a(0), S -> a(k+1)
*
         CALL clauum( 'L', k, a( 1 ), n+1, info )
         CALL cherk( 'L', 'C', k, k, one, a( k+1 ), n+1, one,
     $               a( 1 ), n+1 )
         CALL ctrmm( 'L', 'U', 'N', 'N', k, k, cone, a( 0 ), n+1,
     $               a( k+1 ), n+1 )
         CALL clauum( 'U', k, a( 0 ), n+1, info )
*
      ELSE IF( normaltransr ) THEN
*
*        N even, TRANSR = 'N', UPLO = 'U'  ( a(0:n,0:k-1) )
*        T1 -> a(k+1), T2 -> a(k), S -> a(0)
*
         CALL clauum( 'L', k, a( k+1 ), n+1, info )
         CALL cherk( 'L', 'N', k, k, one, a( 0 ), n+1, one,
     $               a( k+1 ), n+1 )
         CALL ctrmm( 'R', 'U', 'C', 'N', k, k, cone, a( k ), n+1,
     $               a( 0 ), n+1 )
         CALL clauum( 'U', k, a( k ), n+1, info )
*
      ELSE IF( lower ) THEN
*
*        N even, TRANSR = 'C', UPLO = 'L'  (see paper)
*        T1 -> a(0+k), T2 -> a(0+0), S -> a(0+k*(k+1)); lda=k
*
         CALL clauum( 'U', k, a( k ), k, info )
         CALL cherk( 'U', 'N', k, k, one, a( k*( k+1 ) ), k, one,
     $               a( k ), k )
         CALL ctrmm( 'R', 'L', 'N', 'N', k, k, cone, a( 0 ), k,
     $               a( k*( k+1 ) ), k )
         CALL clauum( 'L', k, a( 0 ), k, info )
*
      ELSE
*
*        N even, TRANSR = 'C', UPLO = 'U'  (see paper)
*        T1 -> a(0+k*(k+1)), T2 -> a(0+k*k), S -> a(0+0); lda=k
*
         CALL clauum( 'U', k, a( k*( k+1 ) ), k, info )
         CALL cherk( 'U', 'C', k, k, one, a( 0 ), k, one,
     $               a( k*( k+1 ) ), k )
         CALL ctrmm( 'L', 'L', 'C', 'N', k, k, cone, a( k*k ), k,
     $               a( 0 ), k )
         CALL clauum( 'L', k, a( k*k ), k, info )
*
      END IF
*
      RETURN
*
*     End of CPFTRI
*

◆ cpftrs()

subroutine cpftrs	(	character	transr,
		character	uplo,
		integer	n,
		integer	nrhs,
		complex, dimension( 0: * )	a,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		integer	info )

CPFTRS

Download CPFTRS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPFTRS solves a system of linear equations A*X = B with a Hermitian
!> positive definite matrix A using the Cholesky factorization
!> A = U**H*U or A = L*L**H computed by CPFTRF.
!>

Parameters

[in]	TRANSR	!> TRANSR is CHARACTER*1 !> = 'N': The Normal TRANSR of RFP A is stored; !> = 'C': The Conjugate-transpose TRANSR of RFP A is stored. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of RFP A is stored; !> = 'L': Lower triangle of RFP A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrix B. NRHS >= 0. !>
[in]	A	!> A is COMPLEX array, dimension ( N*(N+1)/2 ); !> The triangular factor U or L from the Cholesky factorization !> of RFP A = U**H*U or RFP A = L*L**H, as computed by CPFTRF. !> See note below for more details about RFP A. !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> On entry, the right hand side matrix B. !> On exit, the solution matrix X. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  We first consider Standard Packed Format when N is even.
!>  We give an example where N = 6.
!>
!>      AP is Upper             AP is Lower
!>
!>   00 01 02 03 04 05       00
!>      11 12 13 14 15       10 11
!>         22 23 24 25       20 21 22
!>            33 34 35       30 31 32 33
!>               44 45       40 41 42 43 44
!>                  55       50 51 52 53 54 55
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:5,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(4:6,0:2) consists of
!>  conjugate-transpose of the first three columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(1:6,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:2,0:2) consists of
!>  conjugate-transpose of the last three columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N even and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                -- -- --
!>        03 04 05                33 43 53
!>                                   -- --
!>        13 14 15                00 44 54
!>                                      --
!>        23 24 25                10 11 55
!>
!>        33 34 35                20 21 22
!>        --
!>        00 44 45                30 31 32
!>        -- --
!>        01 11 55                40 41 42
!>        -- -- --
!>        02 12 22                50 51 52
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- -- --                -- -- -- -- -- --
!>     03 13 23 33 00 01 02    33 00 10 20 30 40 50
!>     -- -- -- -- --                -- -- -- -- --
!>     04 14 24 34 44 11 12    43 44 11 21 31 41 51
!>     -- -- -- -- -- --                -- -- -- --
!>     05 15 25 35 45 55 22    53 54 55 22 32 42 52
!>
!>
!>  We next  consider Standard Packed Format when N is odd.
!>  We give an example where N = 5.
!>
!>     AP is Upper                 AP is Lower
!>
!>   00 01 02 03 04              00
!>      11 12 13 14              10 11
!>         22 23 24              20 21 22
!>            33 34              30 31 32 33
!>               44              40 41 42 43 44
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:4,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(3:4,0:1) consists of
!>  conjugate-transpose of the first two   columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(0:4,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:1,1:2) consists of
!>  conjugate-transpose of the last two   columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N odd  and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                   -- --
!>        02 03 04                00 33 43
!>                                      --
!>        12 13 14                10 11 44
!>
!>        22 23 24                20 21 22
!>        --
!>        00 33 34                30 31 32
!>        -- --
!>        01 11 44                40 41 42
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- --                   -- -- -- -- --
!>     02 12 22 00 01             00 10 20 30 40
!>     -- -- -- --                   -- -- -- --
!>     03 13 23 33 11             33 11 21 31 41
!>     -- -- -- -- --                   -- -- --
!>     04 14 24 34 44             43 44 22 32 42
!>

Definition at line 219 of file cpftrs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  CPFTRS body: after validating its arguments, applies two CTFSM
*  triangular solves with the RFP factor in A to the right-hand
*  sides in B, which is overwritten in place.
*
*     .. Scalar Arguments ..
      CHARACTER          TRANSR, UPLO
      INTEGER            INFO, LDB, N, NRHS
*     ..
*     .. Array Arguments ..
      COMPLEX            A( 0: * ), B( LDB, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CONE
      parameter( cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
*     TRANS1 and TRANS2 hold the TRANS flag of the first and second
*     CTFSM call respectively.
      LOGICAL            LOWER, NORMALTRANSR
      CHARACTER          TRANS1, TRANS2
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla, ctfsm
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; the first offending one determines
*     INFO (LDB is the 7th argument).
*
      normaltransr = lsame( transr, 'N' )
      lower = lsame( uplo, 'L' )
      info = 0
      IF( .NOT.( normaltransr .OR. lsame( transr, 'C' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( lower .OR. lsame( uplo, 'U' ) ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( nrhs.LT.0 ) THEN
         info = -4
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -7
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPFTRS', -info )
         RETURN
      END IF
*
*     Nothing to solve for an empty system or no right-hand sides.
*
      IF( n.EQ.0 .OR. nrhs.EQ.0 ) RETURN
*
*     Two triangular solves: for LOWER the 'N' solve comes first and
*     the 'C' solve second; for UPPER the order is reversed.
*
      IF( lower ) THEN
         trans1 = 'N'
         trans2 = 'C'
      ELSE
         trans1 = 'C'
         trans2 = 'N'
      END IF
      CALL ctfsm( transr, 'L', uplo, trans1, 'N', n, nrhs, cone, a,
     $            b, ldb )
      CALL ctfsm( transr, 'L', uplo, trans2, 'N', n, nrhs, cone, a,
     $            b, ldb )
*
      RETURN
*
*     End of CPFTRS
*

◆ cppcon()

subroutine cppcon	(	character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		real	anorm,
		real	rcond,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CPPCON

Download CPPCON + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPPCON estimates the reciprocal of the condition number (in the
!> 1-norm) of a complex Hermitian positive definite packed matrix using
!> the Cholesky factorization A = U**H*U or A = L*L**H computed by
!> CPPTRF.
!>
!> An estimate is obtained for norm(inv(A)), and the reciprocal of the
!> condition number is computed as RCOND = 1 / (ANORM * norm(inv(A))).
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The triangular factor U or L from the Cholesky factorization !> A = U**H*U or A = L*L**H, packed columnwise in a linear !> array. The j-th column of U or L is stored in the array AP !> as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = U(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = L(i,j) for j<=i<=n. !>
[in]	ANORM	!> ANORM is REAL !> The 1-norm (or infinity-norm) of the Hermitian matrix A. !>
[out]	RCOND	!> RCOND is REAL !> The reciprocal of the condition number of the matrix A, !> computed as RCOND = 1/(ANORM * AINVNM), where AINVNM is an !> estimate of the 1-norm of inv(A) computed in this routine. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 117 of file cppcon.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, N
      REAL               ANORM, RCOND
*     ..
*     .. Array Arguments ..
      REAL               RWORK( * )
      COMPLEX            AP( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     Outline of the body:
*       1. Validate UPLO, N and ANORM; a bad argument is reported
*          through XERBLA and the routine returns with INFO < 0.
*       2. Quick returns: N = 0 gives RCOND = 1, ANORM = 0 gives
*          RCOND = 0.
*       3. Call CLACN2 in a loop.  Each time it comes back with a
*          nonzero KASE, WORK(1:N) is passed through two packed
*          triangular solves (CLATPS) and rescaled, then CLACN2 is
*          called again.
*       4. When CLACN2 returns KASE = 0, AINVNM holds its estimate
*          and RCOND = ( 1 / AINVNM ) / ANORM.
*
*     .. Parameters ..
      REAL               ONE, ZERO
      parameter( one = 1.0e+0, zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      CHARACTER          NORMIN
      INTEGER            IX, KASE
      REAL               AINVNM, SCALE, SCALEL, SCALEU, SMLNUM
      COMPLEX            ZDUM
*     ..
*     .. Local Arrays ..
*     ISAVE is only ever handed to CLACN2; this routine never reads
*     or writes its entries directly.
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ICAMAX
      REAL               SLAMCH
      EXTERNAL           lsame, icamax, slamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           clacn2, clatps, csrscl, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, real
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
*     CABS1(z) = |Re(z)| + |Im(z)|, used below as the magnitude of a
*     complex entry of WORK.
      cabs1( zdum ) = abs( real( zdum ) ) + abs( aimag( zdum ) )
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.  The INFO values are the negated
*     argument positions: UPLO is argument 1, N is 2, ANORM is 4.
*
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( anorm.LT.zero ) THEN
         info = -4
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPPCON', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
*     RCOND is preset to zero so that every later exit which does not
*     assign it (ANORM = 0, the GO TO 20 bail-out, or AINVNM = 0)
*     returns zero.
*
      rcond = zero
      IF( n.EQ.0 ) THEN
         rcond = one
         RETURN
      ELSE IF( anorm.EQ.zero ) THEN
         RETURN
      END IF
*
      smlnum = slamch( 'Safe minimum' )
*
*     Estimate the 1-norm of the inverse.
*
*     KASE = 0 starts the CLACN2 iteration.  NORMIN is 'N' for the
*     very first CLATPS call only and 'Y' for every call after it.
*     NOTE(review): presumably 'Y' tells CLATPS that RWORK already
*     holds data from an earlier call - confirm against the CLATPS
*     documentation.
*
      kase = 0
      normin = 'N'
   10 CONTINUE
*
*     WORK(1:N) is the vector exchanged with CLACN2; WORK(N+1) onward
*     is passed as its separate second argument.  The loop ends when
*     CLACN2 returns KASE = 0.
*
      CALL clacn2( n, work( n+1 ), work, ainvnm, kase, isave )
      IF( kase.NE.0 ) THEN
*
*        Both branches apply the same pair of solves to WORK(1:N),
*        whatever nonzero value KASE has; only the stored triangle
*        differs.
*
         IF( upper ) THEN
*
*           Multiply by inv(U**H).
*
            CALL clatps( 'Upper', 'Conjugate transpose', 'Non-unit',
     $                   normin, n, ap, work, scalel, rwork, info )
            normin = 'Y'
*
*           Multiply by inv(U).
*
            CALL clatps( 'Upper', 'No transpose', 'Non-unit', normin, n,
     $                   ap, work, scaleu, rwork, info )
         ELSE
*
*           Multiply by inv(L).
*
            CALL clatps( 'Lower', 'No transpose', 'Non-unit', normin, n,
     $                   ap, work, scalel, rwork, info )
            normin = 'Y'
*
*           Multiply by inv(L**H).
*
            CALL clatps( 'Lower', 'Conjugate transpose', 'Non-unit',
     $                   normin, n, ap, work, scaleu, rwork, info )
         END IF
*
*        Multiply by 1/SCALE if doing so will not cause overflow.
*
*        SCALE combines the scale factors of the two solves.  IX is
*        the index ICAMAX picks in WORK(1:N); its CABS1 magnitude is
*        the reference for the overflow test.  If SCALE is zero or
*        too small relative to that magnitude, the estimate is
*        abandoned by jumping to label 20, which leaves RCOND = 0.
*
         scale = scalel*scaleu
         IF( scale.NE.one ) THEN
            ix = icamax( n, work, 1 )
            IF( scale.LT.cabs1( work( ix ) )*smlnum .OR. scale.EQ.zero )
     $         GO TO 20
            CALL csrscl( n, scale, work, 1 )
         END IF
         GO TO 10
      END IF
*
*     Compute the estimate of the reciprocal condition number.
*     (Skipped when AINVNM is zero, so RCOND keeps its preset zero.)
*
      IF( ainvnm.NE.zero )
     $   rcond = ( one / ainvnm ) / anorm
*
*     Common exit, also the target of the overflow bail-out above.
*
   20 CONTINUE
      RETURN
*
*     End of CPPCON
*

◆ cppequ()

subroutine cppequ	(	character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		real, dimension( * )	s,
		real	scond,
		real	amax,
		integer	info )

CPPEQU

Download CPPEQU + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPPEQU computes row and column scalings intended to equilibrate a
!> Hermitian positive definite matrix A in packed storage and reduce
!> its condition number (with respect to the two-norm).  S contains the
!> scale factors, S(i)=1/sqrt(A(i,i)), chosen so that the scaled matrix
!> B with elements B(i,j)=S(i)*A(i,j)*S(j) has ones on the diagonal.
!> This choice of S puts the condition number of B within a factor N of
!> the smallest possible condition number over all possible diagonal
!> scalings.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The upper or lower triangle of the Hermitian matrix A, packed !> columnwise in a linear array. The j-th column of A is stored !> in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !>
[out]	S	!> S is REAL array, dimension (N) !> If INFO = 0, S contains the scale factors for A. !>
[out]	SCOND	!> SCOND is REAL !> If INFO = 0, SCOND contains the ratio of the smallest S(i) to !> the largest S(i). If SCOND >= 0.1 and AMAX is neither too !> large nor too small, it is not worth scaling by S. !>
[out]	AMAX	!> AMAX is REAL !> Absolute value of largest matrix element. If AMAX is very !> close to overflow or very close to underflow, the matrix !> should be scaled. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, the i-th diagonal element is nonpositive. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 116 of file cppequ.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, N
      REAL               AMAX, SCOND
*     ..
*     .. Array Arguments ..
      REAL               S( * )
      COMPLEX            AP( * )
*     ..
*
*  =====================================================================
*
*     The body gathers the real parts of the diagonal of the packed
*     matrix into S while tracking the smallest (DMIN) and largest
*     (AMAX) of them.  It then either reports the first non-positive
*     diagonal entry through INFO or turns S into the scale factors
*     1/sqrt(A(k,k)) and sets SCOND.
*
*     .. Parameters ..
      REAL               ONE, ZERO
      parameter( one = 1.0e+0, zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            K, KDIAG
      REAL               DMIN
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min, real, sqrt
*     ..
*     .. Executable Statements ..
*
*     Argument validation.  A bad UPLO (argument 1) takes precedence
*     over a negative N (argument 2), hence the order of the two
*     assignments below.
*
      upper = lsame( uplo, 'U' )
      info = 0
      IF( n.LT.0 ) info = -2
      IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) ) info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPPEQU', -info )
         RETURN
      END IF
*
*     An empty matrix needs no scaling.
*
      IF( n.EQ.0 ) THEN
         scond = one
         amax = zero
         RETURN
      END IF
*
*     Visit the diagonal entries in order.  The first one is AP(1).
*     Moving from diagonal K-1 to diagonal K advances the packed
*     position by K for upper storage and by N-K+2 for lower storage.
*
      kdiag = 1
      s( 1 ) = real( ap( 1 ) )
      dmin = s( 1 )
      amax = s( 1 )
      DO k = 2, n
         IF( upper ) THEN
            kdiag = kdiag + k
         ELSE
            kdiag = kdiag + n - k + 2
         END IF
         s( k ) = real( ap( kdiag ) )
         dmin = min( dmin, s( k ) )
         amax = max( amax, s( k ) )
      END DO
*
      IF( dmin.LE.zero ) THEN
*
*        Some diagonal entry is not positive.  Return the index of
*        the first such entry in INFO; S still holds the diagonal
*        values and SCOND is not assigned on this path.
*
         DO k = 1, n
            IF( s( k ).LE.zero ) THEN
               info = k
               RETURN
            END IF
         END DO
      ELSE
*
*        Replace each stored diagonal value by the reciprocal of its
*        square root, then form
*           SCOND = min(S(k)) / max(S(k)) = sqrt(DMIN) / sqrt(AMAX).
*
         DO k = 1, n
            s( k ) = one / sqrt( s( k ) )
         END DO
         scond = sqrt( dmin ) / sqrt( amax )
      END IF
      RETURN
*
*     End of CPPEQU
*

◆ cpprfs()

subroutine cpprfs	(	character	uplo,
		integer	n,
		integer	nrhs,
		complex, dimension( * )	ap,
		complex, dimension( * )	afp,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldx, * )	x,
		integer	ldx,
		real, dimension( * )	ferr,
		real, dimension( * )	berr,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CPPRFS

Download CPPRFS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPPRFS improves the computed solution to a system of linear
!> equations when the coefficient matrix is Hermitian positive definite
!> and packed, and provides error bounds and backward error estimates
!> for the solution.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrices B and X. NRHS >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The upper or lower triangle of the Hermitian matrix A, packed !> columnwise in a linear array. The j-th column of A is stored !> in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !>
[in]	AFP	!> AFP is COMPLEX array, dimension (N*(N+1)/2) !> The triangular factor U or L from the Cholesky factorization !> A = U**H*U or A = L*L**H, as computed by SPPTRF/CPPTRF, !> packed columnwise in a linear array in the same format as A !> (see AP). !>
[in]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> The right hand side matrix B. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[in,out]	X	!> X is COMPLEX array, dimension (LDX,NRHS) !> On entry, the solution matrix X, as computed by CPPTRS. !> On exit, the improved solution matrix X. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the array X. LDX >= max(1,N). !>
[out]	FERR	!> FERR is REAL array, dimension (NRHS) !> The estimated forward error bound for each solution vector !> X(j) (the j-th column of the solution matrix X). !> If XTRUE is the true solution corresponding to X(j), FERR(j) !> is an estimated upper bound for the magnitude of the largest !> element in (X(j) - XTRUE) divided by the magnitude of the !> largest element in X(j). The estimate is as reliable as !> the estimate for RCOND, and is almost always a slight !> overestimate of the true error. !>
[out]	BERR	!> BERR is REAL array, dimension (NRHS) !> The componentwise relative backward error of each solution !> vector X(j) (i.e., the smallest relative change in !> any element of A or B that makes X(j) an exact solution). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Internal Parameters:

!>  ITMAX is the maximum number of steps of iterative refinement.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 169 of file cpprfs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDB, LDX, N, NRHS
*     ..
*     .. Array Arguments ..
      REAL               BERR( * ), FERR( * ), RWORK( * )
      COMPLEX            AFP( * ), AP( * ), B( LDB, * ), WORK( * ),
     $                   X( LDX, * )
*     ..
*
*  ====================================================================
*
*     Outline of the body, repeated for every right hand side J:
*       1. Form the residual R = B(:,J) - A*X(:,J) in WORK(1:N).
*       2. Accumulate abs(A)*abs(X) + abs(B) in RWORK(1:N) and derive
*          the backward error BERR(J).
*       3. While the stopping test allows it, solve for a correction
*          with CPPTRS, add it to X(:,J) and go back to step 1.
*       4. Overwrite RWORK with the weights W and drive CLACN2 to
*          obtain FERR(J), then divide by the largest CABS1 entry of
*          X(:,J).
*
*     .. Parameters ..
      INTEGER            ITMAX
      parameter( itmax = 5 )
      REAL               ZERO
      parameter( zero = 0.0e+0 )
      COMPLEX            CONE
      parameter( cone = ( 1.0e+0, 0.0e+0 ) )
      REAL               TWO
      parameter( two = 2.0e+0 )
      REAL               THREE
      parameter( three = 3.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            COUNT, I, IK, J, K, KASE, KK, NZ
      REAL               EPS, LSTRES, S, SAFE1, SAFE2, SAFMIN, XK
      COMPLEX            ZDUM
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           caxpy, ccopy, chpmv, clacn2, cpptrs, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, real
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SLAMCH
      EXTERNAL           lsame, slamch
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
*     CABS1(z) = |Re(z)| + |Im(z)| is the magnitude used for every
*     complex entry in this routine.
      cabs1( zdum ) = abs( real( zdum ) ) + abs( aimag( zdum ) )
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.  The INFO values are the negated
*     argument positions (LDB is argument 7, LDX is argument 9).
*
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( nrhs.LT.0 ) THEN
         info = -3
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -7
      ELSE IF( ldx.LT.max( 1, n ) ) THEN
         info = -9
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPPRFS', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
*     With N = 0 every error bound is set to zero; with NRHS = 0 the
*     loop below does not execute.
*
      IF( n.EQ.0 .OR. nrhs.EQ.0 ) THEN
         DO 10 j = 1, nrhs
            ferr( j ) = zero
            berr( j ) = zero
   10    CONTINUE
         RETURN
      END IF
*
*     NZ = maximum number of nonzero elements in each row of A, plus 1
*
*     SAFE1 and SAFE2 are the thresholds used below to guard the
*     backward error quotient against tiny denominators.
*
      nz = n + 1
      eps = slamch( 'Epsilon' )
      safmin = slamch( 'Safe minimum' )
      safe1 = nz*safmin
      safe2 = safe1 / eps
*
*     Do for each right hand side
*
      DO 140 j = 1, nrhs
*
*        COUNT numbers the refinement passes for this column and
*        LSTRES holds the BERR(J) of the previous pass; it starts at
*        THREE before any pass has been made.
*
         count = 1
         lstres = three
   20    CONTINUE
*
*        Loop until stopping criterion is satisfied.
*
*        Compute residual R = B - A * X
*
*        WORK(1:N) receives column J of B and is then updated by
*        CHPMV with the packed matrix AP and column J of X.
*
         CALL ccopy( n, b( 1, j ), 1, work, 1 )
         CALL chpmv( uplo, n, -cone, ap, x( 1, j ), 1, cone, work, 1 )
*
*        Compute componentwise relative backward error from formula
*
*        max(i) ( abs(R(i)) / ( abs(A)*abs(X) + abs(B) )(i) )
*
*        where abs(Z) is the componentwise absolute value of the matrix
*        or vector Z.  If the i-th component of the denominator is less
*        than SAFE2, then SAFE1 is added to the i-th components of the
*        numerator and denominator before dividing.
*
         DO 30 i = 1, n
            rwork( i ) = cabs1( b( i, j ) )
   30    CONTINUE
*
*        Compute abs(A)*abs(X) + abs(B).
*
*        Only one triangle of A is stored, so every off-diagonal
*        entry AP(IK) is used twice: once for row I (times XK) and
*        once, through the running sum S, for row K.  Only the real
*        part of a diagonal entry is used.  KK is the packed position
*        where column K starts.
*
         kk = 1
         IF( upper ) THEN
*
*           Upper storage: column K holds rows 1..K, so its diagonal
*           entry is AP(KK+K-1) and the next column starts K entries
*           later.
*
            DO 50 k = 1, n
               s = zero
               xk = cabs1( x( k, j ) )
               ik = kk
               DO 40 i = 1, k - 1
                  rwork( i ) = rwork( i ) + cabs1( ap( ik ) )*xk
                  s = s + cabs1( ap( ik ) )*cabs1( x( i, j ) )
                  ik = ik + 1
   40          CONTINUE
               rwork( k ) = rwork( k ) + abs( real( ap( kk+k-1 ) ) )*
     $                      xk + s
               kk = kk + k
   50       CONTINUE
         ELSE
*
*           Lower storage: column K holds rows K..N, so its diagonal
*           entry is AP(KK) and the next column starts N-K+1 entries
*           later.
*
            DO 70 k = 1, n
               s = zero
               xk = cabs1( x( k, j ) )
               rwork( k ) = rwork( k ) + abs( real( ap( kk ) ) )*xk
               ik = kk + 1
               DO 60 i = k + 1, n
                  rwork( i ) = rwork( i ) + cabs1( ap( ik ) )*xk
                  s = s + cabs1( ap( ik ) )*cabs1( x( i, j ) )
                  ik = ik + 1
   60          CONTINUE
               rwork( k ) = rwork( k ) + s
               kk = kk + ( n-k+1 )
   70       CONTINUE
         END IF
*
*        S is reused here as the running maximum of the componentwise
*        quotients; it becomes BERR(J).
*
         s = zero
         DO 80 i = 1, n
            IF( rwork( i ).GT.safe2 ) THEN
               s = max( s, cabs1( work( i ) ) / rwork( i ) )
            ELSE
               s = max( s, ( cabs1( work( i ) )+safe1 ) /
     $             ( rwork( i )+safe1 ) )
            END IF
   80    CONTINUE
         berr( j ) = s
*
*        Test stopping criterion. Continue iterating if
*           1) The residual BERR(J) is larger than machine epsilon, and
*           2) BERR(J) decreased by at least a factor of 2 during the
*              last iteration, and
*           3) At most ITMAX iterations tried.
*
         IF( berr( j ).GT.eps .AND. two*berr( j ).LE.lstres .AND.
     $       count.LE.itmax ) THEN
*
*           Update solution and try again.
*
*           CPPTRS overwrites the residual in WORK(1:N) with the
*           solution of the system for the factor AFP, and CAXPY adds
*           that correction to column J of X.  Note that the INFO
*           argument of this routine is passed to CPPTRS as its own
*           INFO output.
*
            CALL cpptrs( uplo, n, 1, afp, work, n, info )
            CALL caxpy( n, cone, work, 1, x( 1, j ), 1 )
            lstres = berr( j )
            count = count + 1
            GO TO 20
         END IF
*
*        Bound error from formula
*
*        norm(X - XTRUE) / norm(X) .le. FERR =
*        norm( abs(inv(A))*
*           ( abs(R) + NZ*EPS*( abs(A)*abs(X)+abs(B) ))) / norm(X)
*
*        where
*          norm(Z) is the magnitude of the largest component of Z
*          inv(A) is the inverse of A
*          abs(Z) is the componentwise absolute value of the matrix or
*             vector Z
*          NZ is the maximum number of nonzeros in any row of A, plus 1
*          EPS is machine epsilon
*
*        The i-th component of abs(R)+NZ*EPS*(abs(A)*abs(X)+abs(B))
*        is incremented by SAFE1 if the i-th component of
*        abs(A)*abs(X) + abs(B) is less than SAFE2.
*
*        Use CLACN2 to estimate the infinity-norm of the matrix
*           inv(A) * diag(W),
*        where W = abs(R) + NZ*EPS*( abs(A)*abs(X)+abs(B) )
*
*        From here on RWORK(1:N) holds W instead of
*        abs(A)*abs(X) + abs(B).
*
         DO 90 i = 1, n
            IF( rwork( i ).GT.safe2 ) THEN
               rwork( i ) = cabs1( work( i ) ) + nz*eps*rwork( i )
            ELSE
               rwork( i ) = cabs1( work( i ) ) + nz*eps*rwork( i ) +
     $                      safe1
            END IF
   90    CONTINUE
*
*        CLACN2 loop: WORK(1:N) is the vector exchanged with CLACN2
*        and WORK(N+1) onward is passed as its second argument.  The
*        estimate is delivered in FERR(J); the loop ends when KASE
*        comes back as 0.
*
         kase = 0
  100    CONTINUE
         CALL clacn2( n, work( n+1 ), work, ferr( j ), kase, isave )
         IF( kase.NE.0 ) THEN
            IF( kase.EQ.1 ) THEN
*
*              Multiply by diag(W)*inv(A**H).
*
*              (Solve first, then scale each entry by W(i).)
*
               CALL cpptrs( uplo, n, 1, afp, work, n, info )
               DO 110 i = 1, n
                  work( i ) = rwork( i )*work( i )
  110          CONTINUE
            ELSE IF( kase.EQ.2 ) THEN
*
*              Multiply by inv(A)*diag(W).
*
*              (Scale each entry by W(i) first, then solve.)
*
               DO 120 i = 1, n
                  work( i ) = rwork( i )*work( i )
  120          CONTINUE
               CALL cpptrs( uplo, n, 1, afp, work, n, info )
            END IF
            GO TO 100
         END IF
*
*        Normalize error.
*
*        LSTRES is reused as the largest CABS1 magnitude in column J
*        of X.  FERR(J) is left unnormalized when that magnitude is
*        zero.
*
         lstres = zero
         DO 130 i = 1, n
            lstres = max( lstres, cabs1( x( i, j ) ) )
  130    CONTINUE
         IF( lstres.NE.zero )
     $      ferr( j ) = ferr( j ) / lstres
*
  140 CONTINUE
*
      RETURN
*
*     End of CPPRFS
*

◆ cpptrf()

subroutine cpptrf	(	character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		integer	info )

CPPTRF

Download CPPTRF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPPTRF computes the Cholesky factorization of a complex Hermitian
!> positive definite matrix A stored in packed format.
!>
!> The factorization has the form
!>    A = U**H * U,  if UPLO = 'U', or
!>    A = L  * L**H,  if UPLO = 'L',
!> where U is an upper triangular matrix and L is lower triangular.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> On entry, the upper or lower triangle of the Hermitian matrix !> A, packed columnwise in a linear array. The j-th column of A !> is stored in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !> See below for further details. !> !> On exit, if INFO = 0, the triangular factor U or L from the !> Cholesky factorization A = U**H*U or A = L*L**H, in the same !> storage format as A. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, the leading minor of order i is not !> positive definite, and the factorization could not be !> completed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The packed storage scheme is illustrated by the following example
!>  when N = 4, UPLO = 'U':
!>
!>  Two-dimensional storage of the Hermitian matrix A:
!>
!>     a11 a12 a13 a14
!>         a22 a23 a24
!>             a33 a34     (aij = conjg(aji))
!>                 a44
!>
!>  Packed storage of the upper triangle of A:
!>
!>  AP = [ a11, a12, a22, a13, a23, a33, a14, a24, a34, a44 ]
!>

Definition at line 118 of file cpptrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      COMPLEX            AP( * )
*     ..
*
*  =====================================================================
*
*     The body factors the packed matrix in place, one column at a
*     time.  As soon as a pivot AJJ is found to be <= 0 it is stored
*     back on the diagonal, INFO is set to the column index and the
*     routine returns.
*
*     .. Parameters ..
      REAL               ZERO, ONE
      parameter( zero = 0.0e+0, one = 1.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            J, KCOL, KDIAG
      REAL               AJJ
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      COMPLEX            CDOTC
      EXTERNAL           lsame, cdotc
*     ..
*     .. External Subroutines ..
      EXTERNAL           chpr, csscal, ctpsv, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          real, sqrt
*     ..
*     .. Executable Statements ..
*
*     Argument validation.  A bad UPLO (argument 1) takes precedence
*     over a negative N (argument 2).
*
      upper = lsame( uplo, 'U' )
      info = 0
      IF( n.LT.0 ) info = -2
      IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) ) info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPPTRF', -info )
         RETURN
      END IF
*
*     Nothing to factor for an empty matrix.
*
      IF( n.EQ.0 ) RETURN
*
      IF( upper ) THEN
*
*        A = U**H * U.  KCOL is the packed position of the first
*        entry of column J and KDIAG that of its diagonal entry.
*
         kdiag = 0
         DO j = 1, n
            kcol = kdiag + 1
            kdiag = kdiag + j
*
*           Entries 1:J-1 of column J come from a triangular solve
*           with the leading (J-1)-by-(J-1) factor.
*
            IF( j.GT.1 ) THEN
               CALL ctpsv( 'Upper', 'Conjugate transpose', 'Non-unit',
     $                     j-1, ap, ap( kcol ), 1 )
            END IF
*
*           Pivot for U(J,J); stop if it is not positive.
*
            ajj = real( real( ap( kdiag ) ) -
     $            cdotc( j-1, ap( kcol ), 1, ap( kcol ), 1 ) )
            IF( ajj.LE.zero ) THEN
               ap( kdiag ) = ajj
               info = j
               RETURN
            END IF
            ap( kdiag ) = sqrt( ajj )
         END DO
      ELSE
*
*        A = L * L**H.  KDIAG is the packed position of L(J,J).
*
         kdiag = 1
         DO j = 1, n
*
*           Pivot for L(J,J); stop if it is not positive.
*
            ajj = real( ap( kdiag ) )
            IF( ajj.LE.zero ) THEN
               ap( kdiag ) = ajj
               info = j
               RETURN
            END IF
            ajj = sqrt( ajj )
            ap( kdiag ) = ajj
*
*           Scale the rest of column J, apply the rank-one update to
*           the trailing packed submatrix, and step to the next
*           diagonal entry.
*
            IF( j.LT.n ) THEN
               CALL csscal( n-j, one / ajj, ap( kdiag+1 ), 1 )
               CALL chpr( 'Lower', n-j, -one, ap( kdiag+1 ), 1,
     $                    ap( kdiag+n-j+1 ) )
               kdiag = kdiag + n - j + 1
            END IF
         END DO
      END IF
*
      RETURN
*
*     End of CPPTRF
*

◆ cpptri()

subroutine cpptri	(	character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		integer	info )

CPPTRI

Download CPPTRI + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPPTRI computes the inverse of a complex Hermitian positive definite
!> matrix A using the Cholesky factorization A = U**H*U or A = L*L**H
!> computed by CPPTRF.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangular factor is stored in AP; !> = 'L': Lower triangular factor is stored in AP. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> On entry, the triangular factor U or L from the Cholesky !> factorization A = U**H*U or A = L*L**H, packed columnwise as !> a linear array. The j-th column of U or L is stored in the !> array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = U(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = L(i,j) for j<=i<=n. !> !> On exit, the upper or lower triangle of the (Hermitian) !> inverse of A, overwriting the input factor U or L. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, the (i,i) element of the factor U or L is !> zero, and the inverse could not be computed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 92 of file cpptri.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      COMPLEX            AP( * )
*     ..
*
*  =====================================================================
*
*     The body first inverts the packed triangular factor in place
*     with CTPTRI, then overwrites it column by column with the
*     product of that inverse and its conjugate transpose.
*
*     .. Parameters ..
      REAL               ONE
      parameter( one = 1.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            J, KCOL, KDIAG, KNEXT
      REAL               DJJ
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      COMPLEX            CDOTC
      EXTERNAL           lsame, cdotc
*     ..
*     .. External Subroutines ..
      EXTERNAL           chpr, csscal, ctpmv, ctptri, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          real
*     ..
*     .. Executable Statements ..
*
*     Argument validation.  A bad UPLO (argument 1) takes precedence
*     over a negative N (argument 2).
*
      upper = lsame( uplo, 'U' )
      info = 0
      IF( n.LT.0 ) info = -2
      IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) ) info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPPTRI', -info )
         RETURN
      END IF
*
*     Nothing to invert for an empty matrix.
*
      IF( n.EQ.0 ) RETURN
*
*     Step 1: invert the triangular factor in place.  A positive INFO
*     from CTPTRI is handed straight back to the caller.
*
      CALL ctptri( uplo, 'Non-unit', n, ap, info )
      IF( info.GT.0 ) RETURN
*
      IF( upper ) THEN
*
*        Step 2 (upper): form inv(U) * inv(U)**H.  KCOL is the packed
*        position of the first entry of column J, KDIAG that of its
*        diagonal entry.
*
         kdiag = 0
         DO j = 1, n
            kcol = kdiag + 1
            kdiag = kdiag + j
            IF( j.GT.1 ) THEN
               CALL chpr( 'Upper', j-1, one, ap( kcol ), 1, ap )
            END IF
            djj = real( ap( kdiag ) )
            CALL csscal( j, djj, ap( kcol ), 1 )
         END DO
      ELSE
*
*        Step 2 (lower): form inv(L)**H * inv(L).  KDIAG is the
*        packed position of the current diagonal entry and KNEXT that
*        of the following one.
*
         kdiag = 1
         DO j = 1, n
            knext = kdiag + n - j + 1
            ap( kdiag ) = real( cdotc( n-j+1, ap( kdiag ), 1,
     $                    ap( kdiag ), 1 ) )
            IF( j.LT.n ) THEN
               CALL ctpmv( 'Lower', 'Conjugate transpose', 'Non-unit',
     $                     n-j, ap( knext ), ap( kdiag+1 ), 1 )
            END IF
            kdiag = knext
         END DO
      END IF
*
      RETURN
*
*     End of CPPTRI
*

◆ cpptrs()

subroutine cpptrs	(	character	uplo,
		integer	n,
		integer	nrhs,
		complex, dimension( * )	ap,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		integer	info )

CPPTRS

Download CPPTRS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPPTRS solves a system of linear equations A*X = B with a Hermitian
!> positive definite matrix A in packed storage using the Cholesky
!> factorization A = U**H*U or A = L*L**H computed by CPPTRF.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrix B. NRHS >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The triangular factor U or L from the Cholesky factorization !> A = U**H*U or A = L*L**H, packed columnwise in a linear !> array. The j-th column of U or L is stored in the array AP !> as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = U(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = L(i,j) for j<=i<=n. !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> On entry, the right hand side matrix B. !> On exit, the solution matrix X. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 107 of file cpptrs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDB, N, NRHS
*     ..
*     .. Array Arguments ..
      COMPLEX            AP( * ), B( LDB, * )
*     ..
*
*  =====================================================================
*
*     The body solves A*X = B one right hand side at a time.  Each
*     column of B is overwritten in place by two successive packed
*     triangular solves (CTPSV) with the factor stored in AP.
*
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            JRHS
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           ctpsv, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Argument validation.  The checks are applied in reverse so that
*     the lowest-numbered offending argument determines INFO
*     (UPLO = 1, N = 2, NRHS = 3, LDB = 6).
*
      upper = lsame( uplo, 'U' )
      info = 0
      IF( ldb.LT.max( 1, n ) ) info = -6
      IF( nrhs.LT.0 ) info = -3
      IF( n.LT.0 ) info = -2
      IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) ) info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPPTRS', -info )
         RETURN
      END IF
*
*     Nothing to solve when either dimension is zero.
*
      IF( n.EQ.0 .OR. nrhs.EQ.0 ) RETURN
*
      DO jrhs = 1, nrhs
         IF( upper ) THEN
*
*           A = U**H * U: solve with U**H first, then with U.
*
            CALL ctpsv( 'Upper', 'Conjugate transpose', 'Non-unit', n,
     $                  ap, b( 1, jrhs ), 1 )
            CALL ctpsv( 'Upper', 'No transpose', 'Non-unit', n, ap,
     $                  b( 1, jrhs ), 1 )
         ELSE
*
*           A = L * L**H: solve with L first, then with L**H.
*
            CALL ctpsv( 'Lower', 'No transpose', 'Non-unit', n, ap,
     $                  b( 1, jrhs ), 1 )
            CALL ctpsv( 'Lower', 'Conjugate transpose', 'Non-unit', n,
     $                  ap, b( 1, jrhs ), 1 )
         END IF
      END DO
*
      RETURN
*
*     End of CPPTRS
*

◆ cpstf2()

subroutine cpstf2	(	character	uplo,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		integer, dimension( n )	piv,
		integer	rank,
		real	tol,
		real, dimension( 2*n )	work,
		integer	info )

CPSTF2 computes the Cholesky factorization with complete pivoting of complex Hermitian positive semidefinite matrix.

Download CPSTF2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPSTF2 computes the Cholesky factorization with complete
!> pivoting of a complex Hermitian positive semidefinite matrix A.
!>
!> The factorization has the form
!>    P**T * A * P = U**H * U ,  if UPLO = 'U',
!>    P**T * A * P = L  * L**H,  if UPLO = 'L',
!> where U is an upper triangular matrix and L is lower triangular, and
!> P is stored as vector PIV.
!>
!> This algorithm does not attempt to check that A is positive
!> semidefinite. This version of the algorithm calls level 2 BLAS.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the upper or lower triangular part of the !> Hermitian matrix A is stored. !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the Hermitian matrix A. If UPLO = 'U', the leading !> n by n upper triangular part of A contains the upper !> triangular part of the matrix A, and the strictly lower !> triangular part of A is not referenced. If UPLO = 'L', the !> leading n by n lower triangular part of A contains the lower !> triangular part of the matrix A, and the strictly upper !> triangular part of A is not referenced. !> !> On exit, if INFO = 0, the factor U or L from the Cholesky !> factorization as above. !>
[out]	PIV	!> PIV is INTEGER array, dimension (N) !> PIV is such that the nonzero entries are P( PIV(K), K ) = 1. !>
[out]	RANK	!> RANK is INTEGER !> The rank of A given by the number of steps the algorithm !> completed. !>
[in]	TOL	!> TOL is REAL !> User defined tolerance. If TOL < 0, then N*U*MAX( A( K,K ) ) !> will be used, where U = SLAMCH('Epsilon'). The algorithm terminates at the (K-1)st step !> if the pivot <= TOL. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	WORK	!> WORK is REAL array, dimension (2*N) !> Work space. !>
[out]	INFO	!> INFO is INTEGER !> < 0: If INFO = -K, the K-th argument had an illegal value, !> = 0: algorithm completed successfully, and !> > 0: the matrix A is either rank deficient with computed rank !> as returned in RANK, or is not positive semidefinite. See !> Section 7 of LAPACK Working Note #161 for further !> information. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 141 of file cpstf2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Unblocked Cholesky factorization with complete pivoting.  At each
*     step J the largest remaining updated diagonal entry is selected
*     as the pivot; the factorization stops early with INFO = 1 and
*     RANK = J-1 as soon as that pivot is <= SSTOP or is NaN.
*
*     .. Scalar Arguments ..
      REAL               TOL
      INTEGER            INFO, LDA, N, RANK
      CHARACTER          UPLO
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * )
      REAL               WORK( 2*N )
      INTEGER            PIV( N )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      parameter( one = 1.0e+0, zero = 0.0e+0 )
      COMPLEX            CONE
      parameter( cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      COMPLEX            CTEMP
      REAL               AJJ, SSTOP, STEMP
      INTEGER            I, ITEMP, J, PVT
      LOGICAL            UPPER
*     ..
*     .. External Functions ..
      REAL               SLAMCH
      LOGICAL            LSAME, SISNAN
      EXTERNAL           slamch, lsame, sisnan
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgemv, clacgv, csscal, cswap, xerbla
*     ..
*     .. Intrinsic Functions ..
*     MAXLOC is referenced by the pivot searches below, so it is
*     declared here together with the other intrinsics.
      INTRINSIC          conjg, max, maxloc, real, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters
*
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -4
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPSTF2', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Initialize PIV to the identity permutation
*
      DO 100 i = 1, n
         piv( i ) = i
  100 CONTINUE
*
*     Locate the largest diagonal entry.  It serves both as the
*     first pivot (step J = 1 does not search again) and as the
*     scale for the default stopping value.
*
      DO 110 i = 1, n
         work( i ) = real( a( i, i ) )
  110 CONTINUE
      pvt = maxloc( work( 1:n ), 1 )
      ajj = real( a( pvt, pvt ) )
      IF( ajj.LE.zero.OR.sisnan( ajj ) ) THEN
*
*        No positive diagonal entry (or a NaN): report rank 0
*
         rank = 0
         info = 1
         GO TO 200
      END IF
*
*     Compute stopping value if not supplied
*
      IF( tol.LT.zero ) THEN
         sstop = n * slamch( 'Epsilon' ) * ajj
      ELSE
         sstop = tol
      END IF
*
*     Set first half of WORK to zero, holds dot products
*
      DO 120 i = 1, n
         work( i ) = zero
  120 CONTINUE
*
      IF( upper ) THEN
*
*        Compute the Cholesky factorization P**T * A * P = U**H * U
*
         DO 150 j = 1, n
*
*        Find pivot, test for exit, else swap rows and columns
*        Update dot products, compute possible pivots which are
*        stored in the second half of WORK
*
            DO 130 i = j, n
*
*              Add the squared modulus of the newest row entry
*              A(J-1,I) to the running dot product for column I
*
               IF( j.GT.1 ) THEN
                  work( i ) = work( i ) +
     $                        real( conjg( a( j-1, i ) )*
     $                              a( j-1, i ) )
               END IF
               work( n+i ) = real( a( i, i ) ) - work( i )
*
  130       CONTINUE
*
*           For J = 1 the pivot found before the loop is reused
*
            IF( j.GT.1 ) THEN
               itemp = maxloc( work( (n+j):(2*n) ), 1 )
               pvt = itemp + j - 1
               ajj = work( n+pvt )
               IF( ajj.LE.sstop.OR.sisnan( ajj ) ) THEN
*
*                 Pivot rejected: store its value on the diagonal
*                 and leave through the rank-deficient exit
*
                  a( j, j ) = ajj
                  GO TO 190
               END IF
            END IF
*
            IF( j.NE.pvt ) THEN
*
*              Pivot OK, so can now swap pivot rows and columns
*
*              Move A(J,J) to position PVT, swap the leading J-1
*              entries of columns J and PVT, swap rows J and PVT to
*              the right of column PVT, then exchange (conjugated)
*              the entries lying between the two diagonal positions
*
               a( pvt, pvt ) = a( j, j )
               CALL cswap( j-1, a( 1, j ), 1, a( 1, pvt ), 1 )
               IF( pvt.LT.n )
     $            CALL cswap( n-pvt, a( j, pvt+1 ), lda,
     $                        a( pvt, pvt+1 ), lda )
               DO 140 i = j + 1, pvt - 1
                  ctemp = conjg( a( j, i ) )
                  a( j, i ) = conjg( a( i, pvt ) )
                  a( i, pvt ) = ctemp
  140          CONTINUE
               a( j, pvt ) = conjg( a( j, pvt ) )
*
*              Swap dot products and PIV
*
               stemp = work( j )
               work( j ) = work( pvt )
               work( pvt ) = stemp
               itemp = piv( pvt )
               piv( pvt ) = piv( j )
               piv( j ) = itemp
            END IF
*
*           The diagonal entry of the factor is the square root of
*           the accepted pivot
*
            ajj = sqrt( ajj )
            a( j, j ) = ajj
*
*           Compute elements J+1:N of row J
*
            IF( j.LT.n ) THEN
*
*              Column J is conjugated for the CGEMV call and restored
*              right after it; the row is then scaled by 1/AJJ
*
               CALL clacgv( j-1, a( 1, j ), 1 )
               CALL cgemv( 'Trans', j-1, n-j, -cone, a( 1, j+1 ), lda,
     $                     a( 1, j ), 1, cone, a( j, j+1 ), lda )
               CALL clacgv( j-1, a( 1, j ), 1 )
               CALL csscal( n-j, one / ajj, a( j, j+1 ), lda )
            END IF
*
  150    CONTINUE
*
      ELSE
*
*        Compute the Cholesky factorization P**T * A * P = L * L**H
*
         DO 180 j = 1, n
*
*        Find pivot, test for exit, else swap rows and columns
*        Update dot products, compute possible pivots which are
*        stored in the second half of WORK
*
            DO 160 i = j, n
*
*              Add the squared modulus of the newest column entry
*              A(I,J-1) to the running dot product for row I
*
               IF( j.GT.1 ) THEN
                  work( i ) = work( i ) +
     $                        real( conjg( a( i, j-1 ) )*
     $                              a( i, j-1 ) )
               END IF
               work( n+i ) = real( a( i, i ) ) - work( i )
*
  160       CONTINUE
*
*           For J = 1 the pivot found before the loop is reused
*
            IF( j.GT.1 ) THEN
               itemp = maxloc( work( (n+j):(2*n) ), 1 )
               pvt = itemp + j - 1
               ajj = work( n+pvt )
               IF( ajj.LE.sstop.OR.sisnan( ajj ) ) THEN
*
*                 Pivot rejected: store its value on the diagonal
*                 and leave through the rank-deficient exit
*
                  a( j, j ) = ajj
                  GO TO 190
               END IF
            END IF
*
            IF( j.NE.pvt ) THEN
*
*              Pivot OK, so can now swap pivot rows and columns
*
*              Move A(J,J) to position PVT, swap the leading J-1
*              entries of rows J and PVT, swap columns J and PVT
*              below row PVT, then exchange (conjugated) the entries
*              lying between the two diagonal positions
*
               a( pvt, pvt ) = a( j, j )
               CALL cswap( j-1, a( j, 1 ), lda, a( pvt, 1 ), lda )
               IF( pvt.LT.n )
     $            CALL cswap( n-pvt, a( pvt+1, j ), 1, a( pvt+1, pvt ),
     $                        1 )
               DO 170 i = j + 1, pvt - 1
                  ctemp = conjg( a( i, j ) )
                  a( i, j ) = conjg( a( pvt, i ) )
                  a( pvt, i ) = ctemp
  170          CONTINUE
               a( pvt, j ) = conjg( a( pvt, j ) )
*
*              Swap dot products and PIV
*
               stemp = work( j )
               work( j ) = work( pvt )
               work( pvt ) = stemp
               itemp = piv( pvt )
               piv( pvt ) = piv( j )
               piv( j ) = itemp
            END IF
*
*           The diagonal entry of the factor is the square root of
*           the accepted pivot
*
            ajj = sqrt( ajj )
            a( j, j ) = ajj
*
*           Compute elements J+1:N of column J
*
            IF( j.LT.n ) THEN
*
*              Row J is conjugated for the CGEMV call and restored
*              right after it; the column is then scaled by 1/AJJ
*
               CALL clacgv( j-1, a( j, 1 ), lda )
               CALL cgemv( 'No Trans', n-j, j-1, -cone, a( j+1, 1 ),
     $                     lda, a( j, 1 ), lda, cone, a( j+1, j ), 1 )
               CALL clacgv( j-1, a( j, 1 ), lda )
               CALL csscal( n-j, one / ajj, a( j+1, j ), 1 )
            END IF
*
  180    CONTINUE
*
      END IF
*
*     Ran to completion, A has full rank
*
      rank = n
*
      GO TO 200
  190 CONTINUE
*
*     Rank is number of steps completed.  Set INFO = 1 to signal
*     that the factorization cannot be used to solve a system.
*
      rank = j - 1
      info = 1
*
  200 CONTINUE
      RETURN
*
*     End of CPSTF2
*

◆ cpstrf()

subroutine cpstrf	(	character	uplo,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		integer, dimension( n )	piv,
		integer	rank,
		real	tol,
		real, dimension( 2*n )	work,
		integer	info )

CPSTRF computes the Cholesky factorization with complete pivoting of a complex Hermitian positive semidefinite matrix.

Download CPSTRF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CPSTRF computes the Cholesky factorization with complete
!> pivoting of a complex Hermitian positive semidefinite matrix A.
!>
!> The factorization has the form
!>    P**T * A * P = U**H * U ,  if UPLO = 'U',
!>    P**T * A * P = L  * L**H,  if UPLO = 'L',
!> where U is an upper triangular matrix and L is lower triangular, and
!> P is stored as vector PIV.
!>
!> This algorithm does not attempt to check that A is positive
!> semidefinite. This version of the algorithm calls level 3 BLAS.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the upper or lower triangular part of the !> Hermitian matrix A is stored. !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the Hermitian matrix A. If UPLO = 'U', the leading !> n by n upper triangular part of A contains the upper !> triangular part of the matrix A, and the strictly lower !> triangular part of A is not referenced. If UPLO = 'L', the !> leading n by n lower triangular part of A contains the lower !> triangular part of the matrix A, and the strictly upper !> triangular part of A is not referenced. !> !> On exit, if INFO = 0, the factor U or L from the Cholesky !> factorization as above. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	PIV	!> PIV is INTEGER array, dimension (N) !> PIV is such that the nonzero entries are P( PIV(K), K ) = 1. !>
[out]	RANK	!> RANK is INTEGER !> The rank of A given by the number of steps the algorithm !> completed. !>
[in]	TOL	!> TOL is REAL !> User defined tolerance. If TOL < 0, then N*U*MAX( A(K,K) ) !> will be used, where U = SLAMCH('Epsilon'). The algorithm terminates at the (K-1)st step !> if the pivot <= TOL. !>
[out]	WORK	!> WORK is REAL array, dimension (2*N) !> Work space. !>
[out]	INFO	!> INFO is INTEGER !> < 0: If INFO = -K, the K-th argument had an illegal value, !> = 0: algorithm completed successfully, and !> > 0: the matrix A is either rank deficient with computed rank !> as returned in RANK, or is not positive semidefinite. See !> Section 7 of LAPACK Working Note #161 for further !> information. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 141 of file cpstrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Blocked Cholesky factorization with complete pivoting.  Columns
*     are processed in panels of width up to NB; inside a panel the
*     pivoting and row/column updates are done one step at a time, and
*     after each panel the trailing matrix is updated with CHERK.  If
*     the block size returned by ILAENV is <= 1 or >= N, the whole job
*     is handed to the unblocked routine CPSTF2.
*
*     .. Scalar Arguments ..
      REAL               TOL
      INTEGER            INFO, LDA, N, RANK
      CHARACTER          UPLO
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * )
      REAL               WORK( 2*N )
      INTEGER            PIV( N )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      parameter( one = 1.0e+0, zero = 0.0e+0 )
      COMPLEX            CONE
      parameter( cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      COMPLEX            CTEMP
      REAL               AJJ, SSTOP, STEMP
      INTEGER            I, ITEMP, J, JB, K, NB, PVT
      LOGICAL            UPPER
*     ..
*     .. External Functions ..
      REAL               SLAMCH
      INTEGER            ILAENV
      LOGICAL            LSAME, SISNAN
      EXTERNAL           slamch, ilaenv, lsame, sisnan
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgemv, cherk, clacgv, cpstf2, csscal, cswap,
     $                   xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max, min, real, sqrt, maxloc
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -4
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CPSTRF', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Get block size
*
      nb = ilaenv( 1, 'CPOTRF', uplo, n, -1, -1, -1 )
      IF( nb.LE.1 .OR. nb.GE.n ) THEN
*
*        Use unblocked code
*
*        CPSTF2 sets PIV, RANK and INFO itself, so jump straight to
*        the common exit without touching them here
*
         CALL cpstf2( uplo, n, a( 1, 1 ), lda, piv, rank, tol, work,
     $                info )
         GO TO 230
*
      ELSE
*
*     Initialize PIV
*
         DO 100 i = 1, n
            piv( i ) = i
  100    CONTINUE
*
*     Compute stopping value
*
*     The largest diagonal entry is located here; it is also the
*     pivot used at step J = 1, which does not search again
*
         DO 110 i = 1, n
            work( i ) = real( a( i, i ) )
  110    CONTINUE
         pvt = maxloc( work( 1:n ), 1 )
         ajj = real( a( pvt, pvt ) )
         IF( ajj.LE.zero.OR.sisnan( ajj ) ) THEN
*
*           No positive diagonal entry (or a NaN): report rank 0
*
            rank = 0
            info = 1
            GO TO 230
         END IF
*
*     Compute stopping value if not supplied
*
         IF( tol.LT.zero ) THEN
            sstop = n * slamch( 'Epsilon' ) * ajj
         ELSE
            sstop = tol
         END IF
*
*
         IF( upper ) THEN
*
*           Compute the Cholesky factorization P**T * A * P = U**H * U
*
            DO 160 k = 1, n, nb
*
*              Account for last block not being NB wide
*
               jb = min( nb, n-k+1 )
*
*              Set relevant part of first half of WORK to zero,
*              holds dot products
*
               DO 120 i = k, n
                  work( i ) = 0
  120          CONTINUE
*
               DO 150 j = k, k + jb - 1
*
*              Find pivot, test for exit, else swap rows and columns
*              Update dot products, compute possible pivots which are
*              stored in the second half of WORK
*
                  DO 130 i = j, n
*
*                    Dot products restart at each panel, so only
*                    rows K..J-1 of the current panel contribute
*
                     IF( j.GT.k ) THEN
                        work( i ) = work( i ) +
     $                              real( conjg( a( j-1, i ) )*
     $                                    a( j-1, i ) )
                     END IF
                     work( n+i ) = real( a( i, i ) ) - work( i )
*
  130             CONTINUE
*
*                 For J = 1 the pivot found before the loop is reused
*
                  IF( j.GT.1 ) THEN
                     itemp = maxloc( work( (n+j):(2*n) ), 1 )
                     pvt = itemp + j - 1
                     ajj = work( n+pvt )
                     IF( ajj.LE.sstop.OR.sisnan( ajj ) ) THEN
*
*                       Pivot rejected: store its value on the
*                       diagonal and take the rank-deficient exit
*
                        a( j, j ) = ajj
                        GO TO 220
                     END IF
                  END IF
*
                  IF( j.NE.pvt ) THEN
*
*                    Pivot OK, so can now swap pivot rows and columns
*
*                    Move A(J,J) to position PVT, swap the leading
*                    J-1 entries of columns J and PVT, swap rows J
*                    and PVT to the right of column PVT, then
*                    exchange (conjugated) the entries lying between
*                    the two diagonal positions
*
                     a( pvt, pvt ) = a( j, j )
                     CALL cswap( j-1, a( 1, j ), 1, a( 1, pvt ), 1 )
                     IF( pvt.LT.n )
     $                  CALL cswap( n-pvt, a( j, pvt+1 ), lda,
     $                              a( pvt, pvt+1 ), lda )
                     DO 140 i = j + 1, pvt - 1
                        ctemp = conjg( a( j, i ) )
                        a( j, i ) = conjg( a( i, pvt ) )
                        a( i, pvt ) = ctemp
  140                CONTINUE
                     a( j, pvt ) = conjg( a( j, pvt ) )
*
*                    Swap dot products and PIV
*
                     stemp = work( j )
                     work( j ) = work( pvt )
                     work( pvt ) = stemp
                     itemp = piv( pvt )
                     piv( pvt ) = piv( j )
                     piv( j ) = itemp
                  END IF
*
*                 The diagonal entry of the factor is the square
*                 root of the accepted pivot
*
                  ajj = sqrt( ajj )
                  a( j, j ) = ajj
*
*                 Compute elements J+1:N of row J.
*
                  IF( j.LT.n ) THEN
*
*                    Column J is conjugated for the CGEMV call and
*                    restored right after it.  CGEMV only uses rows
*                    K..J-1 (J-K of them) of the current panel; the
*                    row is then scaled by 1/AJJ
*
                     CALL clacgv( j-1, a( 1, j ), 1 )
                     CALL cgemv( 'Trans', j-k, n-j, -cone, a( k, j+1 ),
     $                           lda, a( k, j ), 1, cone, a( j, j+1 ),
     $                           lda )
                     CALL clacgv( j-1, a( 1, j ), 1 )
                     CALL csscal( n-j, one / ajj, a( j, j+1 ), lda )
                  END IF
*
  150          CONTINUE
*
*              Update trailing matrix, J already incremented
*
*              After normal completion of loop 150, J = K+JB, so
*              A(J,J) is the first entry of the trailing block
*
               IF( k+jb.LE.n ) THEN
                  CALL cherk( 'Upper', 'Conj Trans', n-j+1, jb, -one,
     $                        a( k, j ), lda, one, a( j, j ), lda )
               END IF
*
  160       CONTINUE
*
         ELSE
*
*        Compute the Cholesky factorization P**T * A * P = L * L**H
*
            DO 210 k = 1, n, nb
*
*              Account for last block not being NB wide
*
               jb = min( nb, n-k+1 )
*
*              Set relevant part of first half of WORK to zero,
*              holds dot products
*
               DO 170 i = k, n
                  work( i ) = 0
  170          CONTINUE
*
               DO 200 j = k, k + jb - 1
*
*              Find pivot, test for exit, else swap rows and columns
*              Update dot products, compute possible pivots which are
*              stored in the second half of WORK
*
                  DO 180 i = j, n
*
*                    Dot products restart at each panel, so only
*                    columns K..J-1 of the current panel contribute
*
                     IF( j.GT.k ) THEN
                        work( i ) = work( i ) +
     $                              real( conjg( a( i, j-1 ) )*
     $                                    a( i, j-1 ) )
                     END IF
                     work( n+i ) = real( a( i, i ) ) - work( i )
*
  180             CONTINUE
*
*                 For J = 1 the pivot found before the loop is reused
*
                  IF( j.GT.1 ) THEN
                     itemp = maxloc( work( (n+j):(2*n) ), 1 )
                     pvt = itemp + j - 1
                     ajj = work( n+pvt )
                     IF( ajj.LE.sstop.OR.sisnan( ajj ) ) THEN
*
*                       Pivot rejected: store its value on the
*                       diagonal and take the rank-deficient exit
*
                        a( j, j ) = ajj
                        GO TO 220
                     END IF
                  END IF
*
                  IF( j.NE.pvt ) THEN
*
*                    Pivot OK, so can now swap pivot rows and columns
*
*                    Move A(J,J) to position PVT, swap the leading
*                    J-1 entries of rows J and PVT, swap columns J
*                    and PVT below row PVT, then exchange
*                    (conjugated) the entries lying between the two
*                    diagonal positions
*
                     a( pvt, pvt ) = a( j, j )
                     CALL cswap( j-1, a( j, 1 ), lda, a( pvt, 1 ), lda )
                     IF( pvt.LT.n )
     $                  CALL cswap( n-pvt, a( pvt+1, j ), 1,
     $                              a( pvt+1, pvt ), 1 )
                     DO 190 i = j + 1, pvt - 1
                        ctemp = conjg( a( i, j ) )
                        a( i, j ) = conjg( a( pvt, i ) )
                        a( pvt, i ) = ctemp
  190                CONTINUE
                     a( pvt, j ) = conjg( a( pvt, j ) )
*
*                    Swap dot products and PIV
*
                     stemp = work( j )
                     work( j ) = work( pvt )
                     work( pvt ) = stemp
                     itemp = piv( pvt )
                     piv( pvt ) = piv( j )
                     piv( j ) = itemp
                  END IF
*
*                 The diagonal entry of the factor is the square
*                 root of the accepted pivot
*
                  ajj = sqrt( ajj )
                  a( j, j ) = ajj
*
*                 Compute elements J+1:N of column J.
*
                  IF( j.LT.n ) THEN
*
*                    Row J is conjugated for the CGEMV call and
*                    restored right after it.  CGEMV only uses
*                    columns K..J-1 (J-K of them) of the current
*                    panel; the column is then scaled by 1/AJJ
*
                     CALL clacgv( j-1, a( j, 1 ), lda )
                     CALL cgemv( 'No Trans', n-j, j-k, -cone,
     $                           a( j+1, k ), lda, a( j, k ), lda, cone,
     $                           a( j+1, j ), 1 )
                     CALL clacgv( j-1, a( j, 1 ), lda )
                     CALL csscal( n-j, one / ajj, a( j+1, j ), 1 )
                  END IF
*
  200          CONTINUE
*
*              Update trailing matrix, J already incremented
*
*              After normal completion of loop 200, J = K+JB, so
*              A(J,J) is the first entry of the trailing block
*
               IF( k+jb.LE.n ) THEN
                  CALL cherk( 'Lower', 'No Trans', n-j+1, jb, -one,
     $                        a( j, k ), lda, one, a( j, j ), lda )
               END IF
*
  210       CONTINUE
*
         END IF
      END IF
*
*     Ran to completion, A has full rank
*
      rank = n
*
      GO TO 230
  220 CONTINUE
*
*     Rank is the number of steps completed.  Set INFO = 1 to signal
*     that the factorization cannot be used to solve a system.
*
      rank = j - 1
      info = 1
*
  230 CONTINUE
      RETURN
*
*     End of CPSTRF
*

◆ cspcon()

subroutine cspcon	(	character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		integer, dimension( * )	ipiv,
		real	anorm,
		real	rcond,
		complex, dimension( * )	work,
		integer	info )

CSPCON

Download CSPCON + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CSPCON estimates the reciprocal of the condition number (in the
!> 1-norm) of a complex symmetric packed matrix A using the
!> factorization A = U*D*U**T or A = L*D*L**T computed by CSPTRF.
!>
!> An estimate is obtained for norm(inv(A)), and the reciprocal of the
!> condition number is computed as RCOND = 1 / (ANORM * norm(inv(A))).
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the details of the factorization are stored !> as an upper or lower triangular matrix. !> = 'U': Upper triangular, form is A = U*D*U**T; !> = 'L': Lower triangular, form is A = L*D*L**T. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The block diagonal matrix D and the multipliers used to !> obtain the factor U or L as computed by CSPTRF, stored as a !> packed triangular matrix. !>
[in]	IPIV	!> IPIV is INTEGER array, dimension (N) !> Details of the interchanges and the block structure of D !> as determined by CSPTRF. !>
[in]	ANORM	!> ANORM is REAL !> The 1-norm of the original matrix A. !>
[out]	RCOND	!> RCOND is REAL !> The reciprocal of the condition number of the matrix A, !> computed as RCOND = 1/(ANORM * AINVNM), where AINVNM is an !> estimate of the 1-norm of inv(A) computed in this routine. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 117 of file cspcon.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Estimates RCOND = 1 / ( ANORM * norm1( inv(A) ) ) from the packed
*     factorization held in AP and IPIV.  RCOND is returned as zero
*     when ANORM is zero, when a 1-by-1 diagonal block of D is exactly
*     zero, or when the estimate of norm1( inv(A) ) is zero.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, N
      REAL               ANORM, RCOND
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      COMPLEX            AP( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      parameter( one = 1.0e+0, zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            JCOL, KASE, KDIAG
      REAL               AINVNM
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           clacn2, csptrs, xerbla
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; the first offending one is reported.
*
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( anorm.LT.zero ) THEN
         info = -5
      END IF
      IF( info.LT.0 ) THEN
         CALL xerbla( 'CSPCON', -info )
         RETURN
      END IF
*
*     Trivial cases: an empty matrix has RCOND = 1, a zero norm
*     gives RCOND = 0.
*
      IF( n.EQ.0 ) THEN
         rcond = one
         RETURN
      END IF
      rcond = zero
      IF( anorm.LE.zero ) RETURN
*
*     A zero 1-by-1 diagonal block of D means the factor is singular;
*     RCOND stays at zero in that case.
*
      IF( upper ) THEN
*
*        Upper storage: walk the packed diagonal from the last
*        column back to the first.
*
         kdiag = n*( n+1 ) / 2
         DO jcol = n, 1, -1
            IF( ipiv( jcol ).GT.0 ) THEN
               IF( ap( kdiag ).EQ.zero ) RETURN
            END IF
            kdiag = kdiag - jcol
         END DO
      ELSE
*
*        Lower storage: walk the packed diagonal from the first
*        column to the last.
*
         kdiag = 1
         DO jcol = 1, n
            IF( ipiv( jcol ).GT.0 ) THEN
               IF( ap( kdiag ).EQ.zero ) RETURN
            END IF
            kdiag = kdiag + n - jcol + 1
         END DO
      END IF
*
*     Reverse-communication loop: CLACN2 keeps requesting a solve
*     with the factored matrix until it sets KASE back to zero.
*
      kase = 0
      DO
         CALL clacn2( n, work( n+1 ), work, ainvnm, kase, isave )
         IF( kase.EQ.0 ) EXIT
*
*        Multiply by inv(L*D*L**T) or inv(U*D*U**T).
*
         CALL csptrs( uplo, n, 1, ap, ipiv, work, n, info )
      END DO
*
*     Turn the norm estimate into the reciprocal condition number.
*
      IF( ainvnm.NE.zero ) rcond = ( one / ainvnm ) / anorm
*
      RETURN
*
*     End of CSPCON
*

◆ csprfs()

subroutine csprfs	(	character	uplo,
		integer	n,
		integer	nrhs,
		complex, dimension( * )	ap,
		complex, dimension( * )	afp,
		integer, dimension( * )	ipiv,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldx, * )	x,
		integer	ldx,
		real, dimension( * )	ferr,
		real, dimension( * )	berr,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CSPRFS

Download CSPRFS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CSPRFS improves the computed solution to a system of linear
!> equations when the coefficient matrix is symmetric indefinite
!> and packed, and provides error bounds and backward error estimates
!> for the solution.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrices B and X. NRHS >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The upper or lower triangle of the symmetric matrix A, packed !> columnwise in a linear array. The j-th column of A is stored !> in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2*n-j)/2) = A(i,j) for j<=i<=n. !>
[in]	AFP	!> AFP is COMPLEX array, dimension (N*(N+1)/2) !> The factored form of the matrix A. AFP contains the block !> diagonal matrix D and the multipliers used to obtain the !> factor U or L from the factorization A = U*D*U**T or !> A = L*D*L**T as computed by CSPTRF, stored as a packed !> triangular matrix. !>
[in]	IPIV	!> IPIV is INTEGER array, dimension (N) !> Details of the interchanges and the block structure of D !> as determined by CSPTRF. !>
[in]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> The right hand side matrix B. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[in,out]	X	!> X is COMPLEX array, dimension (LDX,NRHS) !> On entry, the solution matrix X, as computed by CSPTRS. !> On exit, the improved solution matrix X. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the array X. LDX >= max(1,N). !>
[out]	FERR	!> FERR is REAL array, dimension (NRHS) !> The estimated forward error bound for each solution vector !> X(j) (the j-th column of the solution matrix X). !> If XTRUE is the true solution corresponding to X(j), FERR(j) !> is an estimated upper bound for the magnitude of the largest !> element in (X(j) - XTRUE) divided by the magnitude of the !> largest element in X(j). The estimate is as reliable as !> the estimate for RCOND, and is almost always a slight !> overestimate of the true error. !>
[out]	BERR	!> BERR is REAL array, dimension (NRHS) !> The componentwise relative backward error of each solution !> vector X(j) (i.e., the smallest relative change in !> any element of A or B that makes X(j) an exact solution). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Internal Parameters:

!>  ITMAX is the maximum number of steps of iterative refinement.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 178 of file csprfs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDB, LDX, N, NRHS
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      REAL               BERR( * ), FERR( * ), RWORK( * )
      COMPLEX            AFP( * ), AP( * ), B( LDB, * ), WORK( * ),
     $                   X( LDX, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            ITMAX
      parameter( itmax = 5 )
      REAL               ZERO
      parameter( zero = 0.0e+0 )
      COMPLEX            ONE
      parameter( one = ( 1.0e+0, 0.0e+0 ) )
      REAL               TWO
      parameter( two = 2.0e+0 )
      REAL               THREE
      parameter( three = 3.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            COUNT, I, IK, J, K, KASE, KK, NZ
      REAL               EPS, LSTRES, S, SAFE1, SAFE2, SAFMIN, XK
      COMPLEX            ZDUM
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           caxpy, ccopy, clacn2, cspmv, csptrs, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, real
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SLAMCH
      EXTERNAL           lsame, slamch
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
      cabs1( zdum ) = abs( real( zdum ) ) + abs( aimag( zdum ) )
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( nrhs.LT.0 ) THEN
         info = -3
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -8
      ELSE IF( ldx.LT.max( 1, n ) ) THEN
         info = -10
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CSPRFS', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 .OR. nrhs.EQ.0 ) THEN
         DO 10 j = 1, nrhs
            ferr( j ) = zero
            berr( j ) = zero
   10    CONTINUE
         RETURN
      END IF
*
*     NZ = maximum number of nonzero elements in each row of A, plus 1
*
      nz = n + 1
      eps = slamch( 'Epsilon' )
      safmin = slamch( 'Safe minimum' )
      safe1 = nz*safmin
      safe2 = safe1 / eps
*
*     Do for each right hand side
*
      DO 140 j = 1, nrhs
*
         count = 1
         lstres = three
   20    CONTINUE
*
*        Loop until stopping criterion is satisfied.
*
*        Compute residual R = B - A * X
*
         CALL ccopy( n, b( 1, j ), 1, work, 1 )
         CALL cspmv( uplo, n, -one, ap, x( 1, j ), 1, one, work, 1 )
*
*        Compute componentwise relative backward error from formula
*
*        max(i) ( abs(R(i)) / ( abs(A)*abs(X) + abs(B) )(i) )
*
*        where abs(Z) is the componentwise absolute value of the matrix
*        or vector Z.  If the i-th component of the denominator is less
*        than SAFE2, then SAFE1 is added to the i-th components of the
*        numerator and denominator before dividing.
*
         DO 30 i = 1, n
            rwork( i ) = cabs1( b( i, j ) )
   30    CONTINUE
*
*        Compute abs(A)*abs(X) + abs(B).
*
         kk = 1
         IF( upper ) THEN
            DO 50 k = 1, n
               s = zero
               xk = cabs1( x( k, j ) )
               ik = kk
               DO 40 i = 1, k - 1
                  rwork( i ) = rwork( i ) + cabs1( ap( ik ) )*xk
                  s = s + cabs1( ap( ik ) )*cabs1( x( i, j ) )
                  ik = ik + 1
   40          CONTINUE
               rwork( k ) = rwork( k ) + cabs1( ap( kk+k-1 ) )*xk + s
               kk = kk + k
   50       CONTINUE
         ELSE
            DO 70 k = 1, n
               s = zero
               xk = cabs1( x( k, j ) )
               rwork( k ) = rwork( k ) + cabs1( ap( kk ) )*xk
               ik = kk + 1
               DO 60 i = k + 1, n
                  rwork( i ) = rwork( i ) + cabs1( ap( ik ) )*xk
                  s = s + cabs1( ap( ik ) )*cabs1( x( i, j ) )
                  ik = ik + 1
   60          CONTINUE
               rwork( k ) = rwork( k ) + s
               kk = kk + ( n-k+1 )
   70       CONTINUE
         END IF
         s = zero
         DO 80 i = 1, n
            IF( rwork( i ).GT.safe2 ) THEN
               s = max( s, cabs1( work( i ) ) / rwork( i ) )
            ELSE
               s = max( s, ( cabs1( work( i ) )+safe1 ) /
     $             ( rwork( i )+safe1 ) )
            END IF
   80    CONTINUE
         berr( j ) = s
*
*        Test stopping criterion. Continue iterating if
*           1) The residual BERR(J) is larger than machine epsilon, and
*           2) BERR(J) decreased by at least a factor of 2 during the
*              last iteration, and
*           3) At most ITMAX iterations tried.
*
         IF( berr( j ).GT.eps .AND. two*berr( j ).LE.lstres .AND.
     $       count.LE.itmax ) THEN
*
*           Update solution and try again.
*
            CALL csptrs( uplo, n, 1, afp, ipiv, work, n, info )
            CALL caxpy( n, one, work, 1, x( 1, j ), 1 )
            lstres = berr( j )
            count = count + 1
            GO TO 20
         END IF
*
*        Bound error from formula
*
*        norm(X - XTRUE) / norm(X) .le. FERR =
*        norm( abs(inv(A))*
*           ( abs(R) + NZ*EPS*( abs(A)*abs(X)+abs(B) ))) / norm(X)
*
*        where
*          norm(Z) is the magnitude of the largest component of Z
*          inv(A) is the inverse of A
*          abs(Z) is the componentwise absolute value of the matrix or
*             vector Z
*          NZ is the maximum number of nonzeros in any row of A, plus 1
*          EPS is machine epsilon
*
*        The i-th component of abs(R)+NZ*EPS*(abs(A)*abs(X)+abs(B))
*        is incremented by SAFE1 if the i-th component of
*        abs(A)*abs(X) + abs(B) is less than SAFE2.
*
*        Use CLACN2 to estimate the infinity-norm of the matrix
*           inv(A) * diag(W),
*        where W = abs(R) + NZ*EPS*( abs(A)*abs(X)+abs(B) )))
*
         DO 90 i = 1, n
            IF( rwork( i ).GT.safe2 ) THEN
               rwork( i ) = cabs1( work( i ) ) + nz*eps*rwork( i )
            ELSE
               rwork( i ) = cabs1( work( i ) ) + nz*eps*rwork( i ) +
     $                      safe1
            END IF
   90    CONTINUE
*
         kase = 0
  100    CONTINUE
         CALL clacn2( n, work( n+1 ), work, ferr( j ), kase, isave )
         IF( kase.NE.0 ) THEN
            IF( kase.EQ.1 ) THEN
*
*              Multiply by diag(W)*inv(A**T).
*
               CALL csptrs( uplo, n, 1, afp, ipiv, work, n, info )
               DO 110 i = 1, n
                  work( i ) = rwork( i )*work( i )
  110          CONTINUE
            ELSE IF( kase.EQ.2 ) THEN
*
*              Multiply by inv(A)*diag(W).
*
               DO 120 i = 1, n
                  work( i ) = rwork( i )*work( i )
  120          CONTINUE
               CALL csptrs( uplo, n, 1, afp, ipiv, work, n, info )
            END IF
            GO TO 100
         END IF
*
*        Normalize error.
*
         lstres = zero
         DO 130 i = 1, n
            lstres = max( lstres, cabs1( x( i, j ) ) )
  130    CONTINUE
         IF( lstres.NE.zero )
     $      ferr( j ) = ferr( j ) / lstres
*
  140 CONTINUE
*
      RETURN
*
*     End of CSPRFS
*

◆ csptrf()

subroutine csptrf	(	character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		integer, dimension( * )	ipiv,
		integer	info )

CSPTRF

Download CSPTRF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CSPTRF computes the factorization of a complex symmetric matrix A
!> stored in packed format using the Bunch-Kaufman diagonal pivoting
!> method:
!>
!>    A = U*D*U**T  or  A = L*D*L**T
!>
!> where U (or L) is a product of permutation and unit upper (lower)
!> triangular matrices, and D is symmetric and block diagonal with
!> 1-by-1 and 2-by-2 diagonal blocks.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A is stored; !> = 'L': Lower triangle of A is stored. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> On entry, the upper or lower triangle of the symmetric matrix !> A, packed columnwise in a linear array. The j-th column of A !> is stored in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !> !> On exit, the block diagonal matrix D and the multipliers used !> to obtain the factor U or L, stored as a packed triangular !> matrix overwriting A (see below for further details). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (N) !> Details of the interchanges and the block structure of D. !> If IPIV(k) > 0, then rows and columns k and IPIV(k) were !> interchanged and D(k,k) is a 1-by-1 diagonal block. !> If UPLO = 'U' and IPIV(k) = IPIV(k-1) < 0, then rows and !> columns k-1 and -IPIV(k) were interchanged and D(k-1:k,k-1:k) !> is a 2-by-2 diagonal block. If UPLO = 'L' and IPIV(k) = !> IPIV(k+1) < 0, then rows and columns k+1 and -IPIV(k) were !> interchanged and D(k:k+1,k:k+1) is a 2-by-2 diagonal block. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, D(i,i) is exactly zero. The factorization !> has been completed, but the block diagonal matrix D is !> exactly singular, and division by zero will occur if it !> is used to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  5-96 - Based on modifications by J. Lewis, Boeing Computer Services
!>         Company
!>
!>  If UPLO = 'U', then A = U*D*U**T, where
!>     U = P(n)*U(n)* ... *P(k)*U(k)* ...,
!>  i.e., U is a product of terms P(k)*U(k), where k decreases from n to
!>  1 in steps of 1 or 2, and D is a block diagonal matrix with 1-by-1
!>  and 2-by-2 diagonal blocks D(k).  P(k) is a permutation matrix as
!>  defined by IPIV(k), and U(k) is a unit upper triangular matrix, such
!>  that if the diagonal block D(k) is of order s (s = 1 or 2), then
!>
!>             (   I    v    0   )   k-s
!>     U(k) =  (   0    I    0   )   s
!>             (   0    0    I   )   n-k
!>                k-s   s   n-k
!>
!>  If s = 1, D(k) overwrites A(k,k), and v overwrites A(1:k-1,k).
!>  If s = 2, the upper triangle of D(k) overwrites A(k-1,k-1), A(k-1,k),
!>  and A(k,k), and v overwrites A(1:k-2,k-1:k).
!>
!>  If UPLO = 'L', then A = L*D*L**T, where
!>     L = P(1)*L(1)* ... *P(k)*L(k)* ...,
!>  i.e., L is a product of terms P(k)*L(k), where k increases from 1 to
!>  n in steps of 1 or 2, and D is a block diagonal matrix with 1-by-1
!>  and 2-by-2 diagonal blocks D(k).  P(k) is a permutation matrix as
!>  defined by IPIV(k), and L(k) is a unit lower triangular matrix, such
!>  that if the diagonal block D(k) is of order s (s = 1 or 2), then
!>
!>             (   I    0     0   )  k-1
!>     L(k) =  (   0    I     0   )  s
!>             (   0    v     I   )  n-k-s+1
!>                k-1   s  n-k-s+1
!>
!>  If s = 1, D(k) overwrites A(k,k), and v overwrites A(k+1:n,k).
!>  If s = 2, the lower triangle of D(k) overwrites A(k,k), A(k+1,k),
!>  and A(k+1,k+1), and v overwrites A(k+2:n,k:k+1).
!>

Definition at line 157 of file csptrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CSPTRF: after validating UPLO and N, the packed array AP
*     is overwritten in place by the factors of the diagonal pivoting
*     factorization.  IPIV receives the interchange / block-size
*     record and INFO the index of the first column found to be
*     exactly zero (0 if none).
*
*     Packed-index bookkeeping used below:
*       KC  = index in AP of the first stored element of column K
*       KNC = index in AP of the first stored element of column KK,
*             where KK is the column that is swapped with KP
*             (KK = K for a 1-by-1 block, K-1 or K+1 for a 2-by-2)
*       KPC = index in AP of the first stored element of column IMAX
*             (and hence of column KP whenever KP = IMAX)
*       KX  = running index used to walk along a row of the packed
*             triangle
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      COMPLEX            AP( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE
      parameter( zero = 0.0e+0, one = 1.0e+0 )
      REAL               EIGHT, SEVTEN
      parameter( eight = 8.0e+0, sevten = 17.0e+0 )
      COMPLEX            CONE
      parameter( cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            I, IMAX, J, JMAX, K, KC, KK, KNC, KP, KPC,
     $                   KSTEP, KX, NPP
      REAL               ABSAKK, ALPHA, COLMAX, ROWMAX
      COMPLEX            D11, D12, D21, D22, R1, T, WK, WKM1, WKP1, ZDUM
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ICAMAX
      EXTERNAL           lsame, icamax
*     ..
*     .. External Subroutines ..
      EXTERNAL           cscal, cspr, cswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, real, sqrt
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
*
*     CABS1 is the 1-norm style magnitude |Re(z)| + |Im(z)|; it is the
*     only magnitude measure used for pivot selection below.
*
      cabs1( zdum ) = abs( real( zdum ) ) + abs( aimag( zdum ) )
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CSPTRF', -info )
         RETURN
      END IF
*
*     Initialize ALPHA for use in choosing pivot block size.
*     ALPHA = ( 1 + sqrt(17) ) / 8.
*
      alpha = ( one+sqrt( sevten ) ) / eight
*
      IF( upper ) THEN
*
*        Factorize A as U*D*U**T using the upper triangle of A
*
*        K is the main loop index, decreasing from N to 1 in steps of
*        1 or 2
*
*        KC starts at the first element of column N.
*
         k = n
         kc = ( n-1 )*n / 2 + 1
   10    CONTINUE
         knc = kc
*
*        If K < 1, exit from loop
*
         IF( k.LT.1 )
     $      GO TO 110
         kstep = 1
*
*        Determine rows and columns to be interchanged and whether
*        a 1-by-1 or 2-by-2 pivot block will be used
*
         absakk = cabs1( ap( kc+k-1 ) )
*
*        IMAX is the row-index of the largest off-diagonal element in
*        column K, and COLMAX is its absolute value
*
         IF( k.GT.1 ) THEN
            imax = icamax( k-1, ap( kc ), 1 )
            colmax = cabs1( ap( kc+imax-1 ) )
         ELSE
            colmax = zero
         END IF
*
         IF( max( absakk, colmax ).EQ.zero ) THEN
*
*           Column K is zero: set INFO and continue
*           (only the first such column is recorded; KSTEP is still 1,
*           so IPIV(K) = K is stored below and no update is done)
*
            IF( info.EQ.0 )
     $         info = k
            kp = k
         ELSE
            IF( absakk.GE.alpha*colmax ) THEN
*
*              no interchange, use 1-by-1 pivot block
*
               kp = k
            ELSE
*
*              JMAX is the column-index of the largest off-diagonal
*              element in row IMAX, and ROWMAX is its absolute value.
*              The part of row IMAX to the right of the diagonal is
*              scanned element by element (KX steps from A(IMAX,J) to
*              A(IMAX,J+1)); the part to the left is column IMAX of the
*              stored upper triangle and is scanned with ICAMAX.
*
               rowmax = zero
               jmax = imax
               kx = imax*( imax+1 ) / 2 + imax
               DO 20 j = imax + 1, k
                  IF( cabs1( ap( kx ) ).GT.rowmax ) THEN
                     rowmax = cabs1( ap( kx ) )
                     jmax = j
                  END IF
                  kx = kx + j
   20          CONTINUE
               kpc = ( imax-1 )*imax / 2 + 1
               IF( imax.GT.1 ) THEN
                  jmax = icamax( imax-1, ap( kpc ), 1 )
                  rowmax = max( rowmax, cabs1( ap( kpc+jmax-1 ) ) )
               END IF
*
*              The scan of row IMAX above includes A(IMAX,K), whose
*              magnitude is COLMAX, and COLMAX is nonzero in this
*              branch, so ROWMAX is nonzero in the division below.
*
               IF( absakk.GE.alpha*colmax*( colmax / rowmax ) ) THEN
*
*                 no interchange, use 1-by-1 pivot block
*
                  kp = k
               ELSE IF( cabs1( ap( kpc+imax-1 ) ).GE.alpha*rowmax ) THEN
*
*                 interchange rows and columns K and IMAX, use 1-by-1
*                 pivot block
*
                  kp = imax
               ELSE
*
*                 interchange rows and columns K-1 and IMAX, use 2-by-2
*                 pivot block
*
                  kp = imax
                  kstep = 2
               END IF
            END IF
*
*           KK is the column that takes part in the interchange; for a
*           2-by-2 block it is K-1, and KNC is moved back to the start
*           of that column.
*
            kk = k - kstep + 1
            IF( kstep.EQ.2 )
     $         knc = knc - k + 1
            IF( kp.NE.kk ) THEN
*
*              Interchange rows and columns KK and KP in the leading
*              submatrix A(1:k,1:k)
*
               CALL cswap( kp-1, ap( knc ), 1, ap( kpc ), 1 )
               kx = kpc + kp - 1
               DO 30 j = kp + 1, kk - 1
                  kx = kx + j - 1
                  t = ap( knc+j-1 )
                  ap( knc+j-1 ) = ap( kx )
                  ap( kx ) = t
   30          CONTINUE
               t = ap( knc+kk-1 )
               ap( knc+kk-1 ) = ap( kpc+kp-1 )
               ap( kpc+kp-1 ) = t
               IF( kstep.EQ.2 ) THEN
*
*                 Also swap A(K-1,K) with A(KP,K) in column K.
*
                  t = ap( kc+k-2 )
                  ap( kc+k-2 ) = ap( kc+kp-1 )
                  ap( kc+kp-1 ) = t
               END IF
            END IF
*
*           Update the leading submatrix
*
            IF( kstep.EQ.1 ) THEN
*
*              1-by-1 pivot block D(k): column k now holds
*
*              W(k) = U(k)*D(k)
*
*              where U(k) is the k-th column of U
*
*              Perform a rank-1 update of A(1:k-1,1:k-1) as
*
*              A := A - U(k)*D(k)*U(k)**T = A - W(k)*1/D(k)*W(k)**T
*
               r1 = cone / ap( kc+k-1 )
               CALL cspr( uplo, k-1, -r1, ap( kc ), 1, ap )
*
*              Store U(k) in column k
*
               CALL cscal( k-1, r1, ap( kc ), 1 )
            ELSE
*
*              2-by-2 pivot block D(k): columns k and k-1 now hold
*
*              ( W(k-1) W(k) ) = ( U(k-1) U(k) )*D(k)
*
*              where U(k) and U(k-1) are the k-th and (k-1)-th columns
*              of U
*
*              Perform a rank-2 update of A(1:k-2,1:k-2) as
*
*              A := A - ( U(k-1) U(k) )*D(k)*( U(k-1) U(k) )**T
*                 = A - ( W(k-1) W(k) )*inv(D(k))*( W(k-1) W(k) )**T
*
*              When K = 2 there is no leading submatrix left, so the
*              update is skipped.
*
               IF( k.GT.2 ) THEN
*
*                 D12 is the off-diagonal entry of the block; D11 and
*                 D22 are formed from the diagonal entries divided by
*                 D12, and D12 is then overwritten by the common
*                 factor T / D12 used for WKM1 and WK.
*
                  d12 = ap( k-1+( k-1 )*k / 2 )
                  d22 = ap( k-1+( k-2 )*( k-1 ) / 2 ) / d12
                  d11 = ap( k+( k-1 )*k / 2 ) / d12
                  t = cone / ( d11*d22-cone )
                  d12 = t / d12
*
                  DO 50 j = k - 2, 1, -1
                     wkm1 = d12*( d11*ap( j+( k-2 )*( k-1 ) / 2 )-
     $                      ap( j+( k-1 )*k / 2 ) )
                     wk = d12*( d22*ap( j+( k-1 )*k / 2 )-
     $                    ap( j+( k-2 )*( k-1 ) / 2 ) )
                     DO 40 i = j, 1, -1
                        ap( i+( j-1 )*j / 2 ) = ap( i+( j-1 )*j / 2 ) -
     $                     ap( i+( k-1 )*k / 2 )*wk -
     $                     ap( i+( k-2 )*( k-1 ) / 2 )*wkm1
   40                CONTINUE
                     ap( j+( k-1 )*k / 2 ) = wk
                     ap( j+( k-2 )*( k-1 ) / 2 ) = wkm1
   50             CONTINUE
*
               END IF
            END IF
         END IF
*
*        Store details of the interchanges in IPIV
*        (a 2-by-2 block is flagged by storing -KP in both entries)
*
         IF( kstep.EQ.1 ) THEN
            ipiv( k ) = kp
         ELSE
            ipiv( k ) = -kp
            ipiv( k-1 ) = -kp
         END IF
*
*        Decrease K and return to the start of the main loop
*        (KC is moved to the start of the new column K)
*
         k = k - kstep
         kc = knc - k
         GO TO 10
*
      ELSE
*
*        Factorize A as L*D*L**T using the lower triangle of A
*
*        K is the main loop index, increasing from 1 to N in steps of
*        1 or 2
*
*        NPP is the total number of stored elements, N*(N+1)/2.
*
         k = 1
         kc = 1
         npp = n*( n+1 ) / 2
   60    CONTINUE
         knc = kc
*
*        If K > N, exit from loop
*
         IF( k.GT.n )
     $      GO TO 110
         kstep = 1
*
*        Determine rows and columns to be interchanged and whether
*        a 1-by-1 or 2-by-2 pivot block will be used
*
         absakk = cabs1( ap( kc ) )
*
*        IMAX is the row-index of the largest off-diagonal element in
*        column K, and COLMAX is its absolute value
*
         IF( k.LT.n ) THEN
            imax = k + icamax( n-k, ap( kc+1 ), 1 )
            colmax = cabs1( ap( kc+imax-k ) )
         ELSE
            colmax = zero
         END IF
*
         IF( max( absakk, colmax ).EQ.zero ) THEN
*
*           Column K is zero: set INFO and continue
*           (only the first such column is recorded; KSTEP is still 1,
*           so IPIV(K) = K is stored below and no update is done)
*
            IF( info.EQ.0 )
     $         info = k
            kp = k
         ELSE
            IF( absakk.GE.alpha*colmax ) THEN
*
*              no interchange, use 1-by-1 pivot block
*
               kp = k
            ELSE
*
*              JMAX is the column-index of the largest off-diagonal
*              element in row IMAX, and ROWMAX is its absolute value
*
               rowmax = zero
               kx = kc + imax - k
               DO 70 j = k, imax - 1
                  IF( cabs1( ap( kx ) ).GT.rowmax ) THEN
                     rowmax = cabs1( ap( kx ) )
                     jmax = j
                  END IF
                  kx = kx + n - j
   70          CONTINUE
               kpc = npp - ( n-imax+1 )*( n-imax+2 ) / 2 + 1
               IF( imax.LT.n ) THEN
                  jmax = imax + icamax( n-imax, ap( kpc+1 ), 1 )
                  rowmax = max( rowmax, cabs1( ap( kpc+jmax-imax ) ) )
               END IF
*
*              The scan of row IMAX above starts at A(IMAX,K), whose
*              magnitude is COLMAX, and COLMAX is nonzero in this
*              branch, so ROWMAX is nonzero in the division below.
*
               IF( absakk.GE.alpha*colmax*( colmax / rowmax ) ) THEN
*
*                 no interchange, use 1-by-1 pivot block
*
                  kp = k
               ELSE IF( cabs1( ap( kpc ) ).GE.alpha*rowmax ) THEN
*
*                 interchange rows and columns K and IMAX, use 1-by-1
*                 pivot block
*
                  kp = imax
               ELSE
*
*                 interchange rows and columns K+1 and IMAX, use 2-by-2
*                 pivot block
*
                  kp = imax
                  kstep = 2
               END IF
            END IF
*
*           KK is the column that takes part in the interchange; for a
*           2-by-2 block it is K+1, and KNC is advanced to the start
*           of that column.
*
            kk = k + kstep - 1
            IF( kstep.EQ.2 )
     $         knc = knc + n - k + 1
            IF( kp.NE.kk ) THEN
*
*              Interchange rows and columns KK and KP in the trailing
*              submatrix A(k:n,k:n)
*
               IF( kp.LT.n )
     $            CALL cswap( n-kp, ap( knc+kp-kk+1 ), 1, ap( kpc+1 ),
     $                        1 )
               kx = knc + kp - kk
               DO 80 j = kk + 1, kp - 1
                  kx = kx + n - j + 1
                  t = ap( knc+j-kk )
                  ap( knc+j-kk ) = ap( kx )
                  ap( kx ) = t
   80          CONTINUE
               t = ap( knc )
               ap( knc ) = ap( kpc )
               ap( kpc ) = t
               IF( kstep.EQ.2 ) THEN
*
*                 Also swap A(K+1,K) with A(KP,K) in column K.
*
                  t = ap( kc+1 )
                  ap( kc+1 ) = ap( kc+kp-k )
                  ap( kc+kp-k ) = t
               END IF
            END IF
*
*           Update the trailing submatrix
*
            IF( kstep.EQ.1 ) THEN
*
*              1-by-1 pivot block D(k): column k now holds
*
*              W(k) = L(k)*D(k)
*
*              where L(k) is the k-th column of L
*
               IF( k.LT.n ) THEN
*
*                 Perform a rank-1 update of A(k+1:n,k+1:n) as
*
*                 A := A - L(k)*D(k)*L(k)**T = A - W(k)*(1/D(k))*W(k)**T
*
                  r1 = cone / ap( kc )
                  CALL cspr( uplo, n-k, -r1, ap( kc+1 ), 1,
     $                       ap( kc+n-k+1 ) )
*
*                 Store L(k) in column K
*
                  CALL cscal( n-k, r1, ap( kc+1 ), 1 )
               END IF
            ELSE
*
*              2-by-2 pivot block D(k): columns K and K+1 now hold
*
*              ( W(k) W(k+1) ) = ( L(k) L(k+1) )*D(k)
*
*              where L(k) and L(k+1) are the k-th and (k+1)-th columns
*              of L
*
               IF( k.LT.n-1 ) THEN
*
*                 Perform a rank-2 update of A(k+2:n,k+2:n) as
*
*                 A := A - ( L(k) L(k+1) )*D(k)*( L(k) L(k+1) )**T
*                    = A - ( W(k) W(k+1) )*inv(D(k))*( W(k) W(k+1) )**T
*
*                 where L(k) and L(k+1) are the k-th and (k+1)-th
*                 columns of L
*
*                 D21 is the off-diagonal entry of the block; D11 and
*                 D22 are formed from the diagonal entries divided by
*                 D21, and D21 is then overwritten by the common
*                 factor T / D21 used for WK and WKP1.
*
                  d21 = ap( k+1+( k-1 )*( 2*n-k ) / 2 )
                  d11 = ap( k+1+k*( 2*n-k-1 ) / 2 ) / d21
                  d22 = ap( k+( k-1 )*( 2*n-k ) / 2 ) / d21
                  t = cone / ( d11*d22-cone )
                  d21 = t / d21
*
                  DO 100 j = k + 2, n
                     wk = d21*( d11*ap( j+( k-1 )*( 2*n-k ) / 2 )-
     $                    ap( j+k*( 2*n-k-1 ) / 2 ) )
                     wkp1 = d21*( d22*ap( j+k*( 2*n-k-1 ) / 2 )-
     $                      ap( j+( k-1 )*( 2*n-k ) / 2 ) )
                     DO 90 i = j, n
                        ap( i+( j-1 )*( 2*n-j ) / 2 ) = ap( i+( j-1 )*
     $                     ( 2*n-j ) / 2 ) - ap( i+( k-1 )*( 2*n-k ) /
     $                     2 )*wk - ap( i+k*( 2*n-k-1 ) / 2 )*wkp1
   90                CONTINUE
                     ap( j+( k-1 )*( 2*n-k ) / 2 ) = wk
                     ap( j+k*( 2*n-k-1 ) / 2 ) = wkp1
  100             CONTINUE
               END IF
            END IF
         END IF
*
*        Store details of the interchanges in IPIV
*        (a 2-by-2 block is flagged by storing -KP in both entries)
*
         IF( kstep.EQ.1 ) THEN
            ipiv( k ) = kp
         ELSE
            ipiv( k ) = -kp
            ipiv( k+1 ) = -kp
         END IF
*
*        Increase K and return to the start of the main loop
*        (KC is moved to the start of the new column K)
*
         k = k + kstep
         kc = knc + n - k + 2
         GO TO 60
*
      END IF
*
*     Common exit point for both the upper and the lower loop.
*
  110 CONTINUE
      RETURN
*
*     End of CSPTRF
*

◆ csptri()

subroutine csptri	(	character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		integer, dimension( * )	ipiv,
		complex, dimension( * )	work,
		integer	info )

CSPTRI

Download CSPTRI + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CSPTRI computes the inverse of a complex symmetric indefinite matrix
!> A in packed storage using the factorization A = U*D*U**T or
!> A = L*D*L**T computed by CSPTRF.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the details of the factorization are stored !> as an upper or lower triangular matrix. !> = 'U': Upper triangular, form is A = U*D*U**T; !> = 'L': Lower triangular, form is A = L*D*L**T. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> On entry, the block diagonal matrix D and the multipliers !> used to obtain the factor U or L as computed by CSPTRF, !> stored as a packed triangular matrix. !> !> On exit, if INFO = 0, the (symmetric) inverse of the original !> matrix, stored as a packed triangular matrix. The j-th column !> of inv(A) is stored in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = inv(A)(i,j) for 1<=i<=j; !> if UPLO = 'L', !> AP(i + (j-1)*(2n-j)/2) = inv(A)(i,j) for j<=i<=n. !>
[in]	IPIV	!> IPIV is INTEGER array, dimension (N) !> Details of the interchanges and the block structure of D !> as determined by CSPTRF. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, D(i,i) = 0; the matrix is singular and its !> inverse could not be computed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 108 of file csptri.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CSPTRI: after validating UPLO and N, the packed factors
*     in AP are overwritten, block column by block column, with the
*     packed inverse.  WORK is used as a scratch vector for one column
*     at a time.  INFO is set to the index of the first zero 1-by-1
*     diagonal block encountered, in which case nothing is modified.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      COMPLEX            AP( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE, ZERO
      parameter( one = ( 1.0e+0, 0.0e+0 ),
     $                   zero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            J, K, KC, KCNEXT, KP, KPC, KSTEP, KX, NPP
      COMPLEX            AK, AKKP1, AKP1, D, T, TEMP
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      COMPLEX            CDOTU
      EXTERNAL           lsame, cdotu
*     ..
*     .. External Subroutines ..
      EXTERNAL           ccopy, cspmv, cswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CSPTRI', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Check that the diagonal matrix D is nonsingular.
*
*     INFO itself is the loop index, so the early RETURN leaves INFO
*     equal to the index of the zero diagonal entry.  Only 1-by-1
*     blocks (IPIV > 0) are tested.  KP walks along the diagonal
*     positions of the packed array.
*
      IF( upper ) THEN
*
*        Upper triangular storage: examine D from bottom to top
*
         kp = n*( n+1 ) / 2
         DO 10 info = n, 1, -1
            IF( ipiv( info ).GT.0 .AND. ap( kp ).EQ.zero )
     $         RETURN
            kp = kp - info
   10    CONTINUE
      ELSE
*
*        Lower triangular storage: examine D from top to bottom.
*
         kp = 1
         DO 20 info = 1, n
            IF( ipiv( info ).GT.0 .AND. ap( kp ).EQ.zero )
     $         RETURN
            kp = kp + n - info + 1
   20    CONTINUE
      END IF
*
*     No zero 1-by-1 block was found: reset INFO after its use as a
*     loop index.
*
      info = 0
*
      IF( upper ) THEN
*
*        Compute inv(A) from the factorization A = U*D*U**T.
*
*        K is the main loop index, increasing from 1 to N in steps of
*        1 or 2, depending on the size of the diagonal blocks.
*
*        KC is the index in AP of the first element of column K and
*        KCNEXT that of the column following the current block.
*
         k = 1
         kc = 1
   30    CONTINUE
*
*        If K > N, exit from loop.
*
         IF( k.GT.n )
     $      GO TO 50
*
         kcnext = kc + k
         IF( ipiv( k ).GT.0 ) THEN
*
*           1 x 1 diagonal block
*
*           Invert the diagonal block.
*
            ap( kc+k-1 ) = one / ap( kc+k-1 )
*
*           Compute column K of the inverse.
*
            IF( k.GT.1 ) THEN
               CALL ccopy( k-1, ap( kc ), 1, work, 1 )
               CALL cspmv( uplo, k-1, -one, ap, work, 1, zero, ap( kc ),
     $                     1 )
               ap( kc+k-1 ) = ap( kc+k-1 ) -
     $                        cdotu( k-1, work, 1, ap( kc ), 1 )
            END IF
            kstep = 1
         ELSE
*
*           2 x 2 diagonal block
*
*           Invert the diagonal block.
*
*           T is the off-diagonal entry A(K,K+1) of the block; the
*           block entries are divided by T before the determinant-like
*           quantity D is formed.
*
            t = ap( kcnext+k-1 )
            ak = ap( kc+k-1 ) / t
            akp1 = ap( kcnext+k ) / t
            akkp1 = ap( kcnext+k-1 ) / t
            d = t*( ak*akp1-one )
            ap( kc+k-1 ) = akp1 / d
            ap( kcnext+k ) = ak / d
            ap( kcnext+k-1 ) = -akkp1 / d
*
*           Compute columns K and K+1 of the inverse.
*
            IF( k.GT.1 ) THEN
               CALL ccopy( k-1, ap( kc ), 1, work, 1 )
               CALL cspmv( uplo, k-1, -one, ap, work, 1, zero, ap( kc ),
     $                     1 )
               ap( kc+k-1 ) = ap( kc+k-1 ) -
     $                        cdotu( k-1, work, 1, ap( kc ), 1 )
               ap( kcnext+k-1 ) = ap( kcnext+k-1 ) -
     $                            cdotu( k-1, ap( kc ), 1, ap( kcnext ),
     $                            1 )
               CALL ccopy( k-1, ap( kcnext ), 1, work, 1 )
               CALL cspmv( uplo, k-1, -one, ap, work, 1, zero,
     $                     ap( kcnext ), 1 )
               ap( kcnext+k ) = ap( kcnext+k ) -
     $                          cdotu( k-1, work, 1, ap( kcnext ), 1 )
            END IF
            kstep = 2
*
*           Skip over column K+1 as well.
*
            kcnext = kcnext + k + 1
         END IF
*
         kp = abs( ipiv( k ) )
         IF( kp.NE.k ) THEN
*
*           Interchange rows and columns K and KP in the leading
*           submatrix A(1:k+1,1:k+1)
*
            kpc = ( kp-1 )*kp / 2 + 1
            CALL cswap( kp-1, ap( kc ), 1, ap( kpc ), 1 )
            kx = kpc + kp - 1
            DO 40 j = kp + 1, k - 1
               kx = kx + j - 1
               temp = ap( kc+j-1 )
               ap( kc+j-1 ) = ap( kx )
               ap( kx ) = temp
   40       CONTINUE
            temp = ap( kc+k-1 )
            ap( kc+k-1 ) = ap( kpc+kp-1 )
            ap( kpc+kp-1 ) = temp
            IF( kstep.EQ.2 ) THEN
*
*              Also swap entries K and KP of column K+1.
*
               temp = ap( kc+k+k-1 )
               ap( kc+k+k-1 ) = ap( kc+k+kp-1 )
               ap( kc+k+kp-1 ) = temp
            END IF
         END IF
*
         k = k + kstep
         kc = kcnext
         GO TO 30
   50    CONTINUE
*
      ELSE
*
*        Compute inv(A) from the factorization A = L*D*L**T.
*
*        K is the main loop index, decreasing from N to 1 in steps of
*        1 or 2, depending on the size of the diagonal blocks.
*
*        Here KC is the index in AP of the diagonal element A(K,K)
*        (the first stored element of column K), starting at the last
*        element of the packed array, and KCNEXT is the corresponding
*        index for the column preceding the current block.
*
         npp = n*( n+1 ) / 2
         k = n
         kc = npp
   60    CONTINUE
*
*        If K < 1, exit from loop.
*
         IF( k.LT.1 )
     $      GO TO 80
*
         kcnext = kc - ( n-k+2 )
         IF( ipiv( k ).GT.0 ) THEN
*
*           1 x 1 diagonal block
*
*           Invert the diagonal block.
*
            ap( kc ) = one / ap( kc )
*
*           Compute column K of the inverse.
*
            IF( k.LT.n ) THEN
               CALL ccopy( n-k, ap( kc+1 ), 1, work, 1 )
               CALL cspmv( uplo, n-k, -one, ap( kc+n-k+1 ), work, 1,
     $                     zero, ap( kc+1 ), 1 )
               ap( kc ) = ap( kc ) - cdotu( n-k, work, 1, ap( kc+1 ),
     $                    1 )
            END IF
            kstep = 1
         ELSE
*
*           2 x 2 diagonal block
*
*           Invert the diagonal block.
*
*           T is the off-diagonal entry A(K,K-1) of the block; the
*           block entries are divided by T before the determinant-like
*           quantity D is formed.
*
            t = ap( kcnext+1 )
            ak = ap( kcnext ) / t
            akp1 = ap( kc ) / t
            akkp1 = ap( kcnext+1 ) / t
            d = t*( ak*akp1-one )
            ap( kcnext ) = akp1 / d
            ap( kc ) = ak / d
            ap( kcnext+1 ) = -akkp1 / d
*
*           Compute columns K-1 and K of the inverse.
*
            IF( k.LT.n ) THEN
               CALL ccopy( n-k, ap( kc+1 ), 1, work, 1 )
               CALL cspmv( uplo, n-k, -one, ap( kc+( n-k+1 ) ), work, 1,
     $                     zero, ap( kc+1 ), 1 )
               ap( kc ) = ap( kc ) - cdotu( n-k, work, 1, ap( kc+1 ),
     $                    1 )
               ap( kcnext+1 ) = ap( kcnext+1 ) -
     $                          cdotu( n-k, ap( kc+1 ), 1,
     $                          ap( kcnext+2 ), 1 )
               CALL ccopy( n-k, ap( kcnext+2 ), 1, work, 1 )
               CALL cspmv( uplo, n-k, -one, ap( kc+( n-k+1 ) ), work, 1,
     $                     zero, ap( kcnext+2 ), 1 )
               ap( kcnext ) = ap( kcnext ) -
     $                        cdotu( n-k, work, 1, ap( kcnext+2 ), 1 )
            END IF
            kstep = 2
*
*           Skip over column K-1 as well.
*
            kcnext = kcnext - ( n-k+3 )
         END IF
*
         kp = abs( ipiv( k ) )
         IF( kp.NE.k ) THEN
*
*           Interchange rows and columns K and KP in the trailing
*           submatrix A(k-1:n,k-1:n)
*
            kpc = npp - ( n-kp+1 )*( n-kp+2 ) / 2 + 1
            IF( kp.LT.n )
     $         CALL cswap( n-kp, ap( kc+kp-k+1 ), 1, ap( kpc+1 ), 1 )
            kx = kc + kp - k
            DO 70 j = k + 1, kp - 1
               kx = kx + n - j + 1
               temp = ap( kc+j-k )
               ap( kc+j-k ) = ap( kx )
               ap( kx ) = temp
   70       CONTINUE
            temp = ap( kc )
            ap( kc ) = ap( kpc )
            ap( kpc ) = temp
            IF( kstep.EQ.2 ) THEN
*
*              Also swap entries K and KP of column K-1.
*
               temp = ap( kc-n+k-1 )
               ap( kc-n+k-1 ) = ap( kc-n+kp-1 )
               ap( kc-n+kp-1 ) = temp
            END IF
         END IF
*
         k = k - kstep
         kc = kcnext
         GO TO 60
   80    CONTINUE
      END IF
*
      RETURN
*
*     End of CSPTRI
*

◆ csptrs()

subroutine csptrs	(	character	uplo,
		integer	n,
		integer	nrhs,
		complex, dimension( * )	ap,
		integer, dimension( * )	ipiv,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		integer	info )

CSPTRS

Download CSPTRS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CSPTRS solves a system of linear equations A*X = B with a complex
!> symmetric matrix A stored in packed format using the factorization
!> A = U*D*U**T or A = L*D*L**T computed by CSPTRF.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the details of the factorization are stored !> as an upper or lower triangular matrix. !> = 'U': Upper triangular, form is A = U*D*U**T; !> = 'L': Lower triangular, form is A = L*D*L**T. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrix B. NRHS >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The block diagonal matrix D and the multipliers used to !> obtain the factor U or L as computed by CSPTRF, stored as a !> packed triangular matrix. !>
[in]	IPIV	!> IPIV is INTEGER array, dimension (N) !> Details of the interchanges and the block structure of D !> as determined by CSPTRF. !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> On entry, the right hand side matrix B. !> On exit, the solution matrix X. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 114 of file csptrs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
!     Overview of the CSPTRS body below:
!       1. Validate UPLO, N, NRHS and LDB; the first bad argument is
!          reported through XERBLA and INFO is set to -1, -2, -3 or -7.
!       2. Return immediately when N = 0 or NRHS = 0.
!       3. Overwrite B in two sweeps over the packed factor AP. Each
!          sweep advances K by 1 when IPIV(K) > 0 (1 x 1 block) and by
!          2 otherwise (2 x 2 block), and keeps KC pointing at the
!          start of the packed column currently being processed.
!
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDB, N, NRHS
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      COMPLEX            AP( * ), B( LDB, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE
      parameter( one = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            J, K, KC, KP
      COMPLEX            AK, AKM1, AKM1K, BK, BKM1, DENOM
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgemv, cgeru, cscal, cswap, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
!     Argument checks. The INFO values are the (negated) positions of
!     UPLO, N, NRHS and LDB in the argument list.
      info = 0
      upper = lsame( uplo, 'U' )
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( nrhs.LT.0 ) THEN
         info = -3
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -7
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CSPTRS', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 .OR. nrhs.EQ.0 )
     $   RETURN
*
      IF( upper ) THEN
*
*        Solve A*X = B, where A = U*D*U**T.
*
*        First solve U*D*X = B, overwriting B with X.
*
*        K is the main loop index, decreasing from N to 1 in steps of
*        1 or 2, depending on the size of the diagonal blocks.
*
!        KC starts one past the last packed element; the subtraction of
!        K at the top of each pass then makes AP(KC) the first stored
!        element of column K and AP(KC+K-1) its diagonal entry.
         k = n
         kc = n*( n+1 ) / 2 + 1
   10    CONTINUE
*
*        If K < 1, exit from loop.
*
         IF( k.LT.1 )
     $      GO TO 30
*
         kc = kc - k
         IF( ipiv( k ).GT.0 ) THEN
*
*           1 x 1 diagonal block
*
*           Interchange rows K and IPIV(K).
*
            kp = ipiv( k )
            IF( kp.NE.k )
     $         CALL cswap( nrhs, b( k, 1 ), ldb, b( kp, 1 ), ldb )
*
*           Multiply by inv(U(K)), where U(K) is the transformation
*           stored in column K of A.
*
            CALL cgeru( k-1, nrhs, -one, ap( kc ), 1, b( k, 1 ), ldb,
     $                  b( 1, 1 ), ldb )
*
*           Multiply by the inverse of the diagonal block.
*
            CALL cscal( nrhs, one / ap( kc+k-1 ), b( k, 1 ), ldb )
            k = k - 1
         ELSE
*
*           2 x 2 diagonal block
*
*           Interchange rows K-1 and -IPIV(K).
*
            kp = -ipiv( k )
            IF( kp.NE.k-1 )
     $         CALL cswap( nrhs, b( k-1, 1 ), ldb, b( kp, 1 ), ldb )
*
*           Multiply by inv(U(K)), where U(K) is the transformation
*           stored in columns K-1 and K of A.
*
            CALL cgeru( k-2, nrhs, -one, ap( kc ), 1, b( k, 1 ), ldb,
     $                  b( 1, 1 ), ldb )
            CALL cgeru( k-2, nrhs, -one, ap( kc-( k-1 ) ), 1,
     $                  b( k-1, 1 ), ldb, b( 1, 1 ), ldb )
*
*           Multiply by the inverse of the diagonal block.
*
!           AP(KC+K-2) is the off-diagonal entry of the block. The two
!           diagonal entries and both right-hand-side rows are divided
!           by it first, which is why DENOM has the form AKM1*AK - ONE.
            akm1k = ap( kc+k-2 )
            akm1 = ap( kc-1 ) / akm1k
            ak = ap( kc+k-1 ) / akm1k
            denom = akm1*ak - one
            DO 20 j = 1, nrhs
               bkm1 = b( k-1, j ) / akm1k
               bk = b( k, j ) / akm1k
               b( k-1, j ) = ( ak*bkm1-bk ) / denom
               b( k, j ) = ( akm1*bk-bkm1 ) / denom
   20       CONTINUE
!           Extra step back over column K-1, which was consumed together
!           with column K in this pass.
            kc = kc - k + 1
            k = k - 2
         END IF
*
         GO TO 10
   30    CONTINUE
*
*        Next solve U**T*X = B, overwriting B with X.
*
*        K is the main loop index, increasing from 1 to N in steps of
*        1 or 2, depending on the size of the diagonal blocks.
*
         k = 1
         kc = 1
   40    CONTINUE
*
*        If K > N, exit from loop.
*
         IF( k.GT.n )
     $      GO TO 50
*
         IF( ipiv( k ).GT.0 ) THEN
*
*           1 x 1 diagonal block
*
*           Multiply by inv(U**T(K)), where U(K) is the transformation
*           stored in column K of A.
*
            CALL cgemv( 'Transpose', k-1, nrhs, -one, b, ldb, ap( kc ),
     $                  1, one, b( k, 1 ), ldb )
*
*           Interchange rows K and IPIV(K).
*
            kp = ipiv( k )
            IF( kp.NE.k )
     $         CALL cswap( nrhs, b( k, 1 ), ldb, b( kp, 1 ), ldb )
            kc = kc + k
            k = k + 1
         ELSE
*
*           2 x 2 diagonal block
*
*           Multiply by inv(U**T(K+1)), where U(K+1) is the transformation
*           stored in columns K and K+1 of A.
*
            CALL cgemv( 'Transpose', k-1, nrhs, -one, b, ldb, ap( kc ),
     $                  1, one, b( k, 1 ), ldb )
            CALL cgemv( 'Transpose', k-1, nrhs, -one, b, ldb,
     $                  ap( kc+k ), 1, one, b( k+1, 1 ), ldb )
*
*           Interchange rows K and -IPIV(K).
*
            kp = -ipiv( k )
            IF( kp.NE.k )
     $         CALL cswap( nrhs, b( k, 1 ), ldb, b( kp, 1 ), ldb )
!           Skip columns K (K entries) and K+1 (K+1 entries).
            kc = kc + 2*k + 1
            k = k + 2
         END IF
*
         GO TO 40
   50    CONTINUE
*
      ELSE
*
*        Solve A*X = B, where A = L*D*L**T.
*
*        First solve L*D*X = B, overwriting B with X.
*
*        K is the main loop index, increasing from 1 to N in steps of
*        1 or 2, depending on the size of the diagonal blocks.
*
!        In this branch AP(KC) is the diagonal entry of column K and
!        AP(KC+1) the first entry below it; column K holds N-K+1 entries.
         k = 1
         kc = 1
   60    CONTINUE
*
*        If K > N, exit from loop.
*
         IF( k.GT.n )
     $      GO TO 80
*
         IF( ipiv( k ).GT.0 ) THEN
*
*           1 x 1 diagonal block
*
*           Interchange rows K and IPIV(K).
*
            kp = ipiv( k )
            IF( kp.NE.k )
     $         CALL cswap( nrhs, b( k, 1 ), ldb, b( kp, 1 ), ldb )
*
*           Multiply by inv(L(K)), where L(K) is the transformation
*           stored in column K of A.
*
            IF( k.LT.n )
     $         CALL cgeru( n-k, nrhs, -one, ap( kc+1 ), 1, b( k, 1 ),
     $                     ldb, b( k+1, 1 ), ldb )
*
*           Multiply by the inverse of the diagonal block.
*
            CALL cscal( nrhs, one / ap( kc ), b( k, 1 ), ldb )
            kc = kc + n - k + 1
            k = k + 1
         ELSE
*
*           2 x 2 diagonal block
*
*           Interchange rows K+1 and -IPIV(K).
*
            kp = -ipiv( k )
            IF( kp.NE.k+1 )
     $         CALL cswap( nrhs, b( k+1, 1 ), ldb, b( kp, 1 ), ldb )
*
*           Multiply by inv(L(K)), where L(K) is the transformation
*           stored in columns K and K+1 of A.
*
            IF( k.LT.n-1 ) THEN
               CALL cgeru( n-k-1, nrhs, -one, ap( kc+2 ), 1, b( k, 1 ),
     $                     ldb, b( k+2, 1 ), ldb )
               CALL cgeru( n-k-1, nrhs, -one, ap( kc+n-k+2 ), 1,
     $                     b( k+1, 1 ), ldb, b( k+2, 1 ), ldb )
            END IF
*
*           Multiply by the inverse of the diagonal block.
*
!           Same scaled 2 x 2 solve as in the upper branch: AP(KC+1) is
!           the off-diagonal entry, AP(KC) and AP(KC+N-K+1) the two
!           diagonal entries.
            akm1k = ap( kc+1 )
            akm1 = ap( kc ) / akm1k
            ak = ap( kc+n-k+1 ) / akm1k
            denom = akm1*ak - one
            DO 70 j = 1, nrhs
               bkm1 = b( k, j ) / akm1k
               bk = b( k+1, j ) / akm1k
               b( k, j ) = ( ak*bkm1-bk ) / denom
               b( k+1, j ) = ( akm1*bk-bkm1 ) / denom
   70       CONTINUE
!           Skip columns K (N-K+1 entries) and K+1 (N-K entries).
            kc = kc + 2*( n-k ) + 1
            k = k + 2
         END IF
*
         GO TO 60
   80    CONTINUE
*
*        Next solve L**T*X = B, overwriting B with X.
*
*        K is the main loop index, decreasing from N to 1 in steps of
*        1 or 2, depending on the size of the diagonal blocks.
*
!        KC again starts one past the end of AP; subtracting N-K+1 at
!        the top of each pass lands it on the diagonal entry of column K.
         k = n
         kc = n*( n+1 ) / 2 + 1
   90    CONTINUE
*
*        If K < 1, exit from loop.
*
         IF( k.LT.1 )
     $      GO TO 100
*
         kc = kc - ( n-k+1 )
         IF( ipiv( k ).GT.0 ) THEN
*
*           1 x 1 diagonal block
*
*           Multiply by inv(L**T(K)), where L(K) is the transformation
*           stored in column K of A.
*
            IF( k.LT.n )
     $         CALL cgemv( 'Transpose', n-k, nrhs, -one, b( k+1, 1 ),
     $                     ldb, ap( kc+1 ), 1, one, b( k, 1 ), ldb )
*
*           Interchange rows K and IPIV(K).
*
            kp = ipiv( k )
            IF( kp.NE.k )
     $         CALL cswap( nrhs, b( k, 1 ), ldb, b( kp, 1 ), ldb )
            k = k - 1
         ELSE
*
*           2 x 2 diagonal block
*
*           Multiply by inv(L**T(K-1)), where L(K-1) is the transformation
*           stored in columns K-1 and K of A.
*
            IF( k.LT.n ) THEN
               CALL cgemv( 'Transpose', n-k, nrhs, -one, b( k+1, 1 ),
     $                     ldb, ap( kc+1 ), 1, one, b( k, 1 ), ldb )
               CALL cgemv( 'Transpose', n-k, nrhs, -one, b( k+1, 1 ),
     $                     ldb, ap( kc-( n-k ) ), 1, one, b( k-1, 1 ),
     $                     ldb )
            END IF
*
*           Interchange rows K and -IPIV(K).
*
            kp = -ipiv( k )
            IF( kp.NE.k )
     $         CALL cswap( nrhs, b( k, 1 ), ldb, b( kp, 1 ), ldb )
!           Extra step back over column K-1 (N-K+2 entries), handled
!           together with column K in this pass.
            kc = kc - ( n-k+2 )
            k = k - 2
         END IF
*
         GO TO 90
  100    CONTINUE
      END IF
*
      RETURN
*
*     End of CSPTRS
*

◆ cstedc()

subroutine cstedc	(	character	compz,
		integer	n,
		real, dimension( * )	d,
		real, dimension( * )	e,
		complex, dimension( ldz, * )	z,
		integer	ldz,
		complex, dimension( * )	work,
		integer	lwork,
		real, dimension( * )	rwork,
		integer	lrwork,
		integer, dimension( * )	iwork,
		integer	liwork,
		integer	info )

CSTEDC

Download CSTEDC + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CSTEDC computes all eigenvalues and, optionally, eigenvectors of a
!> symmetric tridiagonal matrix using the divide and conquer method.
!> The eigenvectors of a full or band complex Hermitian matrix can also
!> be found if CHETRD or CHPTRD or CHBTRD has been used to reduce this
!> matrix to tridiagonal form.
!>
!> This code makes very mild assumptions about floating point
!> arithmetic. It will work on machines with a guard digit in
!> add/subtract, or on those binary machines without guard digits
!> which subtract like the Cray X-MP, Cray Y-MP, Cray C-90, or Cray-2.
!> It could conceivably fail on hexadecimal or decimal machines
!> without guard digits, but we know of none.  See SLAED3 for details.
!>

Parameters

[in]	COMPZ	!> COMPZ is CHARACTER*1 !> = 'N': Compute eigenvalues only. !> = 'I': Compute eigenvectors of tridiagonal matrix also. !> = 'V': Compute eigenvectors of original Hermitian matrix !> also. On entry, Z contains the unitary matrix used !> to reduce the original matrix to tridiagonal form. !>
[in]	N	!> N is INTEGER !> The dimension of the symmetric tridiagonal matrix. N >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the diagonal elements of the tridiagonal matrix. !> On exit, if INFO = 0, the eigenvalues in ascending order. !>
[in,out]	E	!> E is REAL array, dimension (N-1) !> On entry, the subdiagonal elements of the tridiagonal matrix. !> On exit, E has been destroyed. !>
[in,out]	Z	!> Z is COMPLEX array, dimension (LDZ,N) !> On entry, if COMPZ = 'V', then Z contains the unitary !> matrix used in the reduction to tridiagonal form. !> On exit, if INFO = 0, then if COMPZ = 'V', Z contains the !> orthonormal eigenvectors of the original Hermitian matrix, !> and if COMPZ = 'I', Z contains the orthonormal eigenvectors !> of the symmetric tridiagonal matrix. !> If COMPZ = 'N', then Z is not referenced. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. LDZ >= 1. !> If eigenvectors are desired, then LDZ >= max(1,N). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If COMPZ = 'N' or 'I', or N <= 1, LWORK must be at least 1. !> If COMPZ = 'V' and N > 1, LWORK must be at least N*N. !> Note that for COMPZ = 'V', then if N is less than or !> equal to the minimum divide size, usually 25, then LWORK need !> only be 1. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal sizes of the WORK, RWORK and !> IWORK arrays, returns these values as the first entries of !> the WORK, RWORK and IWORK arrays, and no error message !> related to LWORK or LRWORK or LIWORK is issued by XERBLA. !>
[out]	RWORK	!> RWORK is REAL array, dimension (MAX(1,LRWORK)) !> On exit, if INFO = 0, RWORK(1) returns the optimal LRWORK. !>
[in]	LRWORK	!> LRWORK is INTEGER !> The dimension of the array RWORK. !> If COMPZ = 'N' or N <= 1, LRWORK must be at least 1. !> If COMPZ = 'V' and N > 1, LRWORK must be at least !> 1 + 3*N + 2*N*lg N + 4*N**2 , !> where lg( N ) = smallest integer k such !> that 2**k >= N. !> If COMPZ = 'I' and N > 1, LRWORK must be at least !> 1 + 4*N + 2*N**2 . !> Note that for COMPZ = 'I' or 'V', then if N is less than or !> equal to the minimum divide size, usually 25, then LRWORK !> need only be max(1,2*(N-1)). !> !> If LRWORK = -1, then a workspace query is assumed; the !> routine only calculates the optimal sizes of the WORK, RWORK !> and IWORK arrays, returns these values as the first entries !> of the WORK, RWORK and IWORK arrays, and no error message !> related to LWORK or LRWORK or LIWORK is issued by XERBLA. !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (MAX(1,LIWORK)) !> On exit, if INFO = 0, IWORK(1) returns the optimal LIWORK. !>
[in]	LIWORK	!> LIWORK is INTEGER !> The dimension of the array IWORK. !> If COMPZ = 'N' or N <= 1, LIWORK must be at least 1. !> If COMPZ = 'V' and N > 1, LIWORK must be at least !> 6 + 6*N + 5*N*lg N. !> If COMPZ = 'I' and N > 1, LIWORK must be at least !> 3 + 5*N . !> Note that for COMPZ = 'I' or 'V', then if N is less than or !> equal to the minimum divide size, usually 25, then LIWORK !> need only be 1. !> !> If LIWORK = -1, then a workspace query is assumed; the !> routine only calculates the optimal sizes of the WORK, RWORK !> and IWORK arrays, returns these values as the first entries !> of the WORK, RWORK and IWORK arrays, and no error message !> related to LWORK or LRWORK or LIWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: The algorithm failed to compute an eigenvalue while !> working on the submatrix lying in rows and columns !> INFO/(N+1) through mod(INFO,N+1). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Jeff Rutter, Computer Science Division, University of California at Berkeley, USA

Definition at line 210 of file cstedc.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
!     Overview of the CSTEDC body below:
!       1. Decode COMPZ into ICOMPZ (0 = 'N', 1 = 'V', 2 = 'I') and
!          check COMPZ, N and LDZ.
!       2. Compute the minimum workspace sizes LWMIN, LRWMIN, LIWMIN,
!          store them in WORK(1), RWORK(1), IWORK(1), and check the
!          supplied sizes unless this is a workspace query.
!       3. Dispatch: SSTERF for eigenvalues only; CSTEQR when
!          N <= SMLSIZ; SSTEDC on a real copy when COMPZ = 'I';
!          otherwise split the matrix at negligible subdiagonals and
!          solve each piece with CLAED0 (large) or SSTEQR (small).
!       4. For the COMPZ = 'V' path, sort eigenvalues into ascending
!          order, swapping the matching columns of Z.
!
*     .. Scalar Arguments ..
      CHARACTER          COMPZ
      INTEGER            INFO, LDZ, LIWORK, LRWORK, LWORK, N
*     ..
*     .. Array Arguments ..
      INTEGER            IWORK( * )
      REAL               D( * ), E( * ), RWORK( * )
      COMPLEX            WORK( * ), Z( LDZ, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE, TWO
      parameter( zero = 0.0e0, one = 1.0e0, two = 2.0e0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            LQUERY
      INTEGER            FINISH, I, ICOMPZ, II, J, K, LGN, LIWMIN, LL,
     $                   LRWMIN, LWMIN, M, SMLSIZ, START
      REAL               EPS, ORGNRM, P, TINY
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      REAL               SLAMCH, SLANST
      EXTERNAL           ilaenv, lsame, slamch, slanst
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla, clacpy, clacrm, claed0, csteqr, cswap,
     $                   slascl, slaset, sstedc, ssteqr, ssterf
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, int, log, max, mod, real, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
!     A value of -1 in any one of the three size arguments turns the
!     call into a workspace query.
      info = 0
      lquery = ( lwork.EQ.-1 .OR. lrwork.EQ.-1 .OR. liwork.EQ.-1 )
*
      IF( lsame( compz, 'N' ) ) THEN
         icompz = 0
      ELSE IF( lsame( compz, 'V' ) ) THEN
         icompz = 1
      ELSE IF( lsame( compz, 'I' ) ) THEN
         icompz = 2
      ELSE
         icompz = -1
      END IF
      IF( icompz.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ( ldz.LT.1 ) .OR.
     $         ( icompz.GT.0 .AND. ldz.LT.max( 1, n ) ) ) THEN
         info = -6
      END IF
*
      IF( info.EQ.0 ) THEN
*
*        Compute the workspace requirements
*
         smlsiz = ilaenv( 9, 'CSTEDC', ' ', 0, 0, 0, 0 )
         IF( n.LE.1 .OR. icompz.EQ.0 ) THEN
            lwmin = 1
            liwmin = 1
            lrwmin = 1
         ELSE IF( n.LE.smlsiz ) THEN
            lwmin = 1
            liwmin = 1
            lrwmin = 2*( n - 1 )
         ELSE IF( icompz.EQ.1 ) THEN
!           LGN is meant to be the smallest integer with 2**LGN >= N.
!           The increment test is applied twice; presumably this
!           absorbs rounding in the LOG quotient -- TODO confirm.
            lgn = int( log( real( n ) ) / log( two ) )
            IF( 2**lgn.LT.n )
     $         lgn = lgn + 1
            IF( 2**lgn.LT.n )
     $         lgn = lgn + 1
            lwmin = n*n
            lrwmin = 1 + 3*n + 2*n*lgn + 4*n**2
            liwmin = 6 + 6*n + 5*n*lgn
         ELSE IF( icompz.EQ.2 ) THEN
            lwmin = 1
            lrwmin = 1 + 4*n + 2*n**2
            liwmin = 3 + 5*n
         END IF
         work( 1 ) = lwmin
         rwork( 1 ) = lrwmin
         iwork( 1 ) = liwmin
*
!        The INFO values are the (negated) positions of LWORK, LRWORK
!        and LIWORK in the argument list.
         IF( lwork.LT.lwmin .AND. .NOT.lquery ) THEN
            info = -8
         ELSE IF( lrwork.LT.lrwmin .AND. .NOT.lquery ) THEN
            info = -10
         ELSE IF( liwork.LT.liwmin .AND. .NOT.lquery ) THEN
            info = -12
         END IF
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CSTEDC', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
      IF( n.EQ.1 ) THEN
         IF( icompz.NE.0 )
     $      z( 1, 1 ) = one
         RETURN
      END IF
*
*     If the following conditional clause is removed, then the routine
*     will use the Divide and Conquer routine to compute only the
*     eigenvalues, which requires (3N + 3N**2) real workspace and
*     (2 + 5N + 2N lg(N)) integer workspace.
*     Since on many architectures SSTERF is much faster than any other
*     algorithm for finding eigenvalues only, it is used here
*     as the default. If the conditional clause is removed, then
*     information on the size of workspace needs to be changed.
*
*     If COMPZ = 'N', use SSTERF to compute the eigenvalues.
*
      IF( icompz.EQ.0 ) THEN
         CALL ssterf( n, d, e, info )
         GO TO 70
      END IF
*
*     If N is smaller than the minimum divide size (SMLSIZ+1), then
*     solve the problem with another solver.
*
      IF( n.LE.smlsiz ) THEN
*
         CALL csteqr( compz, n, d, e, z, ldz, rwork, info )
*
      ELSE
*
*        If COMPZ = 'I', we simply call SSTEDC instead.
*
!        The first N*N entries of RWORK hold the real N-by-N
!        eigenvector matrix (initialised to the identity); the rest of
!        RWORK, from index LL on, is handed to SSTEDC as its workspace.
!        The real result is then copied element by element into Z.
         IF( icompz.EQ.2 ) THEN
            CALL slaset( 'Full', n, n, zero, one, rwork, n )
            ll = n*n + 1
            CALL sstedc( 'I', n, d, e, rwork, n,
     $                   rwork( ll ), lrwork-ll+1, iwork, liwork, info )
            DO 20 j = 1, n
               DO 10 i = 1, n
                  z( i, j ) = rwork( ( j-1 )*n+i )
   10          CONTINUE
   20       CONTINUE
            GO TO 70
         END IF
*
*        From now on, only option left to be handled is COMPZ = 'V',
*        i.e. ICOMPZ = 1.
*
*        Scale.
*
!        A zero norm skips the splitting loop and the sort entirely.
         orgnrm = slanst( 'M', n, d, e )
         IF( orgnrm.EQ.zero )
     $      GO TO 70
*
         eps = slamch( 'Epsilon' )
*
         start = 1
*
*        while ( START <= N )
*
   30    CONTINUE
         IF( start.LE.n ) THEN
*
*           Let FINISH be the position of the next subdiagonal entry
*           such that E( FINISH ) <= TINY or FINISH = N if no such
*           subdiagonal exists.  The matrix identified by the elements
*           between START and FINISH constitutes an independent
*           sub-problem.
*
            finish = start
   40       CONTINUE
            IF( finish.LT.n ) THEN
               tiny = eps*sqrt( abs( d( finish ) ) )*
     $                    sqrt( abs( d( finish+1 ) ) )
               IF( abs( e( finish ) ).GT.tiny ) THEN
                  finish = finish + 1
                  GO TO 40
               END IF
            END IF
*
*           (Sub) Problem determined.  Compute its size and solve it.
*
            m = finish - start + 1
            IF( m.GT.smlsiz ) THEN
*
*              Scale.
*
               orgnrm = slanst( 'M', m, d( start ), e( start ) )
               CALL slascl( 'G', 0, 0, orgnrm, one, m, 1, d( start ), m,
     $                      info )
               CALL slascl( 'G', 0, 0, orgnrm, one, m-1, 1, e( start ),
     $                      m-1, info )
*
               CALL claed0( n, m, d( start ), e( start ), z( 1, start ),
     $                      ldz, work, n, rwork, iwork, info )
!              On failure, re-express the sub-problem INFO returned by
!              CLAED0 in terms of the full matrix: quotient and
!              remainder with respect to M+1 are each shifted by
!              START-1 and recombined with respect to N+1.
               IF( info.GT.0 ) THEN
                  info = ( info / ( m+1 )+start-1 )*( n+1 ) +
     $                   mod( info, ( m+1 ) ) + start - 1
                  GO TO 70
               END IF
*
*              Scale back.
*
!              Only D is scaled back here; E is not restored.
               CALL slascl( 'G', 0, 0, one, orgnrm, m, 1, d( start ), m,
     $                      info )
*
            ELSE
!              Small sub-problem: SSTEQR computes real eigenvectors into
!              RWORK(1:M*M) using RWORK(M*M+1:) as scratch; CLACRM
!              multiplies the matching columns of Z by them into WORK,
!              and CLACPY copies the product back into Z. Note that
!              INFO from SSTEQR is tested only after those two calls.
               CALL ssteqr( 'I', m, d( start ), e( start ), rwork, m,
     $                      rwork( m*m+1 ), info )
               CALL clacrm( n, m, z( 1, start ), ldz, rwork, m, work, n,
     $                      rwork( m*m+1 ) )
               CALL clacpy( 'A', n, m, work, n, z( 1, start ), ldz )
               IF( info.GT.0 ) THEN
                  info = start*( n+1 ) + finish
                  GO TO 70
               END IF
            END IF
*
            start = finish + 1
            GO TO 30
         END IF
*
*        endwhile
*
*
*        Use Selection Sort to minimize swaps of eigenvectors
*
!        For each position I, find the smallest remaining eigenvalue
!        D(K) among D(I:N); if it is not already at I, exchange the two
!        eigenvalues and the corresponding columns of Z.
         DO 60 ii = 2, n
           i = ii - 1
           k = i
           p = d( i )
           DO 50 j = ii, n
              IF( d( j ).LT.p ) THEN
                 k = j
                 p = d( j )
              END IF
   50      CONTINUE
           IF( k.NE.i ) THEN
              d( k ) = d( i )
              d( i ) = p
              CALL cswap( n, z( 1, i ), 1, z( 1, k ), 1 )
           END IF
   60    CONTINUE
      END IF
*
!     Common exit: every path that gets past the quick returns ends
!     here, including the failure exits above, and rewrites the minimum
!     workspace sizes into the first entries of the work arrays.
   70 CONTINUE
      work( 1 ) = lwmin
      rwork( 1 ) = lrwmin
      iwork( 1 ) = liwmin
*
      RETURN
*
*     End of CSTEDC
*

◆ cstegr()

subroutine cstegr	(	character	jobz,
		character	range,
		integer	n,
		real, dimension( * )	d,
		real, dimension( * )	e,
		real	vl,
		real	vu,
		integer	il,
		integer	iu,
		real	abstol,
		integer	m,
		real, dimension( * )	w,
		complex, dimension( ldz, * )	z,
		integer	ldz,
		integer, dimension( * )	isuppz,
		real, dimension( * )	work,
		integer	lwork,
		integer, dimension( * )	iwork,
		integer	liwork,
		integer	info )

CSTEGR

Download CSTEGR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CSTEGR computes selected eigenvalues and, optionally, eigenvectors
!> of a real symmetric tridiagonal matrix T. Any such unreduced matrix has
!> a well defined set of pairwise different real eigenvalues, the corresponding
!> real eigenvectors are pairwise orthogonal.
!>
!> The spectrum may be computed either completely or partially by specifying
!> either an interval (VL,VU] or a range of indices IL:IU for the desired
!> eigenvalues.
!>
!> CSTEGR is a compatibility wrapper around the improved CSTEMR routine.
!> See SSTEMR for further details.
!>
!> One important change is that the ABSTOL parameter no longer provides any
!> benefit and hence is no longer used.
!>
!> Note : CSTEGR and CSTEMR work only on machines which follow
!> IEEE-754 floating-point standard in their handling of infinities and
!> NaNs.  Normal execution may create these exceptional values and hence
!> may abort due to a floating point exception in environments which
!> do not conform to the IEEE-754 standard.
!>

Parameters

[in]	JOBZ	!> JOBZ is CHARACTER*1 !> = 'N': Compute eigenvalues only; !> = 'V': Compute eigenvalues and eigenvectors. !>
[in]	RANGE	!> RANGE is CHARACTER*1 !> = 'A': all eigenvalues will be found. !> = 'V': all eigenvalues in the half-open interval (VL,VU] !> will be found. !> = 'I': the IL-th through IU-th eigenvalues will be found. !>
[in]	N	!> N is INTEGER !> The order of the matrix. N >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the N diagonal elements of the tridiagonal matrix !> T. On exit, D is overwritten. !>
[in,out]	E	!> E is REAL array, dimension (N) !> On entry, the (N-1) subdiagonal elements of the tridiagonal !> matrix T in elements 1 to N-1 of E. E(N) need not be set on !> input, but is used internally as workspace. !> On exit, E is overwritten. !>
[in]	VL	!> VL is REAL !> !> If RANGE='V', the lower bound of the interval to !> be searched for eigenvalues. VL < VU. !> Not referenced if RANGE = 'A' or 'I'. !>
[in]	VU	!> VU is REAL !> !> If RANGE='V', the upper bound of the interval to !> be searched for eigenvalues. VL < VU. !> Not referenced if RANGE = 'A' or 'I'. !>
[in]	IL	!> IL is INTEGER !> !> If RANGE='I', the index of the !> smallest eigenvalue to be returned. !> 1 <= IL <= IU <= N, if N > 0. !> Not referenced if RANGE = 'A' or 'V'. !>
[in]	IU	!> IU is INTEGER !> !> If RANGE='I', the index of the !> largest eigenvalue to be returned. !> 1 <= IL <= IU <= N, if N > 0. !> Not referenced if RANGE = 'A' or 'V'. !>
[in]	ABSTOL	!> ABSTOL is REAL !> Unused. Was the absolute error tolerance for the !> eigenvalues/eigenvectors in previous versions. !>
[out]	M	!> M is INTEGER !> The total number of eigenvalues found. 0 <= M <= N. !> If RANGE = 'A', M = N, and if RANGE = 'I', M = IU-IL+1. !>
[out]	W	!> W is REAL array, dimension (N) !> The first M elements contain the selected eigenvalues in !> ascending order. !>
[out]	Z	!> Z is COMPLEX array, dimension (LDZ, max(1,M) ) !> If JOBZ = 'V', and if INFO = 0, then the first M columns of Z !> contain the orthonormal eigenvectors of the matrix T !> corresponding to the selected eigenvalues, with the i-th !> column of Z holding the eigenvector associated with W(i). !> If JOBZ = 'N', then Z is not referenced. !> Note: the user must ensure that at least max(1,M) columns are !> supplied in the array Z; if RANGE = 'V', the exact value of M !> is not known in advance and an upper bound must be used. !> Supplying N columns is always safe. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. LDZ >= 1, and if !> JOBZ = 'V', then LDZ >= max(1,N). !>
[out]	ISUPPZ	!> ISUPPZ is INTEGER array, dimension ( 2*max(1,M) ) !> The support of the eigenvectors in Z, i.e., the indices !> indicating the nonzero elements in Z. The i-th computed eigenvector !> is nonzero only in elements ISUPPZ( 2*i-1 ) through !> ISUPPZ( 2*i ). This is relevant in the case when the matrix !> is split. ISUPPZ is only accessed when JOBZ is 'V' and N > 0. !>
[out]	WORK	!> WORK is REAL array, dimension (LWORK) !> On exit, if INFO = 0, WORK(1) returns the optimal !> (and minimal) LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,18*N) !> if JOBZ = 'V', and LWORK >= max(1,12*N) if JOBZ = 'N'. !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (LIWORK) !> On exit, if INFO = 0, IWORK(1) returns the optimal LIWORK. !>
[in]	LIWORK	!> LIWORK is INTEGER !> The dimension of the array IWORK. LIWORK >= max(1,10*N) !> if the eigenvectors are desired, and LIWORK >= max(1,8*N) !> if only the eigenvalues are to be computed. !> If LIWORK = -1, then a workspace query is assumed; the !> routine only calculates the optimal size of the IWORK array, !> returns this value as the first entry of the IWORK array, and !> no error message related to LIWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> On exit, INFO !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = 1X, internal error in SLARRE, !> if INFO = 2X, internal error in CLARRV. !> Here, the digit X = ABS( IINFO ) < 10, where IINFO is !> the nonzero error code returned by SLARRE or !> CLARRV, respectively. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Inderjit Dhillon, IBM Almaden, USA
Osni Marques, LBNL/NERSC, USA
Christof Voemel, LBNL/NERSC, USA

Definition at line 262 of file cstegr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     This body is a thin wrapper: it forwards its arguments to CSTEMR,
*     supplying N as the NZC argument and a local .FALSE. flag as the
*     TRYRAC argument.  ABSTOL is declared but never referenced here.
*
*     .. Arguments: scalars ..
      CHARACTER          JOBZ, RANGE
      REAL               ABSTOL, VL, VU
      INTEGER            N, M, IL, IU, LDZ, LWORK, LIWORK, INFO
*     .. Arguments: arrays ..
      REAL               D( * ), E( * ), W( * ), WORK( * )
      COMPLEX            Z( LDZ, * )
      INTEGER            ISUPPZ( * ), IWORK( * )
*
*  =====================================================================
*
*     .. Local flag handed to CSTEMR in its TRYRAC position ..
      LOGICAL            RELACC
*     .. Routine that performs the actual computation ..
      EXTERNAL           CSTEMR
*
*     .. Executable Statements ..
*
*     Do not request the relative-accuracy check, and start from a
*     clean status flag.
      RELACC = .FALSE.
      INFO = 0
*
*     Delegate; the 14th actual argument (NZC) is N.
      CALL CSTEMR( JOBZ, RANGE, N, D, E, VL, VU, IL, IU, M, W, Z, LDZ,
     $             N, ISUPPZ, RELACC, WORK, LWORK, IWORK, LIWORK,
     $             INFO )
*
*     End of CSTEGR
*

◆ cstein()

subroutine cstein	(	integer	n,
		real, dimension( * )	d,
		real, dimension( * )	e,
		integer	m,
		real, dimension( * )	w,
		integer, dimension( * )	iblock,
		integer, dimension( * )	isplit,
		complex, dimension( ldz, * )	z,
		integer	ldz,
		real, dimension( * )	work,
		integer, dimension( * )	iwork,
		integer, dimension( * )	ifail,
		integer	info )

CSTEIN

Download CSTEIN + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CSTEIN computes the eigenvectors of a real symmetric tridiagonal
!> matrix T corresponding to specified eigenvalues, using inverse
!> iteration.
!>
!> The maximum number of iterations allowed for each eigenvector is
!> specified by an internal parameter MAXITS (currently set to 5).
!>
!> Although the eigenvectors are real, they are stored in a complex
!> array, which may be passed to CUNMTR or CUPMTR for back
!> transformation to the eigenvectors of a complex Hermitian matrix
!> which was reduced to tridiagonal form.
!>
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the matrix. N >= 0. !>
[in]	D	!> D is REAL array, dimension (N) !> The n diagonal elements of the tridiagonal matrix T. !>
[in]	E	!> E is REAL array, dimension (N-1) !> The (n-1) subdiagonal elements of the tridiagonal matrix !> T, stored in elements 1 to N-1. !>
[in]	M	!> M is INTEGER !> The number of eigenvectors to be found. 0 <= M <= N. !>
[in]	W	!> W is REAL array, dimension (N) !> The first M elements of W contain the eigenvalues for !> which eigenvectors are to be computed. The eigenvalues !> should be grouped by split-off block and ordered from !> smallest to largest within the block. ( The output array !> W from SSTEBZ with ORDER = 'B' is expected here. ) !>
[in]	IBLOCK	!> IBLOCK is INTEGER array, dimension (N) !> The submatrix indices associated with the corresponding !> eigenvalues in W; IBLOCK(i)=1 if eigenvalue W(i) belongs to !> the first submatrix from the top, =2 if W(i) belongs to !> the second submatrix, etc. ( The output array IBLOCK !> from SSTEBZ is expected here. ) !>
[in]	ISPLIT	!> ISPLIT is INTEGER array, dimension (N) !> The splitting points, at which T breaks up into submatrices. !> The first submatrix consists of rows/columns 1 to !> ISPLIT( 1 ), the second of rows/columns ISPLIT( 1 )+1 !> through ISPLIT( 2 ), etc. !> ( The output array ISPLIT from SSTEBZ is expected here. ) !>
[out]	Z	!> Z is COMPLEX array, dimension (LDZ, M) !> The computed eigenvectors. The eigenvector associated !> with the eigenvalue W(i) is stored in the i-th column of !> Z. Any vector which fails to converge is set to its current !> iterate after MAXITS iterations. !> The imaginary parts of the eigenvectors are set to zero. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. LDZ >= max(1,N). !>
[out]	WORK	!> WORK is REAL array, dimension (5*N) !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (N) !>
[out]	IFAIL	!> IFAIL is INTEGER array, dimension (M) !> On normal exit, all elements of IFAIL are zero. !> If one or more eigenvectors fail to converge after !> MAXITS iterations, then their indices are stored in !> array IFAIL. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, then i eigenvectors failed to converge !> in MAXITS iterations. Their indices are stored in !> array IFAIL. !>

Internal Parameters:

!>  MAXITS  INTEGER, default = 5
!>          The maximum number of iterations performed.
!>
!>  EXTRA   INTEGER, default = 2
!>          The number of iterations performed after norm growth
!>          criterion is satisfied, should be at least 1.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 180 of file cstein.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Overview of the code below: for every split-off block described
*     by IBLOCK/ISPLIT, each eigenvalue W(j) assigned to that block is
*     used as a shift XJ.  A copy of the block is handed to SLAGTF
*     together with XJ, and the resulting factors are used by SLAGTS
*     in a loop that starts from a random vector drawn by SLARNV.
*     The accepted iterate is normalized and written into column j of
*     Z with zero imaginary part.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDZ, M, N
*     ..
*     .. Array Arguments ..
      INTEGER            IBLOCK( * ), IFAIL( * ), ISPLIT( * ),
     $                   IWORK( * )
      REAL               D( * ), E( * ), W( * ), WORK( * )
      COMPLEX            Z( LDZ, * )
*     ..
*
* =====================================================================
*
*     .. Parameters ..
*     ODM3 scales ONENRM to give the reorthogonalization threshold
*     ORTOL; ODM1 enters the stopping threshold STPCRT; TEN scales the
*     perturbation applied to nearly coincident shifts.
      COMPLEX            CZERO, CONE
      parameter( czero = ( 0.0e+0, 0.0e+0 ),
     $                   cone = ( 1.0e+0, 0.0e+0 ) )
      REAL               ZERO, ONE, TEN, ODM3, ODM1
      parameter( zero = 0.0e+0, one = 1.0e+0, ten = 1.0e+1,
     $                   odm3 = 1.0e-3, odm1 = 1.0e-1 )
      INTEGER            MAXITS, EXTRA
      parameter( maxits = 5, extra = 2 )
*     ..
*     .. Local Scalars ..
*     B1, BN  : first and last row/column of the current block.
*     BLKSIZ  : BN - B1 + 1.
*     J1      : index in W of the first eigenvalue not yet processed.
*     JBLK    : position of eigenvalue j within the current block.
*     GPIND   : first column of Z that the current iterate is
*               orthogonalized against.
*     XJ, XJM : current shift and the shift used for eigenvalue j-1.
*     ITS     : iteration counter; NRMCHK counts iterations whose
*               norm reached STPCRT.
      INTEGER            B1, BLKSIZ, BN, GPIND, I, IINFO, INDRV1,
     $                   INDRV2, INDRV3, INDRV4, INDRV5, ITS, J, J1,
     $                   JBLK, JMAX, JR, NBLK, NRMCHK
      REAL               CTR, EPS, EPS1, NRM, ONENRM, ORTOL, PERTOL,
     $                   SCL, SEP, STPCRT, TOL, XJ, XJM
*     ..
*     .. Local Arrays ..
      INTEGER            ISEED( 4 )
*     ..
*     .. External Functions ..
      INTEGER            ISAMAX
      REAL               SLAMCH, SNRM2
      EXTERNAL           isamax, slamch, snrm2
*     ..
*     .. External Subroutines ..
      EXTERNAL           scopy, slagtf, slagts, slarnv, sscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, cmplx, max, real, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
*     IFAIL( 1:M ) is cleared before any argument is validated; the
*     loop body is not executed when M < 1.
*
      info = 0
      DO 10 i = 1, m
         ifail( i ) = 0
   10 CONTINUE
*
      IF( n.LT.0 ) THEN
         info = -1
      ELSE IF( m.LT.0 .OR. m.GT.n ) THEN
         info = -4
      ELSE IF( ldz.LT.max( 1, n ) ) THEN
         info = -9
      ELSE
*
*        Ordering checks on the first M entries:
*        INFO = -6 if IBLOCK decreases from one entry to the next;
*        INFO = -5 if W decreases between two entries that carry the
*        same IBLOCK value.  The scan stops at the first violation.
*
         DO 20 j = 2, m
            IF( iblock( j ).LT.iblock( j-1 ) ) THEN
               info = -6
               GO TO 30
            END IF
            IF( iblock( j ).EQ.iblock( j-1 ) .AND. w( j ).LT.w( j-1 ) )
     $           THEN
               info = -5
               GO TO 30
            END IF
   20    CONTINUE
   30    CONTINUE
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CSTEIN', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
*     For N = 1 (and M nonzero) the single entry Z(1,1) is set to one.
*
      IF( n.EQ.0 .OR. m.EQ.0 ) THEN
         RETURN
      ELSE IF( n.EQ.1 ) THEN
         z( 1, 1 ) = cone
         RETURN
      END IF
*
*     Get machine constants.
*
      eps = slamch( 'Precision' )
*
*     Initialize seed for random number generator SLARNV.
*
*     The seed is the same on every call (all four entries are 1).
*
      DO 40 i = 1, 4
         iseed( i ) = 1
   40 CONTINUE
*
*     Initialize pointers.
*
*     WORK is addressed as five consecutive segments of length N;
*     INDRVk is the zero-based offset of segment k.  As used below:
*       segment 1 : current iterate / right-hand side
*       segment 2 : copy of E, stored from position 2
*       segment 3 : copy of E, stored from position 1
*       segment 4 : copy of D
*       segment 5 : additional array passed to SLAGTF and SLAGTS
*
      indrv1 = 0
      indrv2 = indrv1 + n
      indrv3 = indrv2 + n
      indrv4 = indrv3 + n
      indrv5 = indrv4 + n
*
*     Compute eigenvectors of matrix blocks.
*
*     Only blocks 1 .. IBLOCK( M ) are visited.
*
      j1 = 1
      DO 180 nblk = 1, iblock( m )
*
*        Find starting and ending indices of block nblk.
*
         IF( nblk.EQ.1 ) THEN
            b1 = 1
         ELSE
            b1 = isplit( nblk-1 ) + 1
         END IF
         bn = isplit( nblk )
         blksiz = bn - b1 + 1
*
*        A 1-by-1 block needs none of the norms computed below.
*
         IF( blksiz.EQ.1 )
     $      GO TO 60
         gpind = j1
*
*        Compute reorthogonalization criterion and stopping criterion.
*
*        ONENRM is the largest sum |D(i)| + |E(i-1)| + |E(i)| over the
*        rows of the block, with the missing off-diagonal term dropped
*        in the first and last rows.
*
         onenrm = abs( d( b1 ) ) + abs( e( b1 ) )
         onenrm = max( onenrm, abs( d( bn ) )+abs( e( bn-1 ) ) )
         DO 50 i = b1 + 1, bn - 1
            onenrm = max( onenrm, abs( d( i ) )+abs( e( i-1 ) )+
     $               abs( e( i ) ) )
   50    CONTINUE
         ortol = odm3*onenrm
*
         stpcrt = sqrt( odm1 / blksiz )
*
*        Loop through eigenvalues of block nblk.
*
   60    CONTINUE
         jblk = 0
         DO 170 j = j1, m
*
*           The first eigenvalue belonging to a later block ends this
*           block: remember where to resume and advance the block loop.
*
            IF( iblock( j ).NE.nblk ) THEN
               j1 = j
               GO TO 180
            END IF
            jblk = jblk + 1
            xj = w( j )
*
*           Skip all the work if the block size is one.
*
*           The vector to store is then the single entry one.
*
            IF( blksiz.EQ.1 ) THEN
               work( indrv1+1 ) = one
               GO TO 140
            END IF
*
*           If eigenvalues j and j-1 are too close, add a relatively
*           small perturbation.
*
*           XJM is the (possibly perturbed) shift saved at the end of
*           the previous pass through this loop.
*
            IF( jblk.GT.1 ) THEN
               eps1 = abs( eps*xj )
               pertol = ten*eps1
               sep = xj - xjm
               IF( sep.LT.pertol )
     $            xj = xjm + pertol
            END IF
*
            its = 0
            nrmchk = 0
*
*           Get random starting vector.
*
            CALL slarnv( 2, iseed, blksiz, work( indrv1+1 ) )
*
*           Copy the matrix T so it won't be destroyed in factorization.
*
            CALL scopy( blksiz, d( b1 ), 1, work( indrv4+1 ), 1 )
            CALL scopy( blksiz-1, e( b1 ), 1, work( indrv2+2 ), 1 )
            CALL scopy( blksiz-1, e( b1 ), 1, work( indrv3+1 ), 1 )
*
*           Compute LU factors with partial pivoting  ( PT = LU )
*
*           The shift XJ is passed as the third argument; IINFO is not
*           examined afterwards.
*
            tol = zero
            CALL slagtf( blksiz, work( indrv4+1 ), xj, work( indrv2+2 ),
     $                   work( indrv3+1 ), tol, work( indrv5+1 ), iwork,
     $                   iinfo )
*
*           Update iteration count.
*
*           Label 70 is the top of the iteration; once more than
*           MAXITS passes have been started, control goes to the
*           failure bookkeeping at label 120.
*
   70       CONTINUE
            its = its + 1
            IF( its.GT.maxits )
     $         GO TO 120
*
*           Normalize and scale the righthand side vector Pb.
*
*           The scale factor divides by the entry of largest magnitude
*           in the iterate and multiplies by BLKSIZ*ONENRM times the
*           larger of EPS and the magnitude of the last entry of the
*           segment-4 array returned by SLAGTF.
*
            jmax = isamax( blksiz, work( indrv1+1 ), 1 )
            scl = blksiz*onenrm*max( eps,
     $            abs( work( indrv4+blksiz ) ) ) /
     $            abs( work( indrv1+jmax ) )
            CALL sscal( blksiz, scl, work( indrv1+1 ), 1 )
*
*           Solve the system LU = Pb.
*
*           The solution overwrites the iterate in segment 1.
*
            CALL slagts( -1, blksiz, work( indrv4+1 ), work( indrv2+2 ),
     $                   work( indrv3+1 ), work( indrv5+1 ), iwork,
     $                   work( indrv1+1 ), tol, iinfo )
*
*           Reorthogonalize by modified Gram-Schmidt if eigenvalues are
*           close enough.
*
*           Nothing to orthogonalize against for the first eigenvalue
*           of a block.  Otherwise, a gap larger than ORTOL starts a
*           new group at j; within a group the iterate is made
*           orthogonal to the real parts of columns GPIND .. j-1 of Z,
*           restricted to rows B1 .. BN.
*
            IF( jblk.EQ.1 )
     $         GO TO 110
            IF( abs( xj-xjm ).GT.ortol )
     $         gpind = j
            IF( gpind.NE.j ) THEN
               DO 100 i = gpind, j - 1
                  ctr = zero
                  DO 80 jr = 1, blksiz
                     ctr = ctr + work( indrv1+jr )*
     $                     real( z( b1-1+jr, i ) )
   80             CONTINUE
                  DO 90 jr = 1, blksiz
                     work( indrv1+jr ) = work( indrv1+jr ) -
     $                                   ctr*real( z( b1-1+jr, i ) )
   90             CONTINUE
  100          CONTINUE
            END IF
*
*           Check the infinity norm of the iterate.
*
  110       CONTINUE
            jmax = isamax( blksiz, work( indrv1+1 ), 1 )
            nrm = abs( work( indrv1+jmax ) )
*
*           Continue for additional iterations after norm reaches
*           stopping criterion.
*
*           The iterate is accepted once its norm has reached STPCRT
*           on EXTRA+1 passes (NRMCHK counts them).
*
            IF( nrm.LT.stpcrt )
     $         GO TO 70
            nrmchk = nrmchk + 1
            IF( nrmchk.LT.extra+1 )
     $         GO TO 70
*
            GO TO 130
*
*           If stopping criterion was not satisfied, update info and
*           store eigenvector number in array ifail.
*
*           INFO therefore counts the failures, and the failing
*           indices occupy IFAIL( 1:INFO ).
*
  120       CONTINUE
            info = info + 1
            ifail( info ) = j
*
*           Accept iterate as jth eigenvector.
*
*           Scale to unit 2-norm, flipping the sign if needed so that
*           the entry of largest magnitude is positive.
*
  130       CONTINUE
            scl = one / snrm2( blksiz, work( indrv1+1 ), 1 )
            jmax = isamax( blksiz, work( indrv1+1 ), 1 )
            IF( work( indrv1+jmax ).LT.zero )
     $         scl = -scl
            CALL sscal( blksiz, scl, work( indrv1+1 ), 1 )
*
*           Store the vector: rows 1 .. N of column j are zeroed, then
*           rows B1 .. BN receive the iterate with zero imaginary
*           part.
*
  140       CONTINUE
            DO 150 i = 1, n
               z( i, j ) = czero
  150       CONTINUE
            DO 160 i = 1, blksiz
               z( b1+i-1, j ) = cmplx( work( indrv1+i ), zero )
  160       CONTINUE
*
*           Save the shift to check eigenvalue spacing at next
*           iteration.
*
            xjm = xj
*
  170    CONTINUE
  180 CONTINUE
*
      RETURN
*
*     End of CSTEIN
*

◆ cstemr()

subroutine cstemr	(	character	jobz,
		character	range,
		integer	n,
		real, dimension( * )	d,
		real, dimension( * )	e,
		real	vl,
		real	vu,
		integer	il,
		integer	iu,
		integer	m,
		real, dimension( * )	w,
		complex, dimension( ldz, * )	z,
		integer	ldz,
		integer	nzc,
		integer, dimension( * )	isuppz,
		logical	tryrac,
		real, dimension( * )	work,
		integer	lwork,
		integer, dimension( * )	iwork,
		integer	liwork,
		integer	info )

CSTEMR

Download CSTEMR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CSTEMR computes selected eigenvalues and, optionally, eigenvectors
!> of a real symmetric tridiagonal matrix T. Any such unreduced matrix has
!> a well defined set of pairwise different real eigenvalues, the corresponding
!> real eigenvectors are pairwise orthogonal.
!>
!> The spectrum may be computed either completely or partially by specifying
!> either an interval (VL,VU] or a range of indices IL:IU for the desired
!> eigenvalues.
!>
!> Depending on the number of desired eigenvalues, these are computed either
!> by bisection or the dqds algorithm. Numerically orthogonal eigenvectors are
!> computed by the use of various suitable L D L^T factorizations near clusters
!> of close eigenvalues (referred to as RRRs, Relatively Robust
!> Representations). An informal sketch of the algorithm follows.
!>
!> For each unreduced block (submatrix) of T,
!>    (a) Compute T - sigma I  = L D L^T, so that L and D
!>        define all the wanted eigenvalues to high relative accuracy.
!>        This means that small relative changes in the entries of D and L
!>        cause only small relative changes in the eigenvalues and
!>        eigenvectors. The standard (unfactored) representation of the
!>        tridiagonal matrix T does not have this property in general.
!>    (b) Compute the eigenvalues to suitable accuracy.
!>        If the eigenvectors are desired, the algorithm attains full
!>        accuracy of the computed eigenvalues only right before
!>        the corresponding vectors have to be computed, see steps c) and d).
!>    (c) For each cluster of close eigenvalues, select a new
!>        shift close to the cluster, find a new factorization, and refine
!>        the shifted eigenvalues to suitable accuracy.
!>    (d) For each eigenvalue with a large enough relative separation compute
!>        the corresponding eigenvector by forming a rank revealing twisted
!>        factorization. Go back to (c) for any clusters that remain.
!>
!> For more details, see:
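!> - Inderjit S. Dhillon and Beresford N. Parlett:
!>   "Multiple representations to compute orthogonal eigenvectors
!>   of symmetric tridiagonal matrices,"
!>   Linear Algebra and its Applications, 387(1), pp. 1-28, August 2004.
!> - Inderjit Dhillon and Beresford Parlett:
!>   "Orthogonal Eigenvectors and Relative Gaps,"
!>   SIAM Journal on Matrix Analysis and Applications, Vol. 25,
!>   2004.  Also LAPACK Working Note 154.
!> - Inderjit Dhillon: "A new O(n^2) algorithm for the symmetric
!>   tridiagonal eigenvalue/eigenvector problem",
!>   Computer Science Division Technical Report No. UCB/CSD-97-971,
!>   UC Berkeley, May 1997.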
!>
!> Further Details
!> 1. CSTEMR works only on machines which follow IEEE-754
!> floating-point standard in their handling of infinities and NaNs.
!> This permits the use of efficient inner loops avoiding a check for
!> zero divisors.
!>
!> 2. LAPACK routines can be used to reduce a complex Hermitean matrix to
!> real symmetric tridiagonal form.
!>
!> (Any complex Hermitean tridiagonal matrix has real values on its diagonal
!> and potentially complex numbers on its off-diagonals. By applying a
!> similarity transform with an appropriate diagonal matrix
!> diag(1,e^{i \phi_1}, ... , e^{i \phi_{n-1}}), the complex Hermitean
!> matrix can be transformed into a real symmetric matrix and complex
!> arithmetic can be entirely avoided.)
!>
!> While the eigenvectors of the real symmetric tridiagonal matrix are real,
!> the eigenvectors of original complex Hermitean matrix have complex entries
!> in general.
!> Since LAPACK drivers overwrite the matrix data with the eigenvectors,
!> CSTEMR accepts complex workspace to facilitate interoperability
!> with CUNMTR or CUPMTR.
!>

Parameters

[in]	JOBZ	!> JOBZ is CHARACTER*1 !> = 'N': Compute eigenvalues only; !> = 'V': Compute eigenvalues and eigenvectors. !>
[in]	RANGE	!> RANGE is CHARACTER*1 !> = 'A': all eigenvalues will be found. !> = 'V': all eigenvalues in the half-open interval (VL,VU] !> will be found. !> = 'I': the IL-th through IU-th eigenvalues will be found. !>
[in]	N	!> N is INTEGER !> The order of the matrix. N >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the N diagonal elements of the tridiagonal matrix !> T. On exit, D is overwritten. !>
[in,out]	E	!> E is REAL array, dimension (N) !> On entry, the (N-1) subdiagonal elements of the tridiagonal !> matrix T in elements 1 to N-1 of E. E(N) need not be set on !> input, but is used internally as workspace. !> On exit, E is overwritten. !>
[in]	VL	!> VL is REAL !> !> If RANGE='V', the lower bound of the interval to !> be searched for eigenvalues. VL < VU. !> Not referenced if RANGE = 'A' or 'I'. !>
[in]	VU	!> VU is REAL !> !> If RANGE='V', the upper bound of the interval to !> be searched for eigenvalues. VL < VU. !> Not referenced if RANGE = 'A' or 'I'. !>
[in]	IL	!> IL is INTEGER !> !> If RANGE='I', the index of the !> smallest eigenvalue to be returned. !> 1 <= IL <= IU <= N, if N > 0. !> Not referenced if RANGE = 'A' or 'V'. !>
[in]	IU	!> IU is INTEGER !> !> If RANGE='I', the index of the !> largest eigenvalue to be returned. !> 1 <= IL <= IU <= N, if N > 0. !> Not referenced if RANGE = 'A' or 'V'. !>
[out]	M	!> M is INTEGER !> The total number of eigenvalues found. 0 <= M <= N. !> If RANGE = 'A', M = N, and if RANGE = 'I', M = IU-IL+1. !>
[out]	W	!> W is REAL array, dimension (N) !> The first M elements contain the selected eigenvalues in !> ascending order. !>
[out]	Z	!> Z is COMPLEX array, dimension (LDZ, max(1,M) ) !> If JOBZ = 'V', and if INFO = 0, then the first M columns of Z !> contain the orthonormal eigenvectors of the matrix T !> corresponding to the selected eigenvalues, with the i-th !> column of Z holding the eigenvector associated with W(i). !> If JOBZ = 'N', then Z is not referenced. !> Note: the user must ensure that at least max(1,M) columns are !> supplied in the array Z; if RANGE = 'V', the exact value of M !> is not known in advance and can be computed with a workspace !> query by setting NZC = -1, see below. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. LDZ >= 1, and if !> JOBZ = 'V', then LDZ >= max(1,N). !>
[in]	NZC	!> NZC is INTEGER !> The number of eigenvectors to be held in the array Z. !> If RANGE = 'A', then NZC >= max(1,N). !> If RANGE = 'V', then NZC >= the number of eigenvalues in (VL,VU]. !> If RANGE = 'I', then NZC >= IU-IL+1. !> If NZC = -1, then a workspace query is assumed; the !> routine calculates the number of columns of the array Z that !> are needed to hold the eigenvectors. !> This value is returned as the first entry of the Z array, and !> no error message related to NZC is issued by XERBLA. !>
[out]	ISUPPZ	!> ISUPPZ is INTEGER array, dimension ( 2*max(1,M) ) !> The support of the eigenvectors in Z, i.e., the indices !> indicating the nonzero elements in Z. The i-th computed eigenvector !> is nonzero only in elements ISUPPZ( 2*i-1 ) through !> ISUPPZ( 2*i ). This is relevant in the case when the matrix !> is split. ISUPPZ is only accessed when JOBZ is 'V' and N > 0. !>
[in,out]	TRYRAC	!> TRYRAC is LOGICAL !> If TRYRAC = .TRUE., indicates that the code should check whether !> the tridiagonal matrix defines its eigenvalues to high relative !> accuracy. If so, the code uses relative-accuracy preserving !> algorithms that might be (a bit) slower depending on the matrix. !> If the matrix does not define its eigenvalues to high relative !> accuracy, the code can use possibly faster algorithms. !> If TRYRAC = .FALSE., the code is not required to guarantee !> relatively accurate eigenvalues and can use the fastest possible !> techniques. !> On exit, a .TRUE. TRYRAC will be set to .FALSE. if the matrix !> does not define its eigenvalues to high relative accuracy. !>
[out]	WORK	!> WORK is REAL array, dimension (LWORK) !> On exit, if INFO = 0, WORK(1) returns the optimal !> (and minimal) LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,18*N) !> if JOBZ = 'V', and LWORK >= max(1,12*N) if JOBZ = 'N'. !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (LIWORK) !> On exit, if INFO = 0, IWORK(1) returns the optimal LIWORK. !>
[in]	LIWORK	!> LIWORK is INTEGER !> The dimension of the array IWORK. LIWORK >= max(1,10*N) !> if the eigenvectors are desired, and LIWORK >= max(1,8*N) !> if only the eigenvalues are to be computed. !> If LIWORK = -1, then a workspace query is assumed; the !> routine only calculates the optimal size of the IWORK array, !> returns this value as the first entry of the IWORK array, and !> no error message related to LIWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> On exit, INFO !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = 1X, internal error in SLARRE, !> if INFO = 2X, internal error in CLARRV. !> Here, the digit X = ABS( IINFO ) < 10, where IINFO is !> the nonzero error code returned by SLARRE or !> CLARRV, respectively. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Beresford Parlett, University of California, Berkeley, USA
Jim Demmel, University of California, Berkeley, USA
Inderjit Dhillon, University of Texas, Austin, USA
Osni Marques, LBNL/NERSC, USA
Christof Voemel, University of California, Berkeley, USA

Definition at line 335 of file cstemr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          JOBZ, RANGE
      LOGICAL            TRYRAC
      INTEGER            IL, INFO, IU, LDZ, NZC, LIWORK, LWORK, M, N
      REAL             VL, VU
*     ..
*     .. Array Arguments ..
      INTEGER            ISUPPZ( * ), IWORK( * )
      REAL               D( * ), E( * ), W( * ), WORK( * )
      COMPLEX            Z( LDZ, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE, FOUR, MINRGP
      parameter( zero = 0.0e0, one = 1.0e0,
     $                     four = 4.0e0,
     $                     minrgp = 3.0e-3 )
*     ..
*     .. Local Scalars ..
      LOGICAL            ALLEIG, INDEIG, LQUERY, VALEIG, WANTZ, ZQUERY
      INTEGER            I, IBEGIN, IEND, IFIRST, IIL, IINDBL, IINDW,
     $                   IINDWK, IINFO, IINSPL, IIU, ILAST, IN, INDD,
     $                   INDE2, INDERR, INDGP, INDGRS, INDWRK, ITMP,
     $                   ITMP2, J, JBLK, JJ, LIWMIN, LWMIN, NSPLIT,
     $                   NZCMIN, OFFSET, WBEGIN, WEND
      REAL               BIGNUM, CS, EPS, PIVMIN, R1, R2, RMAX, RMIN,
     $                   RTOL1, RTOL2, SAFMIN, SCALE, SMLNUM, SN,
     $                   THRESH, TMP, TNRM, WL, WU
*     ..
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SLAMCH, SLANST
      EXTERNAL           lsame, slamch, slanst
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarrv, cswap, scopy, slae2, slaev2, slarrc,
     $                   slarre, slarrj, slarrr, slasrt, sscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min, sqrt
 
 
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      wantz = lsame( jobz, 'V' )
      alleig = lsame( range, 'A' )
      valeig = lsame( range, 'V' )
      indeig = lsame( range, 'I' )
*
      lquery = ( ( lwork.EQ.-1 ).OR.( liwork.EQ.-1 ) )
      zquery = ( nzc.EQ.-1 )
 
*     SSTEMR needs WORK of size 6*N, IWORK of size 3*N.
*     In addition, SLARRE needs WORK of size 6*N, IWORK of size 5*N.
*     Furthermore, CLARRV needs WORK of size 12*N, IWORK of size 7*N.
      IF( wantz ) THEN
         lwmin = 18*n
         liwmin = 10*n
      ELSE
*        need less workspace if only the eigenvalues are wanted
         lwmin = 12*n
         liwmin = 8*n
      ENDIF
 
      wl = zero
      wu = zero
      iil = 0
      iiu = 0
      nsplit = 0
 
      IF( valeig ) THEN
*        We do not reference VL, VU in the cases RANGE = 'I','A'
*        The interval (WL, WU] contains all the wanted eigenvalues.
*        It is either given by the user or computed in SLARRE.
         wl = vl
         wu = vu
      ELSEIF( indeig ) THEN
*        We do not reference IL, IU in the cases RANGE = 'V','A'
         iil = il
         iiu = iu
      ENDIF
*
      info = 0
      IF( .NOT.( wantz .OR. lsame( jobz, 'N' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( alleig .OR. valeig .OR. indeig ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( valeig .AND. n.GT.0 .AND. wu.LE.wl ) THEN
         info = -7
      ELSE IF( indeig .AND. ( iil.LT.1 .OR. iil.GT.n ) ) THEN
         info = -8
      ELSE IF( indeig .AND. ( iiu.LT.iil .OR. iiu.GT.n ) ) THEN
         info = -9
      ELSE IF( ldz.LT.1 .OR. ( wantz .AND. ldz.LT.n ) ) THEN
         info = -13
      ELSE IF( lwork.LT.lwmin .AND. .NOT.lquery ) THEN
         info = -17
      ELSE IF( liwork.LT.liwmin .AND. .NOT.lquery ) THEN
         info = -19
      END IF
*
*     Get machine constants.
*
      safmin = slamch( 'Safe minimum' )
      eps = slamch( 'Precision' )
      smlnum = safmin / eps
      bignum = one / smlnum
      rmin = sqrt( smlnum )
      rmax = min( sqrt( bignum ), one / sqrt( sqrt( safmin ) ) )
*
      IF( info.EQ.0 ) THEN
         work( 1 ) = lwmin
         iwork( 1 ) = liwmin
*
         IF( wantz .AND. alleig ) THEN
            nzcmin = n
         ELSE IF( wantz .AND. valeig ) THEN
            CALL slarrc( 'T', n, vl, vu, d, e, safmin,
     $                            nzcmin, itmp, itmp2, info )
         ELSE IF( wantz .AND. indeig ) THEN
            nzcmin = iiu-iil+1
         ELSE
*           WANTZ .EQ. FALSE.
            nzcmin = 0
         ENDIF
         IF( zquery .AND. info.EQ.0 ) THEN
            z( 1,1 ) = nzcmin
         ELSE IF( nzc.LT.nzcmin .AND. .NOT.zquery ) THEN
            info = -14
         END IF
      END IF
 
      IF( info.NE.0 ) THEN
*
         CALL xerbla( 'CSTEMR', -info )
*
         RETURN
      ELSE IF( lquery .OR. zquery ) THEN
         RETURN
      END IF
*
*     Handle N = 0, 1, and 2 cases immediately
*
      m = 0
      IF( n.EQ.0 )
     $   RETURN
*
      IF( n.EQ.1 ) THEN
         IF( alleig .OR. indeig ) THEN
            m = 1
            w( 1 ) = d( 1 )
         ELSE
            IF( wl.LT.d( 1 ) .AND. wu.GE.d( 1 ) ) THEN
               m = 1
               w( 1 ) = d( 1 )
            END IF
         END IF
         IF( wantz.AND.(.NOT.zquery) ) THEN
            z( 1, 1 ) = one
            isuppz(1) = 1
            isuppz(2) = 1
         END IF
         RETURN
      END IF
*
      IF( n.EQ.2 ) THEN
         IF( .NOT.wantz ) THEN
            CALL slae2( d(1), e(1), d(2), r1, r2 )
         ELSE IF( wantz.AND.(.NOT.zquery) ) THEN
            CALL slaev2( d(1), e(1), d(2), r1, r2, cs, sn )
         END IF
         IF( alleig.OR.
     $      (valeig.AND.(r2.GT.wl).AND.
     $                  (r2.LE.wu)).OR.
     $      (indeig.AND.(iil.EQ.1)) ) THEN
            m = m+1
            w( m ) = r2
            IF( wantz.AND.(.NOT.zquery) ) THEN
               z( 1, m ) = -sn
               z( 2, m ) = cs
*              Note: At most one of SN and CS can be zero.
               IF (sn.NE.zero) THEN
                  IF (cs.NE.zero) THEN
                     isuppz(2*m-1) = 1
                     isuppz(2*m) = 2
                  ELSE
                     isuppz(2*m-1) = 1
                     isuppz(2*m) = 1
                  END IF
               ELSE
                  isuppz(2*m-1) = 2
                  isuppz(2*m) = 2
               END IF
            ENDIF
         ENDIF
         IF( alleig.OR.
     $      (valeig.AND.(r1.GT.wl).AND.
     $                  (r1.LE.wu)).OR.
     $      (indeig.AND.(iiu.EQ.2)) ) THEN
            m = m+1
            w( m ) = r1
            IF( wantz.AND.(.NOT.zquery) ) THEN
               z( 1, m ) = cs
               z( 2, m ) = sn
*              Note: At most one of SN and CS can be zero.
               IF (sn.NE.zero) THEN
                  IF (cs.NE.zero) THEN
                     isuppz(2*m-1) = 1
                     isuppz(2*m) = 2
                  ELSE
                     isuppz(2*m-1) = 1
                     isuppz(2*m) = 1
                  END IF
               ELSE
                  isuppz(2*m-1) = 2
                  isuppz(2*m) = 2
               END IF
            ENDIF
         ENDIF
      ELSE
 
*        Continue with general N
 
         indgrs = 1
         inderr = 2*n + 1
         indgp = 3*n + 1
         indd = 4*n + 1
         inde2 = 5*n + 1
         indwrk = 6*n + 1
*
         iinspl = 1
         iindbl = n + 1
         iindw = 2*n + 1
         iindwk = 3*n + 1
*
*        Scale matrix to allowable range, if necessary.
*        The allowable range is related to the PIVMIN parameter; see the
*        comments in SLARRD.  The preference for scaling small values
*        up is heuristic; we expect users' matrices not to be close to the
*        RMAX threshold.
*
         scale = one
         tnrm = slanst( 'M', n, d, e )
         IF( tnrm.GT.zero .AND. tnrm.LT.rmin ) THEN
            scale = rmin / tnrm
         ELSE IF( tnrm.GT.rmax ) THEN
            scale = rmax / tnrm
         END IF
         IF( scale.NE.one ) THEN
            CALL sscal( n, scale, d, 1 )
            CALL sscal( n-1, scale, e, 1 )
            tnrm = tnrm*scale
            IF( valeig ) THEN
*              If eigenvalues in interval have to be found,
*              scale (WL, WU] accordingly
               wl = wl*scale
               wu = wu*scale
            ENDIF
         END IF
*
*        Compute the desired eigenvalues of the tridiagonal after splitting
*        into smaller subblocks if the corresponding off-diagonal elements
*        are small
*        THRESH is the splitting parameter for SLARRE
*        A negative THRESH forces the old splitting criterion based on the
*        size of the off-diagonal. A positive THRESH switches to splitting
*        which preserves relative accuracy.
*
         IF( tryrac ) THEN
*           Test whether the matrix warrants the more expensive relative approach.
            CALL slarrr( n, d, e, iinfo )
         ELSE
*           The user does not care about relative accurately eigenvalues
            iinfo = -1
         ENDIF
*        Set the splitting criterion
         IF (iinfo.EQ.0) THEN
            thresh = eps
         ELSE
            thresh = -eps
*           relative accuracy is desired but T does not guarantee it
            tryrac = .false.
         ENDIF
*
         IF( tryrac ) THEN
*           Copy original diagonal, needed to guarantee relative accuracy
            CALL scopy(n,d,1,work(indd),1)
         ENDIF
*        Store the squares of the offdiagonal values of T
         DO 5 j = 1, n-1
            work( inde2+j-1 ) = e(j)**2
 5    CONTINUE
 
*        Set the tolerance parameters for bisection
         IF( .NOT.wantz ) THEN
*           SLARRE computes the eigenvalues to full precision.
            rtol1 = four * eps
            rtol2 = four * eps
         ELSE
*           SLARRE computes the eigenvalues to less than full precision.
*           CLARRV will refine the eigenvalue approximations, and we only
*           need less accurate initial bisection in SLARRE.
*           Note: these settings do only affect the subset case and SLARRE
            rtol1 = max( sqrt(eps)*5.0e-2, four * eps )
            rtol2 = max( sqrt(eps)*5.0e-3, four * eps )
         ENDIF
         CALL slarre( range, n, wl, wu, iil, iiu, d, e,
     $             work(inde2), rtol1, rtol2, thresh, nsplit,
     $             iwork( iinspl ), m, w, work( inderr ),
     $             work( indgp ), iwork( iindbl ),
     $             iwork( iindw ), work( indgrs ), pivmin,
     $             work( indwrk ), iwork( iindwk ), iinfo )
         IF( iinfo.NE.0 ) THEN
            info = 10 + abs( iinfo )
            RETURN
         END IF
*        Note that if RANGE .NE. 'V', SLARRE computes bounds on the desired
*        part of the spectrum. All desired eigenvalues are contained in
*        (WL,WU]
 
 
         IF( wantz ) THEN
*
*           Compute the desired eigenvectors corresponding to the computed
*           eigenvalues
*
            CALL clarrv( n, wl, wu, d, e,
     $                pivmin, iwork( iinspl ), m,
     $                1, m, minrgp, rtol1, rtol2,
     $                w, work( inderr ), work( indgp ), iwork( iindbl ),
     $                iwork( iindw ), work( indgrs ), z, ldz,
     $                isuppz, work( indwrk ), iwork( iindwk ), iinfo )
            IF( iinfo.NE.0 ) THEN
               info = 20 + abs( iinfo )
               RETURN
            END IF
         ELSE
*           SLARRE computes eigenvalues of the (shifted) root representation
*           CLARRV returns the eigenvalues of the unshifted matrix.
*           However, if the eigenvectors are not desired by the user, we need
*           to apply the corresponding shifts from SLARRE to obtain the
*           eigenvalues of the original matrix.
            DO 20 j = 1, m
               itmp = iwork( iindbl+j-1 )
               w( j ) = w( j ) + e( iwork( iinspl+itmp-1 ) )
 20      CONTINUE
         END IF
*
 
         IF ( tryrac ) THEN
*           Refine computed eigenvalues so that they are relatively accurate
*           with respect to the original matrix T.
            ibegin = 1
            wbegin = 1
            DO 39  jblk = 1, iwork( iindbl+m-1 )
               iend = iwork( iinspl+jblk-1 )
               in = iend - ibegin + 1
               wend = wbegin - 1
*              check if any eigenvalues have to be refined in this block
 36         CONTINUE
               IF( wend.LT.m ) THEN
                  IF( iwork( iindbl+wend ).EQ.jblk ) THEN
                     wend = wend + 1
                     GO TO 36
                  END IF
               END IF
               IF( wend.LT.wbegin ) THEN
                  ibegin = iend + 1
                  GO TO 39
               END IF
 
               offset = iwork(iindw+wbegin-1)-1
               ifirst = iwork(iindw+wbegin-1)
               ilast = iwork(iindw+wend-1)
               rtol2 = four * eps
               CALL slarrj( in,
     $                   work(indd+ibegin-1), work(inde2+ibegin-1),
     $                   ifirst, ilast, rtol2, offset, w(wbegin),
     $                   work( inderr+wbegin-1 ),
     $                   work( indwrk ), iwork( iindwk ), pivmin,
     $                   tnrm, iinfo )
               ibegin = iend + 1
               wbegin = wend + 1
 39      CONTINUE
         ENDIF
*
*        If matrix was scaled, then rescale eigenvalues appropriately.
*
         IF( scale.NE.one ) THEN
            CALL sscal( m, one / scale, w, 1 )
         END IF
      END IF
*
*     If eigenvalues are not in increasing order, then sort them,
*     possibly along with eigenvectors.
*
      IF( nsplit.GT.1 .OR. n.EQ.2 ) THEN
         IF( .NOT. wantz ) THEN
            CALL slasrt( 'I', m, w, iinfo )
            IF( iinfo.NE.0 ) THEN
               info = 3
               RETURN
            END IF
         ELSE
            DO 60 j = 1, m - 1
               i = 0
               tmp = w( j )
               DO 50 jj = j + 1, m
                  IF( w( jj ).LT.tmp ) THEN
                     i = jj
                     tmp = w( jj )
                  END IF
 50            CONTINUE
               IF( i.NE.0 ) THEN
                  w( i ) = w( j )
                  w( j ) = tmp
                  IF( wantz ) THEN
                     CALL cswap( n, z( 1, i ), 1, z( 1, j ), 1 )
                     itmp = isuppz( 2*i-1 )
                     isuppz( 2*i-1 ) = isuppz( 2*j-1 )
                     isuppz( 2*j-1 ) = itmp
                     itmp = isuppz( 2*i )
                     isuppz( 2*i ) = isuppz( 2*j )
                     isuppz( 2*j ) = itmp
                  END IF
               END IF
 60         CONTINUE
         END IF
      ENDIF
*
*
      work( 1 ) = lwmin
      iwork( 1 ) = liwmin
      RETURN
*
*     End of CSTEMR
*

◆ csteqr()

subroutine csteqr	(	character	compz,
		integer	n,
		real, dimension( * )	d,
		real, dimension( * )	e,
		complex, dimension( ldz, * )	z,
		integer	ldz,
		real, dimension( * )	work,
		integer	info )

CSTEQR

Download CSTEQR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CSTEQR computes all eigenvalues and, optionally, eigenvectors of a
!> symmetric tridiagonal matrix using the implicit QL or QR method.
!> The eigenvectors of a full or band complex Hermitian matrix can also
!> be found if CHETRD or CHPTRD or CHBTRD has been used to reduce this
!> matrix to tridiagonal form.
!>

Parameters

[in]	COMPZ	!> COMPZ is CHARACTER*1 !> = 'N': Compute eigenvalues only. !> = 'V': Compute eigenvalues and eigenvectors of the original !> Hermitian matrix. On entry, Z must contain the !> unitary matrix used to reduce the original matrix !> to tridiagonal form. !> = 'I': Compute eigenvalues and eigenvectors of the !> tridiagonal matrix. Z is initialized to the identity !> matrix. !>
[in]	N	!> N is INTEGER !> The order of the matrix. N >= 0. !>
[in,out]	D	!> D is REAL array, dimension (N) !> On entry, the diagonal elements of the tridiagonal matrix. !> On exit, if INFO = 0, the eigenvalues in ascending order. !>
[in,out]	E	!> E is REAL array, dimension (N-1) !> On entry, the (n-1) subdiagonal elements of the tridiagonal !> matrix. !> On exit, E has been destroyed. !>
[in,out]	Z	!> Z is COMPLEX array, dimension (LDZ, N) !> On entry, if COMPZ = 'V', then Z contains the unitary !> matrix used in the reduction to tridiagonal form. !> On exit, if INFO = 0, then if COMPZ = 'V', Z contains the !> orthonormal eigenvectors of the original Hermitian matrix, !> and if COMPZ = 'I', Z contains the orthonormal eigenvectors !> of the symmetric tridiagonal matrix. !> If COMPZ = 'N', then Z is not referenced. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. LDZ >= 1, and if !> eigenvectors are desired, then LDZ >= max(1,N). !>
[out]	WORK	!> WORK is REAL array, dimension (max(1,2*N-2)) !> If COMPZ = 'N', then WORK is not referenced. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: the algorithm has failed to find all the eigenvalues in !> a total of 30*N iterations; if INFO = i, then i !> elements of E have not converged to zero; on exit, D !> and E contain the elements of a symmetric tridiagonal !> matrix which is unitarily similar to the original !> matrix. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 131 of file csteqr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Implementation overview
*     -----------------------
*     ICOMPZ encodes COMPZ: 0 = 'N', 1 = 'V', 2 = 'I', -1 = invalid.
*     The tridiagonal matrix is processed one unreduced block at a
*     time (label 10 finds the next block).  A block whose norm lies
*     above SSFMAX or below SSFMIN is rescaled to that threshold;
*     LSV and LENDSV remember the block bounds so that the scaling
*     can be undone at label 140 after L and LEND have been modified.
*     Each block is then diagonalized by implicit QL (LEND > L) or
*     QR (LEND < L) sweeps.  JTOT counts sweeps over all blocks and
*     is bounded by NMAXIT = N*MAXIT.  When eigenvectors are wanted,
*     the rotation cosines of a sweep are saved in WORK(1:N-1) and
*     the sines in WORK(N:2*N-2) and applied to Z with CLASR.
*     Label 160 finally sorts the eigenvalues (and the columns of Z)
*     into ascending order.
*
*     .. Scalar Arguments ..
      CHARACTER          COMPZ
      INTEGER            INFO, LDZ, N
*     ..
*     .. Array Arguments ..
      REAL               D( * ), E( * ), WORK( * )
      COMPLEX            Z( LDZ, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE, TWO, THREE
      parameter( zero = 0.0e0, one = 1.0e0, two = 2.0e0,
     $                   three = 3.0e0 )
      COMPLEX            CZERO, CONE
      parameter( czero = ( 0.0e0, 0.0e0 ),
     $                   cone = ( 1.0e0, 0.0e0 ) )
      INTEGER            MAXIT
      parameter( maxit = 30 )
*     ..
*     .. Local Scalars ..
      INTEGER            I, ICOMPZ, II, ISCALE, J, JTOT, K, L, L1, LEND,
     $                   LENDM1, LENDP1, LENDSV, LM1, LSV, M, MM, MM1,
     $                   NM1, NMAXIT
      REAL               ANORM, B, C, EPS, EPS2, F, G, P, R, RT1, RT2,
     $                   S, SAFMAX, SAFMIN, SSFMAX, SSFMIN, TST
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SLAMCH, SLANST, SLAPY2
      EXTERNAL           lsame, slamch, slanst, slapy2
*     ..
*     .. External Subroutines ..
      EXTERNAL           claset, clasr, cswap, slae2, slaev2, slartg,
     $                   slascl, slasrt, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, sign, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
      IF( lsame( compz, 'N' ) ) THEN
         icompz = 0
      ELSE IF( lsame( compz, 'V' ) ) THEN
         icompz = 1
      ELSE IF( lsame( compz, 'I' ) ) THEN
         icompz = 2
      ELSE
         icompz = -1
      END IF
      IF( icompz.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ( ldz.LT.1 ) .OR. ( icompz.GT.0 .AND. ldz.LT.max( 1,
     $         n ) ) ) THEN
         info = -6
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CSTEQR', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
      IF( n.EQ.1 ) THEN
         IF( icompz.EQ.2 )
     $      z( 1, 1 ) = cone
         RETURN
      END IF
*
*     Determine the unit roundoff and over/underflow thresholds.
*
      eps = slamch( 'E' )
      eps2 = eps**2
      safmin = slamch( 'S' )
      safmax = one / safmin
      ssfmax = sqrt( safmax ) / three
      ssfmin = sqrt( safmin ) / eps2
*
*     Compute the eigenvalues and eigenvectors of the tridiagonal
*     matrix.
*
      IF( icompz.EQ.2 )
     $   CALL claset( 'Full', n, n, czero, cone, z, ldz )
*
      nmaxit = n*maxit
      jtot = 0
*
*     Determine where the matrix splits and choose QL or QR iteration
*     for each block, according to whether top or bottom diagonal
*     element is smaller.
*
      l1 = 1
      nm1 = n - 1
*
*     Label 10: start of the next block, which begins at row L1.
*
   10 CONTINUE
      IF( l1.GT.n )
     $   GO TO 160
      IF( l1.GT.1 )
     $   e( l1-1 ) = zero
      IF( l1.LE.nm1 ) THEN
         DO 20 m = l1, nm1
            tst = abs( e( m ) )
            IF( tst.EQ.zero )
     $         GO TO 30
            IF( tst.LE.( sqrt( abs( d( m ) ) )*sqrt( abs( d( m+
     $          1 ) ) ) )*eps ) THEN
               e( m ) = zero
               GO TO 30
            END IF
   20    CONTINUE
      END IF
      m = n
*
*     Label 30: the block occupies rows L1..M.  Save its bounds and
*     advance L1 past it; a 1-by-1 block needs no work.
*
   30 CONTINUE
      l = l1
      lsv = l
      lend = m
      lendsv = lend
      l1 = m + 1
      IF( lend.EQ.l )
     $   GO TO 10
*
*     Scale submatrix in rows and columns L to LEND
*
      anorm = slanst( 'I', lend-l+1, d( l ), e( l ) )
      iscale = 0
      IF( anorm.EQ.zero )
     $   GO TO 10
      IF( anorm.GT.ssfmax ) THEN
         iscale = 1
         CALL slascl( 'G', 0, 0, anorm, ssfmax, lend-l+1, 1, d( l ), n,
     $                info )
         CALL slascl( 'G', 0, 0, anorm, ssfmax, lend-l, 1, e( l ), n,
     $                info )
      ELSE IF( anorm.LT.ssfmin ) THEN
         iscale = 2
         CALL slascl( 'G', 0, 0, anorm, ssfmin, lend-l+1, 1, d( l ), n,
     $                info )
         CALL slascl( 'G', 0, 0, anorm, ssfmin, lend-l, 1, e( l ), n,
     $                info )
      END IF
*
*     Choose between QL and QR iteration
*     (swapping L and LEND selects the QR branch below)
*
      IF( abs( d( lend ) ).LT.abs( d( l ) ) ) THEN
         lend = lsv
         l = lendsv
      END IF
*
      IF( lend.GT.l ) THEN
*
*        QL Iteration
*
*        Look for small subdiagonal element.
*
   40    CONTINUE
         IF( l.NE.lend ) THEN
            lendm1 = lend - 1
            DO 50 m = l, lendm1
               tst = abs( e( m ) )**2
               IF( tst.LE.( eps2*abs( d( m ) ) )*abs( d( m+1 ) )+
     $             safmin )GO TO 60
   50       CONTINUE
         END IF
*
         m = lend
*
   60    CONTINUE
         IF( m.LT.lend )
     $      e( m ) = zero
         p = d( l )
         IF( m.EQ.l )
     $      GO TO 80
*
*        If remaining matrix is 2-by-2, use SLAE2 or SLAEV2
*        to compute its eigensystem.
*
         IF( m.EQ.l+1 ) THEN
            IF( icompz.GT.0 ) THEN
               CALL slaev2( d( l ), e( l ), d( l+1 ), rt1, rt2, c, s )
               work( l ) = c
               work( n-1+l ) = s
               CALL clasr( 'R', 'V', 'B', n, 2, work( l ),
     $                     work( n-1+l ), z( 1, l ), ldz )
            ELSE
               CALL slae2( d( l ), e( l ), d( l+1 ), rt1, rt2 )
            END IF
            d( l ) = rt1
            d( l+1 ) = rt2
            e( l ) = zero
            l = l + 2
            IF( l.LE.lend )
     $         GO TO 40
            GO TO 140
         END IF
*
*        Give up on this block once the global sweep budget is spent.
*
         IF( jtot.EQ.nmaxit )
     $      GO TO 140
         jtot = jtot + 1
*
*        Form shift.
*
         g = ( d( l+1 )-p ) / ( two*e( l ) )
         r = slapy2( g, one )
         g = d( m ) - p + ( e( l ) / ( g+sign( r, g ) ) )
*
         s = one
         c = one
         p = zero
*
*        Inner loop
*
         mm1 = m - 1
         DO 70 i = mm1, l, -1
            f = s*e( i )
            b = c*e( i )
            CALL slartg( g, f, c, s, r )
            IF( i.NE.m-1 )
     $         e( i+1 ) = r
            g = d( i+1 ) - p
            r = ( d( i )-g )*s + two*c*b
            p = s*r
            d( i+1 ) = g + p
            g = c*r - b
*
*           If eigenvectors are desired, then save rotations.
*
            IF( icompz.GT.0 ) THEN
               work( i ) = c
               work( n-1+i ) = -s
            END IF
*
   70    CONTINUE
*
*        If eigenvectors are desired, then apply saved rotations.
*
         IF( icompz.GT.0 ) THEN
            mm = m - l + 1
            CALL clasr( 'R', 'V', 'B', n, mm, work( l ), work( n-1+l ),
     $                  z( 1, l ), ldz )
         END IF
*
         d( l ) = d( l ) - p
         e( l ) = g
         GO TO 40
*
*        Eigenvalue found.
*
   80    CONTINUE
         d( l ) = p
*
         l = l + 1
         IF( l.LE.lend )
     $      GO TO 40
         GO TO 140
*
      ELSE
*
*        QR Iteration
*
*        Look for small superdiagonal element.
*
   90    CONTINUE
         IF( l.NE.lend ) THEN
            lendp1 = lend + 1
            DO 100 m = l, lendp1, -1
               tst = abs( e( m-1 ) )**2
               IF( tst.LE.( eps2*abs( d( m ) ) )*abs( d( m-1 ) )+
     $             safmin )GO TO 110
  100       CONTINUE
         END IF
*
         m = lend
*
  110    CONTINUE
         IF( m.GT.lend )
     $      e( m-1 ) = zero
         p = d( l )
         IF( m.EQ.l )
     $      GO TO 130
*
*        If remaining matrix is 2-by-2, use SLAE2 or SLAEV2
*        to compute its eigensystem.
*
         IF( m.EQ.l-1 ) THEN
            IF( icompz.GT.0 ) THEN
               CALL slaev2( d( l-1 ), e( l-1 ), d( l ), rt1, rt2, c, s )
               work( m ) = c
               work( n-1+m ) = s
               CALL clasr( 'R', 'V', 'F', n, 2, work( m ),
     $                     work( n-1+m ), z( 1, l-1 ), ldz )
            ELSE
               CALL slae2( d( l-1 ), e( l-1 ), d( l ), rt1, rt2 )
            END IF
            d( l-1 ) = rt1
            d( l ) = rt2
            e( l-1 ) = zero
            l = l - 2
            IF( l.GE.lend )
     $         GO TO 90
            GO TO 140
         END IF
*
*        Give up on this block once the global sweep budget is spent.
*
         IF( jtot.EQ.nmaxit )
     $      GO TO 140
         jtot = jtot + 1
*
*        Form shift.
*
         g = ( d( l-1 )-p ) / ( two*e( l-1 ) )
         r = slapy2( g, one )
         g = d( m ) - p + ( e( l-1 ) / ( g+sign( r, g ) ) )
*
         s = one
         c = one
         p = zero
*
*        Inner loop
*
         lm1 = l - 1
         DO 120 i = m, lm1
            f = s*e( i )
            b = c*e( i )
            CALL slartg( g, f, c, s, r )
            IF( i.NE.m )
     $         e( i-1 ) = r
            g = d( i ) - p
            r = ( d( i+1 )-g )*s + two*c*b
            p = s*r
            d( i ) = g + p
            g = c*r - b
*
*           If eigenvectors are desired, then save rotations.
*
            IF( icompz.GT.0 ) THEN
               work( i ) = c
               work( n-1+i ) = s
            END IF
*
  120    CONTINUE
*
*        If eigenvectors are desired, then apply saved rotations.
*
         IF( icompz.GT.0 ) THEN
            mm = l - m + 1
            CALL clasr( 'R', 'V', 'F', n, mm, work( m ), work( n-1+m ),
     $                  z( 1, m ), ldz )
         END IF
*
         d( l ) = d( l ) - p
         e( lm1 ) = g
         GO TO 90
*
*        Eigenvalue found.
*
  130    CONTINUE
         d( l ) = p
*
         l = l - 1
         IF( l.GE.lend )
     $      GO TO 90
         GO TO 140
*
      END IF
*
*     Undo scaling if necessary
*     (uses the saved bounds LSV..LENDSV of the block just processed)
*
  140 CONTINUE
      IF( iscale.EQ.1 ) THEN
         CALL slascl( 'G', 0, 0, ssfmax, anorm, lendsv-lsv+1, 1,
     $                d( lsv ), n, info )
         CALL slascl( 'G', 0, 0, ssfmax, anorm, lendsv-lsv, 1, e( lsv ),
     $                n, info )
      ELSE IF( iscale.EQ.2 ) THEN
         CALL slascl( 'G', 0, 0, ssfmin, anorm, lendsv-lsv+1, 1,
     $                d( lsv ), n, info )
         CALL slascl( 'G', 0, 0, ssfmin, anorm, lendsv-lsv, 1, e( lsv ),
     $                n, info )
      END IF
*
*     Check for no convergence to an eigenvalue after a total
*     of N*MAXIT iterations.
*
*     INFO counts the off-diagonal elements that are still nonzero.
*     Return early only if some remain.  If the budget ran out on
*     the very sweep that completed convergence, every E(I) is zero
*     and INFO stays 0; control must then still reach label 160 so
*     that the eigenvalues (and eigenvectors) are ordered, as the
*     INFO = 0 exit promises.  With all E(I) zero every remaining
*     block is 1-by-1, so label 10 runs straight through to 160
*     without starting another sweep.
*
      IF( jtot.EQ.nmaxit ) THEN
         DO 150 i = 1, n - 1
            IF( e( i ).NE.zero )
     $         info = info + 1
  150    CONTINUE
         IF( info.NE.0 )
     $      RETURN
      END IF
      GO TO 10
*
*     Order eigenvalues and eigenvectors.
*
  160 CONTINUE
      IF( icompz.EQ.0 ) THEN
*
*        Use Quick Sort
*
         CALL slasrt( 'I', n, d, info )
*
      ELSE
*
*        Use Selection Sort to minimize swaps of eigenvectors
*
         DO 180 ii = 2, n
            i = ii - 1
            k = i
            p = d( i )
            DO 170 j = ii, n
               IF( d( j ).LT.p ) THEN
                  k = j
                  p = d( j )
               END IF
  170       CONTINUE
            IF( k.NE.i ) THEN
               d( k ) = d( i )
               d( i ) = p
               CALL cswap( n, z( 1, i ), 1, z( 1, k ), 1 )
            END IF
  180    CONTINUE
      END IF
      RETURN
*
*     End of CSTEQR
*

◆ ctbcon()

subroutine ctbcon	(	character	norm,
		character	uplo,
		character	diag,
		integer	n,
		integer	kd,
		complex, dimension( ldab, * )	ab,
		integer	ldab,
		real	rcond,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CTBCON

Download CTBCON + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTBCON estimates the reciprocal of the condition number of a
!> triangular band matrix A, in either the 1-norm or the infinity-norm.
!>
!> The norm of A is computed and an estimate is obtained for
!> norm(inv(A)), then the reciprocal of the condition number is
!> computed as
!>    RCOND = 1 / ( norm(A) * norm(inv(A)) ).
!>

Parameters

[in]	NORM	!> NORM is CHARACTER*1 !> Specifies whether the 1-norm condition number or the !> infinity-norm condition number is required: !> = '1' or 'O': 1-norm; !> = 'I': Infinity-norm. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> = 'N': A is non-unit triangular; !> = 'U': A is unit triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of superdiagonals or subdiagonals of the !> triangular band matrix A. KD >= 0. !>
[in]	AB	!> AB is COMPLEX array, dimension (LDAB,N) !> The upper or lower triangular band matrix A, stored in the !> first kd+1 rows of the array. The j-th column of A is stored !> in the j-th column of the array AB as follows: !> if UPLO = 'U', AB(kd+1+i-j,j) = A(i,j) for max(1,j-kd)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+kd). !> If DIAG = 'U', the diagonal elements of A are not referenced !> and are assumed to be 1. !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[out]	RCOND	!> RCOND is REAL !> The reciprocal of the condition number of the matrix A, !> computed as RCOND = 1/(norm(A) * norm(inv(A))). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 141 of file ctbcon.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Outline: ANORM = norm(A) is obtained from CLANTB, an estimate
*     AINVNM of norm(inv(A)) is built by the CLACN2 reverse-
*     communication loop (each requested product with inv(A) or
*     inv(A**H) is formed by CLATBS), and the result is
*     RCOND = ( 1 / ANORM ) / AINVNM.
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, NORM, UPLO
      INTEGER            INFO, KD, LDAB, N
      REAL               RCOND
*     ..
*     .. Array Arguments ..
      REAL               RWORK( * )
      COMPLEX            AB( LDAB, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      parameter( one = 1.0e+0, zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            NOUNIT, ONENRM, UPPER
      CHARACTER          NORMIN
      INTEGER            IMAX, KASE, KASEA
      REAL               AINVNM, ANORM, SCALE, SMLNUM, XNORM
      COMPLEX            ZDUM
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ICAMAX
      REAL               CLANTB, SLAMCH
      EXTERNAL           lsame, icamax, clantb, slamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           clacn2, clatbs, csrscl, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, real
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
      cabs1( zdum ) = abs( real( zdum ) ) + abs( aimag( zdum ) )
*     ..
*     .. Executable Statements ..
*
*     Decode the option characters.
*
      upper = lsame( uplo, 'U' )
      onenrm = norm.EQ.'1' .OR. lsame( norm, 'O' )
      nounit = lsame( diag, 'N' )
*
*     Validate the arguments.  The tests run from the last argument
*     back to the first, each overriding the previous result, so the
*     earliest offending argument is the one left in INFO.
*
      info = 0
      IF( ldab.LT.kd+1 )
     $   info = -7
      IF( kd.LT.0 )
     $   info = -5
      IF( n.LT.0 )
     $   info = -4
      IF( .NOT.( nounit .OR. lsame( diag, 'U' ) ) )
     $   info = -3
      IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) )
     $   info = -2
      IF( .NOT.( onenrm .OR. lsame( norm, 'I' ) ) )
     $   info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTBCON', -info )
         RETURN
      END IF
*
*     For N = 0 report RCOND = 1 and return at once.
*
      IF( n.EQ.0 ) THEN
         rcond = one
         RETURN
      END IF
*
      rcond = zero
      smlnum = slamch( 'Safe minimum' )*real( max( n, 1 ) )
*
*     Norm of the triangular band matrix in the norm chosen by NORM.
*
      anorm = clantb( norm, uplo, diag, n, kd, ab, ldab, rwork )
*
*     Go on only if ANORM > 0; otherwise RCOND is returned as zero.
*
      IF( .NOT.( anorm.GT.zero ) )
     $   RETURN
*
*     KASEA is the CLACN2 request code that is answered with inv(A);
*     any other nonzero request is answered with inv(A**H).
*
      kasea = 2
      IF( onenrm )
     $   kasea = 1
      ainvnm = zero
      normin = 'N'
      kase = 0
*
*     Estimate the norm of inv(A).  The loop is left through
*     label 20 when CLACN2 hands back KASE = 0.
*
   10 CONTINUE
      CALL clacn2( n, work( n+1 ), work, ainvnm, kase, isave )
      IF( kase.EQ.0 )
     $   GO TO 20
*
      IF( kase.NE.kasea ) THEN
*
*        Multiply by inv(A**H).
*
         CALL clatbs( uplo, 'Conjugate transpose', diag, normin,
     $                n, kd, ab, ldab, work, scale, rwork, info )
      ELSE
*
*        Multiply by inv(A).
*
         CALL clatbs( uplo, 'No transpose', diag, normin, n, kd,
     $                ab, ldab, work, scale, rwork, info )
      END IF
      normin = 'Y'
*
*     Multiply by 1/SCALE if doing so will not cause overflow;
*     otherwise stop here, leaving RCOND at zero.
*
      IF( scale.NE.one ) THEN
         imax = icamax( n, work, 1 )
         xnorm = cabs1( work( imax ) )
         IF( scale.LT.xnorm*smlnum .OR. scale.EQ.zero )
     $      RETURN
         CALL csrscl( n, scale, work, 1 )
      END IF
      GO TO 10
*
*     Compute the estimate of the reciprocal condition number.
*
   20 CONTINUE
      IF( ainvnm.NE.zero )
     $   rcond = ( one / anorm ) / ainvnm
      RETURN
*
*     End of CTBCON
*

◆ ctbrfs()

subroutine ctbrfs	(	character	uplo,
		character	trans,
		character	diag,
		integer	n,
		integer	kd,
		integer	nrhs,
		complex, dimension( ldab, * )	ab,
		integer	ldab,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldx, * )	x,
		integer	ldx,
		real, dimension( * )	ferr,
		real, dimension( * )	berr,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CTBRFS

Download CTBRFS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTBRFS provides error bounds and backward error estimates for the
!> solution to a system of linear equations with a triangular band
!> coefficient matrix.
!>
!> The solution matrix X must be computed by CTBTRS or some other
!> means before entering this routine.  CTBRFS does not do iterative
!> refinement because doing so cannot improve the backward error.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> Specifies the form of the system of equations: !> = 'N': A * X = B (No transpose) !> = 'T': A**T * X = B (Transpose) !> = 'C': A**H * X = B (Conjugate transpose) !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> = 'N': A is non-unit triangular; !> = 'U': A is unit triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of superdiagonals or subdiagonals of the !> triangular band matrix A. KD >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrices B and X. NRHS >= 0. !>
[in]	AB	!> AB is COMPLEX array, dimension (LDAB,N) !> The upper or lower triangular band matrix A, stored in the !> first kd+1 rows of the array. The j-th column of A is stored !> in the j-th column of the array AB as follows: !> if UPLO = 'U', AB(kd+1+i-j,j) = A(i,j) for max(1,j-kd)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+kd). !> If DIAG = 'U', the diagonal elements of A are not referenced !> and are assumed to be 1. !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[in]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> The right hand side matrix B. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[in]	X	!> X is COMPLEX array, dimension (LDX,NRHS) !> The solution matrix X. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the array X. LDX >= max(1,N). !>
[out]	FERR	!> FERR is REAL array, dimension (NRHS) !> The estimated forward error bound for each solution vector !> X(j) (the j-th column of the solution matrix X). !> If XTRUE is the true solution corresponding to X(j), FERR(j) !> is an estimated upper bound for the magnitude of the largest !> element in (X(j) - XTRUE) divided by the magnitude of the !> largest element in X(j). The estimate is as reliable as !> the estimate for RCOND, and is almost always a slight !> overestimate of the true error. !>
[out]	BERR	!> BERR is REAL array, dimension (NRHS) !> The componentwise relative backward error of each solution !> vector X(j) (i.e., the smallest relative change in !> any element of A or B that makes X(j) an exact solution). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 186 of file ctbrfs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, TRANS, UPLO
      INTEGER            INFO, KD, LDAB, LDB, LDX, N, NRHS
*     ..
*     .. Array Arguments ..
      REAL               BERR( * ), FERR( * ), RWORK( * )
      COMPLEX            AB( LDAB, * ), B( LDB, * ), WORK( * ),
     $                   X( LDX, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO
      parameter( zero = 0.0e+0 )
      COMPLEX            ONE
      parameter( one = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            NOTRAN, NOUNIT, UPPER
      CHARACTER          TRANSN, TRANST
      INTEGER            I, J, K, KASE, NZ
      REAL               EPS, LSTRES, S, SAFE1, SAFE2, SAFMIN, XK
      COMPLEX            ZDUM
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           caxpy, ccopy, clacn2, ctbmv, ctbsv, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, min, real
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SLAMCH
      EXTERNAL           lsame, slamch
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
      cabs1( zdum ) = abs( real( zdum ) ) + abs( aimag( zdum ) )
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      upper = lsame( uplo, 'U' )
      notran = lsame( trans, 'N' )
      nounit = lsame( diag, 'N' )
*
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'T' ) .AND. .NOT.
     $         lsame( trans, 'C' ) ) THEN
         info = -2
      ELSE IF( .NOT.nounit .AND. .NOT.lsame( diag, 'U' ) ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( kd.LT.0 ) THEN
         info = -5
      ELSE IF( nrhs.LT.0 ) THEN
         info = -6
      ELSE IF( ldab.LT.kd+1 ) THEN
         info = -8
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -10
      ELSE IF( ldx.LT.max( 1, n ) ) THEN
         info = -12
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTBRFS', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 .OR. nrhs.EQ.0 ) THEN
         DO 10 j = 1, nrhs
            ferr( j ) = zero
            berr( j ) = zero
   10    CONTINUE
         RETURN
      END IF
*
      IF( notran ) THEN
         transn = 'N'
         transt = 'C'
      ELSE
         transn = 'C'
         transt = 'N'
      END IF
*
*     NZ = maximum number of nonzero elements in each row of A, plus 1
*
      nz = kd + 2
      eps = slamch( 'Epsilon' )
      safmin = slamch( 'Safe minimum' )
      safe1 = nz*safmin
      safe2 = safe1 / eps
*
*     Do for each right hand side
*
      DO 250 j = 1, nrhs
*
*        Compute residual R = B - op(A) * X,
*        where op(A) = A, A**T, or A**H, depending on TRANS.
*
         CALL ccopy( n, x( 1, j ), 1, work, 1 )
         CALL ctbmv( uplo, trans, diag, n, kd, ab, ldab, work, 1 )
         CALL caxpy( n, -one, b( 1, j ), 1, work, 1 )
*
*        Compute componentwise relative backward error from formula
*
*        max(i) ( abs(R(i)) / ( abs(op(A))*abs(X) + abs(B) )(i) )
*
*        where abs(Z) is the componentwise absolute value of the matrix
*        or vector Z.  If the i-th component of the denominator is less
*        than SAFE2, then SAFE1 is added to the i-th components of the
*        numerator and denominator before dividing.
*
         DO 20 i = 1, n
            rwork( i ) = cabs1( b( i, j ) )
   20    CONTINUE
*
         IF( notran ) THEN
*
*           Compute abs(A)*abs(X) + abs(B).
*
            IF( upper ) THEN
               IF( nounit ) THEN
                  DO 40 k = 1, n
                     xk = cabs1( x( k, j ) )
                     DO 30 i = max( 1, k-kd ), k
                        rwork( i ) = rwork( i ) +
     $                               cabs1( ab( kd+1+i-k, k ) )*xk
   30                CONTINUE
   40             CONTINUE
               ELSE
                  DO 60 k = 1, n
                     xk = cabs1( x( k, j ) )
                     DO 50 i = max( 1, k-kd ), k - 1
                        rwork( i ) = rwork( i ) +
     $                               cabs1( ab( kd+1+i-k, k ) )*xk
   50                CONTINUE
                     rwork( k ) = rwork( k ) + xk
   60             CONTINUE
               END IF
            ELSE
               IF( nounit ) THEN
                  DO 80 k = 1, n
                     xk = cabs1( x( k, j ) )
                     DO 70 i = k, min( n, k+kd )
                        rwork( i ) = rwork( i ) +
     $                               cabs1( ab( 1+i-k, k ) )*xk
   70                CONTINUE
   80             CONTINUE
               ELSE
                  DO 100 k = 1, n
                     xk = cabs1( x( k, j ) )
                     DO 90 i = k + 1, min( n, k+kd )
                        rwork( i ) = rwork( i ) +
     $                               cabs1( ab( 1+i-k, k ) )*xk
   90                CONTINUE
                     rwork( k ) = rwork( k ) + xk
  100             CONTINUE
               END IF
            END IF
         ELSE
*
*           Compute abs(A**H)*abs(X) + abs(B).
*
            IF( upper ) THEN
               IF( nounit ) THEN
                  DO 120 k = 1, n
                     s = zero
                     DO 110 i = max( 1, k-kd ), k
                        s = s + cabs1( ab( kd+1+i-k, k ) )*
     $                      cabs1( x( i, j ) )
  110                CONTINUE
                     rwork( k ) = rwork( k ) + s
  120             CONTINUE
               ELSE
                  DO 140 k = 1, n
                     s = cabs1( x( k, j ) )
                     DO 130 i = max( 1, k-kd ), k - 1
                        s = s + cabs1( ab( kd+1+i-k, k ) )*
     $                      cabs1( x( i, j ) )
  130                CONTINUE
                     rwork( k ) = rwork( k ) + s
  140             CONTINUE
               END IF
            ELSE
               IF( nounit ) THEN
                  DO 160 k = 1, n
                     s = zero
                     DO 150 i = k, min( n, k+kd )
                        s = s + cabs1( ab( 1+i-k, k ) )*
     $                      cabs1( x( i, j ) )
  150                CONTINUE
                     rwork( k ) = rwork( k ) + s
  160             CONTINUE
               ELSE
                  DO 180 k = 1, n
                     s = cabs1( x( k, j ) )
                     DO 170 i = k + 1, min( n, k+kd )
                        s = s + cabs1( ab( 1+i-k, k ) )*
     $                      cabs1( x( i, j ) )
  170                CONTINUE
                     rwork( k ) = rwork( k ) + s
  180             CONTINUE
               END IF
            END IF
         END IF
         s = zero
         DO 190 i = 1, n
            IF( rwork( i ).GT.safe2 ) THEN
               s = max( s, cabs1( work( i ) ) / rwork( i ) )
            ELSE
               s = max( s, ( cabs1( work( i ) )+safe1 ) /
     $             ( rwork( i )+safe1 ) )
            END IF
  190    CONTINUE
         berr( j ) = s
*
*        Bound error from formula
*
*        norm(X - XTRUE) / norm(X) .le. FERR =
*        norm( abs(inv(op(A)))*
*           ( abs(R) + NZ*EPS*( abs(op(A))*abs(X)+abs(B) ))) / norm(X)
*
*        where
*          norm(Z) is the magnitude of the largest component of Z
*          inv(op(A)) is the inverse of op(A)
*          abs(Z) is the componentwise absolute value of the matrix or
*             vector Z
*          NZ is the maximum number of nonzeros in any row of A, plus 1
*          EPS is machine epsilon
*
*        The i-th component of abs(R)+NZ*EPS*(abs(op(A))*abs(X)+abs(B))
*        is incremented by SAFE1 if the i-th component of
*        abs(op(A))*abs(X) + abs(B) is less than SAFE2.
*
*        Use CLACN2 to estimate the infinity-norm of the matrix
*           inv(op(A)) * diag(W),
*        where W = abs(R) + NZ*EPS*( abs(op(A))*abs(X)+abs(B) )))
*
         DO 200 i = 1, n
            IF( rwork( i ).GT.safe2 ) THEN
               rwork( i ) = cabs1( work( i ) ) + nz*eps*rwork( i )
            ELSE
               rwork( i ) = cabs1( work( i ) ) + nz*eps*rwork( i ) +
     $                      safe1
            END IF
  200    CONTINUE
*
         kase = 0
  210    CONTINUE
         CALL clacn2( n, work( n+1 ), work, ferr( j ), kase, isave )
         IF( kase.NE.0 ) THEN
            IF( kase.EQ.1 ) THEN
*
*              Multiply by diag(W)*inv(op(A)**H).
*
               CALL ctbsv( uplo, transt, diag, n, kd, ab, ldab, work,
     $                     1 )
               DO 220 i = 1, n
                  work( i ) = rwork( i )*work( i )
  220          CONTINUE
            ELSE
*
*              Multiply by inv(op(A))*diag(W).
*
               DO 230 i = 1, n
                  work( i ) = rwork( i )*work( i )
  230          CONTINUE
               CALL ctbsv( uplo, transn, diag, n, kd, ab, ldab, work,
     $                     1 )
            END IF
            GO TO 210
         END IF
*
*        Normalize error.
*
         lstres = zero
         DO 240 i = 1, n
            lstres = max( lstres, cabs1( x( i, j ) ) )
  240    CONTINUE
         IF( lstres.NE.zero )
     $      ferr( j ) = ferr( j ) / lstres
*
  250 CONTINUE
*
      RETURN
*
*     End of CTBRFS
*

◆ ctbtrs()

subroutine ctbtrs	(	character	uplo,
		character	trans,
		character	diag,
		integer	n,
		integer	kd,
		integer	nrhs,
		complex, dimension( ldab, * )	ab,
		integer	ldab,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		integer	info )

CTBTRS

Download CTBTRS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTBTRS solves a triangular system of the form
!>
!>    A * X = B,  A**T * X = B,  or  A**H * X = B,
!>
!> where A is a triangular band matrix of order N, and B is an
!> N-by-NRHS matrix.  A check is made to verify that A is nonsingular.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> Specifies the form of the system of equations: !> = 'N': A * X = B (No transpose) !> = 'T': A**T * X = B (Transpose) !> = 'C': A**H * X = B (Conjugate transpose) !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> = 'N': A is non-unit triangular; !> = 'U': A is unit triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of superdiagonals or subdiagonals of the !> triangular band matrix A. KD >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrix B. NRHS >= 0. !>
[in]	AB	!> AB is COMPLEX array, dimension (LDAB,N) !> The upper or lower triangular band matrix A, stored in the !> first kd+1 rows of AB. The j-th column of A is stored !> in the j-th column of the array AB as follows: !> if UPLO = 'U', AB(kd+1+i-j,j) = A(i,j) for max(1,j-kd)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+kd). !> If DIAG = 'U', the diagonal elements of A are not referenced !> and are assumed to be 1. !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> On entry, the right hand side matrix B. !> On exit, if INFO = 0, the solution matrix X. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, the i-th diagonal element of A is zero, !> indicating that the matrix is singular and the !> solutions X have not been computed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 144 of file ctbtrs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, TRANS, UPLO
      INTEGER            INFO, KD, LDAB, LDB, N, NRHS
*     ..
*     .. Array Arguments ..
      COMPLEX            AB( LDAB, * ), B( LDB, * )
*     ..
*
*  =====================================================================
*
*  Body of CTBTRS.  The arguments are validated first; for a non-unit
*  triangular band matrix the stored diagonal is then scanned for an
*  exactly-zero entry, and finally each column of B is overwritten
*  with the solution of the banded triangular system by CTBSV.
*
*  INFO on exit:
*     = 0  all checks passed and every column was handed to CTBSV
*     < 0  INFO = -i, the i-th argument is illegal (XERBLA is called)
*     > 0  INFO = i, the i-th diagonal element of A is exactly zero;
*          the routine returns before any solve is attempted
*
*     .. Parameters ..
      COMPLEX            CZERO
      PARAMETER          ( CZERO = ( 0.0E+0, 0.0E+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            DIAGOK, NOUNIT, TRNSOK, UPLOOK, UPPER
      INTEGER            IDIAG, JCOL, JRHS
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           LSAME
*     ..
*     .. External Subroutines ..
      EXTERNAL           CTBSV, XERBLA
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX
*     ..
*     .. Executable Statements ..
*
*     Decode the option characters once and record their validity.
*
      UPPER = LSAME( UPLO, 'U' )
      NOUNIT = LSAME( DIAG, 'N' )
      UPLOOK = UPPER .OR. LSAME( UPLO, 'L' )
      TRNSOK = LSAME( TRANS, 'N' ) .OR. LSAME( TRANS, 'T' ) .OR.
     $         LSAME( TRANS, 'C' )
      DIAGOK = NOUNIT .OR. LSAME( DIAG, 'U' )
*
*     Validate the arguments in positional order; the first failing
*     test determines INFO.
*
      INFO = 0
      IF( .NOT.UPLOOK ) THEN
         INFO = -1
      ELSE IF( .NOT.TRNSOK ) THEN
         INFO = -2
      ELSE IF( .NOT.DIAGOK ) THEN
         INFO = -3
      ELSE IF( N.LT.0 ) THEN
         INFO = -4
      ELSE IF( KD.LT.0 ) THEN
         INFO = -5
      ELSE IF( NRHS.LT.0 ) THEN
         INFO = -6
      ELSE IF( LDAB.LT.KD+1 ) THEN
         INFO = -8
      ELSE IF( LDB.LT.MAX( 1, N ) ) THEN
         INFO = -10
      END IF
      IF( INFO.NE.0 ) THEN
         CALL XERBLA( 'CTBTRS', -INFO )
         RETURN
      END IF
*
*     An empty matrix needs no work.
*
      IF( N.EQ.0 ) RETURN
*
*     Singularity check, needed only when the diagonal is stored.
*     The diagonal is read from band row KD+1 when UPLO = 'U' and
*     from band row 1 when UPLO = 'L'.  INFO reports the index of
*     the first zero diagonal entry found.
*
      IF( NOUNIT ) THEN
         IF( UPPER ) THEN
            IDIAG = KD + 1
         ELSE
            IDIAG = 1
         END IF
         DO 10 JCOL = 1, N
            IF( AB( IDIAG, JCOL ).EQ.CZERO ) THEN
               INFO = JCOL
               RETURN
            END IF
   10    CONTINUE
      END IF
*
*     Solve op( A ) * X = B one right-hand side at a time; each
*     column of B is overwritten in place by CTBSV.
*
      DO 20 JRHS = 1, NRHS
         CALL CTBSV( UPLO, TRANS, DIAG, N, KD, AB, LDAB,
     $               B( 1, JRHS ), 1 )
   20 CONTINUE
*
      RETURN
*
*     End of CTBTRS
*

◆ ctfsm()

subroutine ctfsm	(	character	transr,
		character	side,
		character	uplo,
		character	trans,
		character	diag,
		integer	m,
		integer	n,
		complex	alpha,
		complex, dimension( 0: * )	a,
		complex, dimension( 0: ldb-1, 0: * )	b,
		integer	ldb )

CTFSM solves a matrix equation (one operand is a triangular matrix in RFP format).

Download CTFSM + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> Level 3 BLAS like routine for A in RFP Format.
!>
!> CTFSM solves the matrix equation
!>
!>    op( A )*X = alpha*B  or  X*op( A ) = alpha*B
!>
!> where alpha is a scalar, X and B are m by n matrices, A is a unit, or
!> non-unit,  upper or lower triangular matrix  and  op( A )  is one  of
!>
!>    op( A ) = A   or   op( A ) = A**H.
!>
!> A is in Rectangular Full Packed (RFP) Format.
!>
!> The matrix X is overwritten on B.
!>

Parameters

[in]	TRANSR	!> TRANSR is CHARACTER*1 !> = 'N': The Normal Form of RFP A is stored; !> = 'C': The Conjugate-transpose Form of RFP A is stored. !>
[in]	SIDE	!> SIDE is CHARACTER*1 !> On entry, SIDE specifies whether op( A ) appears on the left !> or right of X as follows: !> !> SIDE = 'L' or 'l' op( A )*X = alpha*B. !> !> SIDE = 'R' or 'r' X*op( A ) = alpha*B. !> !> Unchanged on exit. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> On entry, UPLO specifies whether the RFP matrix A came from !> an upper or lower triangular matrix as follows: !> UPLO = 'U' or 'u' RFP A came from an upper triangular matrix !> UPLO = 'L' or 'l' RFP A came from a lower triangular matrix !> !> Unchanged on exit. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> On entry, TRANS specifies the form of op( A ) to be used !> in the matrix multiplication as follows: !> !> TRANS = 'N' or 'n' op( A ) = A. !> !> TRANS = 'C' or 'c' op( A ) = conjg( A' ). !> !> Unchanged on exit. !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> On entry, DIAG specifies whether or not RFP A is unit !> triangular as follows: !> !> DIAG = 'U' or 'u' A is assumed to be unit triangular. !> !> DIAG = 'N' or 'n' A is not assumed to be unit !> triangular. !> !> Unchanged on exit. !>
[in]	M	!> M is INTEGER !> On entry, M specifies the number of rows of B. M must be at !> least zero. !> Unchanged on exit. !>
[in]	N	!> N is INTEGER !> On entry, N specifies the number of columns of B. N must be !> at least zero. !> Unchanged on exit. !>
[in]	ALPHA	!> ALPHA is COMPLEX !> On entry, ALPHA specifies the scalar alpha. When alpha is !> zero then A is not referenced and B need not be set before !> entry. !> Unchanged on exit. !>
[in]	A	!> A is COMPLEX array, dimension (N*(N+1)/2) !> NT = N*(N+1)/2. On entry, the matrix A in RFP Format. !> RFP Format is described by TRANSR, UPLO and N as follows: !> If TRANSR='N' then RFP A is (0:N,0:K-1) when N is even; !> K=N/2. RFP A is (0:N-1,0:K) when N is odd; K=N/2. If !> TRANSR = 'C' then RFP is the Conjugate-transpose of RFP A as !> defined when TRANSR = 'N'. The contents of RFP A are defined !> by UPLO as follows: If UPLO = 'U' the RFP A contains the NT !> elements of upper packed A either in normal or !> conjugate-transpose Format. If UPLO = 'L' the RFP A contains !> the NT elements of lower packed A either in normal or !> conjugate-transpose Format. The LDA of RFP A is (N+1)/2 when !> TRANSR = 'C'. When TRANSR is 'N' the LDA is N+1 when N is !> even and is N when N is odd. !> See the Note below for more details. Unchanged on exit. !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,N) !> Before entry, the leading m by n part of the array B must !> contain the right-hand side matrix B, and on exit is !> overwritten by the solution matrix X. !>
[in]	LDB	!> LDB is INTEGER !> On entry, LDB specifies the first dimension of B as declared !> in the calling (sub) program. LDB must be at least !> max( 1, m ). !> Unchanged on exit. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  We first consider Standard Packed Format when N is even.
!>  We give an example where N = 6.
!>
!>      AP is Upper             AP is Lower
!>
!>   00 01 02 03 04 05       00
!>      11 12 13 14 15       10 11
!>         22 23 24 25       20 21 22
!>            33 34 35       30 31 32 33
!>               44 45       40 41 42 43 44
!>                  55       50 51 52 53 54 55
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:5,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(4:6,0:2) consists of
!>  conjugate-transpose of the first three columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(1:6,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:2,0:2) consists of
!>  conjugate-transpose of the last three columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N even and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                -- -- --
!>        03 04 05                33 43 53
!>                                   -- --
!>        13 14 15                00 44 54
!>                                      --
!>        23 24 25                10 11 55
!>
!>        33 34 35                20 21 22
!>        --
!>        00 44 45                30 31 32
!>        -- --
!>        01 11 55                40 41 42
!>        -- -- --
!>        02 12 22                50 51 52
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- -- --                -- -- -- -- -- --
!>     03 13 23 33 00 01 02    33 00 10 20 30 40 50
!>     -- -- -- -- --                -- -- -- -- --
!>     04 14 24 34 44 11 12    43 44 11 21 31 41 51
!>     -- -- -- -- -- --                -- -- -- --
!>     05 15 25 35 45 55 22    53 54 55 22 32 42 52
!>
!>
!>  We next  consider Standard Packed Format when N is odd.
!>  We give an example where N = 5.
!>
!>     AP is Upper                 AP is Lower
!>
!>   00 01 02 03 04              00
!>      11 12 13 14              10 11
!>         22 23 24              20 21 22
!>            33 34              30 31 32 33
!>               44              40 41 42 43 44
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:4,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(3:4,0:1) consists of
!>  conjugate-transpose of the first two   columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(0:4,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:1,1:2) consists of
!>  conjugate-transpose of the last two   columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N odd  and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                   -- --
!>        02 03 04                00 33 43
!>                                      --
!>        12 13 14                10 11 44
!>
!>        22 23 24                20 21 22
!>        --
!>        00 33 34                30 31 32
!>        -- --
!>        01 11 44                40 41 42
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- --                   -- -- -- -- -- --
!>     02 12 22 00 01             00 10 20 30 40 50
!>     -- -- -- --                   -- -- -- -- --
!>     03 13 23 33 11             33 11 21 31 41 51
!>     -- -- -- -- --                   -- -- -- --
!>     04 14 24 34 44             43 44 22 32 42 52
!>

Definition at line 296 of file ctfsm.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          TRANSR, DIAG, SIDE, TRANS, UPLO
      INTEGER            LDB, M, N
      COMPLEX            ALPHA
*     ..
*     .. Array Arguments ..
      COMPLEX            A( 0: * ), B( 0: LDB-1, 0: * )
*     ..
*
*  =====================================================================
*     ..
*     .. Parameters ..
      COMPLEX            CONE, CZERO
      parameter( cone = ( 1.0e+0, 0.0e+0 ),
     $                   czero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LOWER, LSIDE, MISODD, NISODD, NORMALTRANSR,
     $                   NOTRANS
      INTEGER            M1, M2, N1, N2, K, INFO, I, J
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla, cgemm, ctrsm
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, mod
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      normaltransr = lsame( transr, 'N' )
      lside = lsame( side, 'L' )
      lower = lsame( uplo, 'L' )
      notrans = lsame( trans, 'N' )
      IF( .NOT.normaltransr .AND. .NOT.lsame( transr, 'C' ) ) THEN
         info = -1
      ELSE IF( .NOT.lside .AND. .NOT.lsame( side, 'R' ) ) THEN
         info = -2
      ELSE IF( .NOT.lower .AND. .NOT.lsame( uplo, 'U' ) ) THEN
         info = -3
      ELSE IF( .NOT.notrans .AND. .NOT.lsame( trans, 'C' ) ) THEN
         info = -4
      ELSE IF( .NOT.lsame( diag, 'N' ) .AND. .NOT.lsame( diag, 'U' ) )
     $         THEN
         info = -5
      ELSE IF( m.LT.0 ) THEN
         info = -6
      ELSE IF( n.LT.0 ) THEN
         info = -7
      ELSE IF( ldb.LT.max( 1, m ) ) THEN
         info = -11
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTFSM ', -info )
         RETURN
      END IF
*
*     Quick return when ( (N.EQ.0).OR.(M.EQ.0) )
*
      IF( ( m.EQ.0 ) .OR. ( n.EQ.0 ) )
     $   RETURN
*
*     Quick return when ALPHA.EQ.(0E+0,0E+0)
*
      IF( alpha.EQ.czero ) THEN
         DO 20 j = 0, n - 1
            DO 10 i = 0, m - 1
               b( i, j ) = czero
   10       CONTINUE
   20    CONTINUE
         RETURN
      END IF
*
      IF( lside ) THEN
*
*        SIDE = 'L'
*
*        A is M-by-M.
*        If M is odd, set NISODD = .TRUE., and M1 and M2.
*        If M is even, NISODD = .FALSE., and M.
*
         IF( mod( m, 2 ).EQ.0 ) THEN
            misodd = .false.
            k = m / 2
         ELSE
            misodd = .true.
            IF( lower ) THEN
               m2 = m / 2
               m1 = m - m2
            ELSE
               m1 = m / 2
               m2 = m - m1
            END IF
         END IF
*
         IF( misodd ) THEN
*
*           SIDE = 'L' and N is odd
*
            IF( normaltransr ) THEN
*
*              SIDE = 'L', N is odd, and TRANSR = 'N'
*
               IF( lower ) THEN
*
*                 SIDE  ='L', N is odd, TRANSR = 'N', and UPLO = 'L'
*
                  IF( notrans ) THEN
*
*                    SIDE  ='L', N is odd, TRANSR = 'N', UPLO = 'L', and
*                    TRANS = 'N'
*
                     IF( m.EQ.1 ) THEN
                        CALL ctrsm( 'L', 'L', 'N', diag, m1, n, alpha,
     $                              a, m, b, ldb )
                     ELSE
                        CALL ctrsm( 'L', 'L', 'N', diag, m1, n, alpha,
     $                              a( 0 ), m, b, ldb )
                        CALL cgemm( 'N', 'N', m2, n, m1, -cone, a( m1 ),
     $                              m, b, ldb, alpha, b( m1, 0 ), ldb )
                        CALL ctrsm( 'L', 'U', 'C', diag, m2, n, cone,
     $                              a( m ), m, b( m1, 0 ), ldb )
                     END IF
*
                  ELSE
*
*                    SIDE  ='L', N is odd, TRANSR = 'N', UPLO = 'L', and
*                    TRANS = 'C'
*
                     IF( m.EQ.1 ) THEN
                        CALL ctrsm( 'L', 'L', 'C', diag, m1, n, alpha,
     $                              a( 0 ), m, b, ldb )
                     ELSE
                        CALL ctrsm( 'L', 'U', 'N', diag, m2, n, alpha,
     $                              a( m ), m, b( m1, 0 ), ldb )
                        CALL cgemm( 'C', 'N', m1, n, m2, -cone, a( m1 ),
     $                              m, b( m1, 0 ), ldb, alpha, b, ldb )
                        CALL ctrsm( 'L', 'L', 'C', diag, m1, n, cone,
     $                              a( 0 ), m, b, ldb )
                     END IF
*
                  END IF
*
               ELSE
*
*                 SIDE  ='L', N is odd, TRANSR = 'N', and UPLO = 'U'
*
                  IF( .NOT.notrans ) THEN
*
*                    SIDE  ='L', N is odd, TRANSR = 'N', UPLO = 'U', and
*                    TRANS = 'N'
*
                     CALL ctrsm( 'L', 'L', 'N', diag, m1, n, alpha,
     $                           a( m2 ), m, b, ldb )
                     CALL cgemm( 'C', 'N', m2, n, m1, -cone, a( 0 ), m,
     $                           b, ldb, alpha, b( m1, 0 ), ldb )
                     CALL ctrsm( 'L', 'U', 'C', diag, m2, n, cone,
     $                           a( m1 ), m, b( m1, 0 ), ldb )
*
                  ELSE
*
*                    SIDE  ='L', N is odd, TRANSR = 'N', UPLO = 'U', and
*                    TRANS = 'C'
*
                     CALL ctrsm( 'L', 'U', 'N', diag, m2, n, alpha,
     $                           a( m1 ), m, b( m1, 0 ), ldb )
                     CALL cgemm( 'N', 'N', m1, n, m2, -cone, a( 0 ), m,
     $                           b( m1, 0 ), ldb, alpha, b, ldb )
                     CALL ctrsm( 'L', 'L', 'C', diag, m1, n, cone,
     $                           a( m2 ), m, b, ldb )
*
                  END IF
*
               END IF
*
            ELSE
*
*              SIDE = 'L', N is odd, and TRANSR = 'C'
*
               IF( lower ) THEN
*
*                 SIDE  ='L', N is odd, TRANSR = 'C', and UPLO = 'L'
*
                  IF( notrans ) THEN
*
*                    SIDE  ='L', N is odd, TRANSR = 'C', UPLO = 'L', and
*                    TRANS = 'N'
*
                     IF( m.EQ.1 ) THEN
                        CALL ctrsm( 'L', 'U', 'C', diag, m1, n, alpha,
     $                              a( 0 ), m1, b, ldb )
                     ELSE
                        CALL ctrsm( 'L', 'U', 'C', diag, m1, n, alpha,
     $                              a( 0 ), m1, b, ldb )
                        CALL cgemm( 'C', 'N', m2, n, m1, -cone,
     $                              a( m1*m1 ), m1, b, ldb, alpha,
     $                              b( m1, 0 ), ldb )
                        CALL ctrsm( 'L', 'L', 'N', diag, m2, n, cone,
     $                              a( 1 ), m1, b( m1, 0 ), ldb )
                     END IF
*
                  ELSE
*
*                    SIDE  ='L', N is odd, TRANSR = 'C', UPLO = 'L', and
*                    TRANS = 'C'
*
                     IF( m.EQ.1 ) THEN
                        CALL ctrsm( 'L', 'U', 'N', diag, m1, n, alpha,
     $                              a( 0 ), m1, b, ldb )
                     ELSE
                        CALL ctrsm( 'L', 'L', 'C', diag, m2, n, alpha,
     $                              a( 1 ), m1, b( m1, 0 ), ldb )
                        CALL cgemm( 'N', 'N', m1, n, m2, -cone,
     $                              a( m1*m1 ), m1, b( m1, 0 ), ldb,
     $                              alpha, b, ldb )
                        CALL ctrsm( 'L', 'U', 'N', diag, m1, n, cone,
     $                              a( 0 ), m1, b, ldb )
                     END IF
*
                  END IF
*
               ELSE
*
*                 SIDE  ='L', N is odd, TRANSR = 'C', and UPLO = 'U'
*
                  IF( .NOT.notrans ) THEN
*
*                    SIDE  ='L', N is odd, TRANSR = 'C', UPLO = 'U', and
*                    TRANS = 'N'
*
                     CALL ctrsm( 'L', 'U', 'C', diag, m1, n, alpha,
     $                           a( m2*m2 ), m2, b, ldb )
                     CALL cgemm( 'N', 'N', m2, n, m1, -cone, a( 0 ), m2,
     $                           b, ldb, alpha, b( m1, 0 ), ldb )
                     CALL ctrsm( 'L', 'L', 'N', diag, m2, n, cone,
     $                           a( m1*m2 ), m2, b( m1, 0 ), ldb )
*
                  ELSE
*
*                    SIDE  ='L', N is odd, TRANSR = 'C', UPLO = 'U', and
*                    TRANS = 'C'
*
                     CALL ctrsm( 'L', 'L', 'C', diag, m2, n, alpha,
     $                           a( m1*m2 ), m2, b( m1, 0 ), ldb )
                     CALL cgemm( 'C', 'N', m1, n, m2, -cone, a( 0 ), m2,
     $                           b( m1, 0 ), ldb, alpha, b, ldb )
                     CALL ctrsm( 'L', 'U', 'N', diag, m1, n, cone,
     $                           a( m2*m2 ), m2, b, ldb )
*
                  END IF
*
               END IF
*
            END IF
*
         ELSE
*
*           SIDE = 'L' and N is even
*
            IF( normaltransr ) THEN
*
*              SIDE = 'L', N is even, and TRANSR = 'N'
*
               IF( lower ) THEN
*
*                 SIDE  ='L', N is even, TRANSR = 'N', and UPLO = 'L'
*
                  IF( notrans ) THEN
*
*                    SIDE  ='L', N is even, TRANSR = 'N', UPLO = 'L',
*                    and TRANS = 'N'
*
                     CALL ctrsm( 'L', 'L', 'N', diag, k, n, alpha,
     $                           a( 1 ), m+1, b, ldb )
                     CALL cgemm( 'N', 'N', k, n, k, -cone, a( k+1 ),
     $                           m+1, b, ldb, alpha, b( k, 0 ), ldb )
                     CALL ctrsm( 'L', 'U', 'C', diag, k, n, cone,
     $                           a( 0 ), m+1, b( k, 0 ), ldb )
*
                  ELSE
*
*                    SIDE  ='L', N is even, TRANSR = 'N', UPLO = 'L',
*                    and TRANS = 'C'
*
                     CALL ctrsm( 'L', 'U', 'N', diag, k, n, alpha,
     $                           a( 0 ), m+1, b( k, 0 ), ldb )
                     CALL cgemm( 'C', 'N', k, n, k, -cone, a( k+1 ),
     $                           m+1, b( k, 0 ), ldb, alpha, b, ldb )
                     CALL ctrsm( 'L', 'L', 'C', diag, k, n, cone,
     $                           a( 1 ), m+1, b, ldb )
*
                  END IF
*
               ELSE
*
*                 SIDE  ='L', N is even, TRANSR = 'N', and UPLO = 'U'
*
                  IF( .NOT.notrans ) THEN
*
*                    SIDE  ='L', N is even, TRANSR = 'N', UPLO = 'U',
*                    and TRANS = 'N'
*
                     CALL ctrsm( 'L', 'L', 'N', diag, k, n, alpha,
     $                           a( k+1 ), m+1, b, ldb )
                     CALL cgemm( 'C', 'N', k, n, k, -cone, a( 0 ), m+1,
     $                           b, ldb, alpha, b( k, 0 ), ldb )
                     CALL ctrsm( 'L', 'U', 'C', diag, k, n, cone,
     $                           a( k ), m+1, b( k, 0 ), ldb )
*
                  ELSE
*
*                    SIDE  ='L', N is even, TRANSR = 'N', UPLO = 'U',
*                    and TRANS = 'C'
                     CALL ctrsm( 'L', 'U', 'N', diag, k, n, alpha,
     $                           a( k ), m+1, b( k, 0 ), ldb )
                     CALL cgemm( 'N', 'N', k, n, k, -cone, a( 0 ), m+1,
     $                           b( k, 0 ), ldb, alpha, b, ldb )
                     CALL ctrsm( 'L', 'L', 'C', diag, k, n, cone,
     $                           a( k+1 ), m+1, b, ldb )
*
                  END IF
*
               END IF
*
            ELSE
*
*              SIDE = 'L', N is even, and TRANSR = 'C'
*
               IF( lower ) THEN
*
*                 SIDE  ='L', N is even, TRANSR = 'C', and UPLO = 'L'
*
                  IF( notrans ) THEN
*
*                    SIDE  ='L', N is even, TRANSR = 'C', UPLO = 'L',
*                    and TRANS = 'N'
*
                     CALL ctrsm( 'L', 'U', 'C', diag, k, n, alpha,
     $                           a( k ), k, b, ldb )
                     CALL cgemm( 'C', 'N', k, n, k, -cone,
     $                           a( k*( k+1 ) ), k, b, ldb, alpha,
     $                           b( k, 0 ), ldb )
                     CALL ctrsm( 'L', 'L', 'N', diag, k, n, cone,
     $                           a( 0 ), k, b( k, 0 ), ldb )
*
                  ELSE
*
*                    SIDE  ='L', N is even, TRANSR = 'C', UPLO = 'L',
*                    and TRANS = 'C'
*
                     CALL ctrsm( 'L', 'L', 'C', diag, k, n, alpha,
     $                           a( 0 ), k, b( k, 0 ), ldb )
                     CALL cgemm( 'N', 'N', k, n, k, -cone,
     $                           a( k*( k+1 ) ), k, b( k, 0 ), ldb,
     $                           alpha, b, ldb )
                     CALL ctrsm( 'L', 'U', 'N', diag, k, n, cone,
     $                           a( k ), k, b, ldb )
*
                  END IF
*
               ELSE
*
*                 SIDE  ='L', N is even, TRANSR = 'C', and UPLO = 'U'
*
                  IF( .NOT.notrans ) THEN
*
*                    SIDE  ='L', N is even, TRANSR = 'C', UPLO = 'U',
*                    and TRANS = 'N'
*
                     CALL ctrsm( 'L', 'U', 'C', diag, k, n, alpha,
     $                           a( k*( k+1 ) ), k, b, ldb )
                     CALL cgemm( 'N', 'N', k, n, k, -cone, a( 0 ), k, b,
     $                           ldb, alpha, b( k, 0 ), ldb )
                     CALL ctrsm( 'L', 'L', 'N', diag, k, n, cone,
     $                           a( k*k ), k, b( k, 0 ), ldb )
*
                  ELSE
*
*                    SIDE  ='L', N is even, TRANSR = 'C', UPLO = 'U',
*                    and TRANS = 'C'
*
                     CALL ctrsm( 'L', 'L', 'C', diag, k, n, alpha,
     $                           a( k*k ), k, b( k, 0 ), ldb )
                     CALL cgemm( 'C', 'N', k, n, k, -cone, a( 0 ), k,
     $                           b( k, 0 ), ldb, alpha, b, ldb )
                     CALL ctrsm( 'L', 'U', 'N', diag, k, n, cone,
     $                           a( k*( k+1 ) ), k, b, ldb )
*
                  END IF
*
               END IF
*
            END IF
*
         END IF
*
      ELSE
*
*        SIDE = 'R'
*
*        A is N-by-N.
*        If N is odd, set NISODD = .TRUE., and N1 and N2.
*        If N is even, NISODD = .FALSE., and K.
*
         IF( mod( n, 2 ).EQ.0 ) THEN
            nisodd = .false.
            k = n / 2
         ELSE
            nisodd = .true.
            IF( lower ) THEN
               n2 = n / 2
               n1 = n - n2
            ELSE
               n1 = n / 2
               n2 = n - n1
            END IF
         END IF
*
         IF( nisodd ) THEN
*
*           SIDE = 'R' and N is odd
*
            IF( normaltransr ) THEN
*
*              SIDE = 'R', N is odd, and TRANSR = 'N'
*
               IF( lower ) THEN
*
*                 SIDE  ='R', N is odd, TRANSR = 'N', and UPLO = 'L'
*
                  IF( notrans ) THEN
*
*                    SIDE  ='R', N is odd, TRANSR = 'N', UPLO = 'L', and
*                    TRANS = 'N'
*
                     CALL ctrsm( 'R', 'U', 'C', diag, m, n2, alpha,
     $                           a( n ), n, b( 0, n1 ), ldb )
                     CALL cgemm( 'N', 'N', m, n1, n2, -cone, b( 0, n1 ),
     $                           ldb, a( n1 ), n, alpha, b( 0, 0 ),
     $                           ldb )
                     CALL ctrsm( 'R', 'L', 'N', diag, m, n1, cone,
     $                           a( 0 ), n, b( 0, 0 ), ldb )
*
                  ELSE
*
*                    SIDE  ='R', N is odd, TRANSR = 'N', UPLO = 'L', and
*                    TRANS = 'C'
*
                     CALL ctrsm( 'R', 'L', 'C', diag, m, n1, alpha,
     $                           a( 0 ), n, b( 0, 0 ), ldb )
                     CALL cgemm( 'N', 'C', m, n2, n1, -cone, b( 0, 0 ),
     $                           ldb, a( n1 ), n, alpha, b( 0, n1 ),
     $                           ldb )
                     CALL ctrsm( 'R', 'U', 'N', diag, m, n2, cone,
     $                           a( n ), n, b( 0, n1 ), ldb )
*
                  END IF
*
               ELSE
*
*                 SIDE  ='R', N is odd, TRANSR = 'N', and UPLO = 'U'
*
                  IF( notrans ) THEN
*
*                    SIDE  ='R', N is odd, TRANSR = 'N', UPLO = 'U', and
*                    TRANS = 'N'
*
                     CALL ctrsm( 'R', 'L', 'C', diag, m, n1, alpha,
     $                           a( n2 ), n, b( 0, 0 ), ldb )
                     CALL cgemm( 'N', 'N', m, n2, n1, -cone, b( 0, 0 ),
     $                           ldb, a( 0 ), n, alpha, b( 0, n1 ),
     $                           ldb )
                     CALL ctrsm( 'R', 'U', 'N', diag, m, n2, cone,
     $                           a( n1 ), n, b( 0, n1 ), ldb )
*
                  ELSE
*
*                    SIDE  ='R', N is odd, TRANSR = 'N', UPLO = 'U', and
*                    TRANS = 'C'
*
                     CALL ctrsm( 'R', 'U', 'C', diag, m, n2, alpha,
     $                           a( n1 ), n, b( 0, n1 ), ldb )
                     CALL cgemm( 'N', 'C', m, n1, n2, -cone, b( 0, n1 ),
     $                           ldb, a( 0 ), n, alpha, b( 0, 0 ), ldb )
                     CALL ctrsm( 'R', 'L', 'N', diag, m, n1, cone,
     $                           a( n2 ), n, b( 0, 0 ), ldb )
*
                  END IF
*
               END IF
*
            ELSE
*
*              SIDE = 'R', N is odd, and TRANSR = 'C'
*
               IF( lower ) THEN
*
*                 SIDE  ='R', N is odd, TRANSR = 'C', and UPLO = 'L'
*
                  IF( notrans ) THEN
*
*                    SIDE  ='R', N is odd, TRANSR = 'C', UPLO = 'L', and
*                    TRANS = 'N'
*
                     CALL ctrsm( 'R', 'L', 'N', diag, m, n2, alpha,
     $                           a( 1 ), n1, b( 0, n1 ), ldb )
                     CALL cgemm( 'N', 'C', m, n1, n2, -cone, b( 0, n1 ),
     $                           ldb, a( n1*n1 ), n1, alpha, b( 0, 0 ),
     $                           ldb )
                     CALL ctrsm( 'R', 'U', 'C', diag, m, n1, cone,
     $                           a( 0 ), n1, b( 0, 0 ), ldb )
*
                  ELSE
*
*                    SIDE  ='R', N is odd, TRANSR = 'C', UPLO = 'L', and
*                    TRANS = 'C'
*
                     CALL ctrsm( 'R', 'U', 'N', diag, m, n1, alpha,
     $                           a( 0 ), n1, b( 0, 0 ), ldb )
                     CALL cgemm( 'N', 'N', m, n2, n1, -cone, b( 0, 0 ),
     $                           ldb, a( n1*n1 ), n1, alpha, b( 0, n1 ),
     $                           ldb )
                     CALL ctrsm( 'R', 'L', 'C', diag, m, n2, cone,
     $                           a( 1 ), n1, b( 0, n1 ), ldb )
*
                  END IF
*
               ELSE
*
*                 SIDE  ='R', N is odd, TRANSR = 'C', and UPLO = 'U'
*
                  IF( notrans ) THEN
*
*                    SIDE  ='R', N is odd, TRANSR = 'C', UPLO = 'U', and
*                    TRANS = 'N'
*
                     CALL ctrsm( 'R', 'U', 'N', diag, m, n1, alpha,
     $                           a( n2*n2 ), n2, b( 0, 0 ), ldb )
                     CALL cgemm( 'N', 'C', m, n2, n1, -cone, b( 0, 0 ),
     $                           ldb, a( 0 ), n2, alpha, b( 0, n1 ),
     $                           ldb )
                     CALL ctrsm( 'R', 'L', 'C', diag, m, n2, cone,
     $                           a( n1*n2 ), n2, b( 0, n1 ), ldb )
*
                  ELSE
*
*                    SIDE  ='R', N is odd, TRANSR = 'C', UPLO = 'U', and
*                    TRANS = 'C'
*
                     CALL ctrsm( 'R', 'L', 'N', diag, m, n2, alpha,
     $                           a( n1*n2 ), n2, b( 0, n1 ), ldb )
                     CALL cgemm( 'N', 'N', m, n1, n2, -cone, b( 0, n1 ),
     $                           ldb, a( 0 ), n2, alpha, b( 0, 0 ),
     $                           ldb )
                     CALL ctrsm( 'R', 'U', 'C', diag, m, n1, cone,
     $                           a( n2*n2 ), n2, b( 0, 0 ), ldb )
*
                  END IF
*
               END IF
*
            END IF
*
         ELSE
*
*           SIDE = 'R' and N is even
*
            IF( normaltransr ) THEN
*
*              SIDE = 'R', N is even, and TRANSR = 'N'
*
               IF( lower ) THEN
*
*                 SIDE  ='R', N is even, TRANSR = 'N', and UPLO = 'L'
*
                  IF( notrans ) THEN
*
*                    SIDE  ='R', N is even, TRANSR = 'N', UPLO = 'L',
*                    and TRANS = 'N'
*
                     CALL ctrsm( 'R', 'U', 'C', diag, m, k, alpha,
     $                           a( 0 ), n+1, b( 0, k ), ldb )
                     CALL cgemm( 'N', 'N', m, k, k, -cone, b( 0, k ),
     $                           ldb, a( k+1 ), n+1, alpha, b( 0, 0 ),
     $                           ldb )
                     CALL ctrsm( 'R', 'L', 'N', diag, m, k, cone,
     $                           a( 1 ), n+1, b( 0, 0 ), ldb )
*
                  ELSE
*
*                    SIDE  ='R', N is even, TRANSR = 'N', UPLO = 'L',
*                    and TRANS = 'C'
*
                     CALL ctrsm( 'R', 'L', 'C', diag, m, k, alpha,
     $                           a( 1 ), n+1, b( 0, 0 ), ldb )
                     CALL cgemm( 'N', 'C', m, k, k, -cone, b( 0, 0 ),
     $                           ldb, a( k+1 ), n+1, alpha, b( 0, k ),
     $                           ldb )
                     CALL ctrsm( 'R', 'U', 'N', diag, m, k, cone,
     $                           a( 0 ), n+1, b( 0, k ), ldb )
*
                  END IF
*
               ELSE
*
*                 SIDE  ='R', N is even, TRANSR = 'N', and UPLO = 'U'
*
                  IF( notrans ) THEN
*
*                    SIDE  ='R', N is even, TRANSR = 'N', UPLO = 'U',
*                    and TRANS = 'N'
*
                     CALL ctrsm( 'R', 'L', 'C', diag, m, k, alpha,
     $                           a( k+1 ), n+1, b( 0, 0 ), ldb )
                     CALL cgemm( 'N', 'N', m, k, k, -cone, b( 0, 0 ),
     $                           ldb, a( 0 ), n+1, alpha, b( 0, k ),
     $                           ldb )
                     CALL ctrsm( 'R', 'U', 'N', diag, m, k, cone,
     $                           a( k ), n+1, b( 0, k ), ldb )
*
                  ELSE
*
*                    SIDE  ='R', N is even, TRANSR = 'N', UPLO = 'U',
*                    and TRANS = 'C'
*
                     CALL ctrsm( 'R', 'U', 'C', diag, m, k, alpha,
     $                           a( k ), n+1, b( 0, k ), ldb )
                     CALL cgemm( 'N', 'C', m, k, k, -cone, b( 0, k ),
     $                           ldb, a( 0 ), n+1, alpha, b( 0, 0 ),
     $                           ldb )
                     CALL ctrsm( 'R', 'L', 'N', diag, m, k, cone,
     $                           a( k+1 ), n+1, b( 0, 0 ), ldb )
*
                  END IF
*
               END IF
*
            ELSE
*
*              SIDE = 'R', N is even, and TRANSR = 'C'
*
               IF( lower ) THEN
*
*                 SIDE  ='R', N is even, TRANSR = 'C', and UPLO = 'L'
*
                  IF( notrans ) THEN
*
*                    SIDE  ='R', N is even, TRANSR = 'C', UPLO = 'L',
*                    and TRANS = 'N'
*
                     CALL ctrsm( 'R', 'L', 'N', diag, m, k, alpha,
     $                           a( 0 ), k, b( 0, k ), ldb )
                     CALL cgemm( 'N', 'C', m, k, k, -cone, b( 0, k ),
     $                           ldb, a( ( k+1 )*k ), k, alpha,
     $                           b( 0, 0 ), ldb )
                     CALL ctrsm( 'R', 'U', 'C', diag, m, k, cone,
     $                           a( k ), k, b( 0, 0 ), ldb )
*
                  ELSE
*
*                    SIDE  ='R', N is even, TRANSR = 'C', UPLO = 'L',
*                    and TRANS = 'C'
*
                     CALL ctrsm( 'R', 'U', 'N', diag, m, k, alpha,
     $                           a( k ), k, b( 0, 0 ), ldb )
                     CALL cgemm( 'N', 'N', m, k, k, -cone, b( 0, 0 ),
     $                           ldb, a( ( k+1 )*k ), k, alpha,
     $                           b( 0, k ), ldb )
                     CALL ctrsm( 'R', 'L', 'C', diag, m, k, cone,
     $                           a( 0 ), k, b( 0, k ), ldb )
*
                  END IF
*
               ELSE
*
*                 SIDE  ='R', N is even, TRANSR = 'C', and UPLO = 'U'
*
                  IF( notrans ) THEN
*
*                    SIDE  ='R', N is even, TRANSR = 'C', UPLO = 'U',
*                    and TRANS = 'N'
*
                     CALL ctrsm( 'R', 'U', 'N', diag, m, k, alpha,
     $                           a( ( k+1 )*k ), k, b( 0, 0 ), ldb )
                     CALL cgemm( 'N', 'C', m, k, k, -cone, b( 0, 0 ),
     $                           ldb, a( 0 ), k, alpha, b( 0, k ), ldb )
                     CALL ctrsm( 'R', 'L', 'C', diag, m, k, cone,
     $                           a( k*k ), k, b( 0, k ), ldb )
*
                  ELSE
*
*                    SIDE  ='R', N is even, TRANSR = 'C', UPLO = 'U',
*                    and TRANS = 'C'
*
                     CALL ctrsm( 'R', 'L', 'N', diag, m, k, alpha,
     $                           a( k*k ), k, b( 0, k ), ldb )
                     CALL cgemm( 'N', 'N', m, k, k, -cone, b( 0, k ),
     $                           ldb, a( 0 ), k, alpha, b( 0, 0 ), ldb )
                     CALL ctrsm( 'R', 'U', 'C', diag, m, k, cone,
     $                           a( ( k+1 )*k ), k, b( 0, 0 ), ldb )
*
                  END IF
*
               END IF
*
            END IF
*
         END IF
      END IF
*
      RETURN
*
*     End of CTFSM
*

◆ ctftri()

subroutine ctftri	(	character	transr,
		character	uplo,
		character	diag,
		integer	n,
		complex, dimension( 0: * )	a,
		integer	info )

CTFTRI

Download CTFTRI + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTFTRI computes the inverse of a triangular matrix A stored in RFP
!> format.
!>
!> This is a Level 3 BLAS version of the algorithm.
!>

Parameters

[in]	TRANSR	!> TRANSR is CHARACTER*1 !> = 'N': The Normal TRANSR of RFP A is stored; !> = 'C': The Conjugate-transpose TRANSR of RFP A is stored. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> = 'N': A is non-unit triangular; !> = 'U': A is unit triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension ( N*(N+1)/2 ); !> On entry, the triangular matrix A in RFP format. RFP format !> is described by TRANSR, UPLO, and N as follows: If TRANSR = !> 'N' then RFP A is (0:N,0:k-1) when N is even; k=N/2. RFP A is !> (0:N-1,0:k) when N is odd; k=N/2. IF TRANSR = 'C' then RFP is !> the Conjugate-transpose of RFP A as defined when !> TRANSR = 'N'. The contents of RFP A are defined by UPLO as !> follows: If UPLO = 'U' the RFP A contains the nt elements of !> upper packed A; If UPLO = 'L' the RFP A contains the nt !> elements of lower packed A. The LDA of RFP A is (N+1)/2 when !> TRANSR = 'C'. When TRANSR is 'N' the LDA is N+1 when N is !> even and N when N is odd. See the Note below for more details. !> !> On exit, the (triangular) inverse of the original matrix, in !> the same storage format. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, A(i,i) is exactly zero. The triangular !> matrix is singular and its inverse can not be computed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  We first consider Standard Packed Format when N is even.
!>  We give an example where N = 6.
!>
!>      AP is Upper             AP is Lower
!>
!>   00 01 02 03 04 05       00
!>      11 12 13 14 15       10 11
!>         22 23 24 25       20 21 22
!>            33 34 35       30 31 32 33
!>               44 45       40 41 42 43 44
!>                  55       50 51 52 53 54 55
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:5,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(4:6,0:2) consists of
!>  conjugate-transpose of the first three columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(1:6,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:2,0:2) consists of
!>  conjugate-transpose of the last three columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N even and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                -- -- --
!>        03 04 05                33 43 53
!>                                   -- --
!>        13 14 15                00 44 54
!>                                      --
!>        23 24 25                10 11 55
!>
!>        33 34 35                20 21 22
!>        --
!>        00 44 45                30 31 32
!>        -- --
!>        01 11 55                40 41 42
!>        -- -- --
!>        02 12 22                50 51 52
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- -- --                -- -- -- -- -- --
!>     03 13 23 33 00 01 02    33 00 10 20 30 40 50
!>     -- -- -- -- --                -- -- -- -- --
!>     04 14 24 34 44 11 12    43 44 11 21 31 41 51
!>     -- -- -- -- -- --                -- -- -- --
!>     05 15 25 35 45 55 22    53 54 55 22 32 42 52
!>
!>
!>  We next  consider Standard Packed Format when N is odd.
!>  We give an example where N = 5.
!>
!>     AP is Upper                 AP is Lower
!>
!>   00 01 02 03 04              00
!>      11 12 13 14              10 11
!>         22 23 24              20 21 22
!>            33 34              30 31 32 33
!>               44              40 41 42 43 44
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:4,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(3:4,0:1) consists of
!>  conjugate-transpose of the first two   columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(0:4,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:1,1:2) consists of
!>  conjugate-transpose of the last two   columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N odd  and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                   -- --
!>        02 03 04                00 33 43
!>                                      --
!>        12 13 14                10 11 44
!>
!>        22 23 24                20 21 22
!>        --
!>        00 33 34                30 31 32
!>        -- --
!>        01 11 44                40 41 42
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- --                   -- -- -- -- --
!>     02 12 22 00 01             00 10 20 30 40
!>     -- -- -- --                   -- -- -- --
!>     03 13 23 33 11             33 11 21 31 41
!>     -- -- -- -- --                   -- -- --
!>     04 14 24 34 44             43 44 22 32 42
!>

Definition at line 220 of file ctftri.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          TRANSR, UPLO, DIAG
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( 0: * )
*     ..
*
*  =====================================================================
*
*     In-place inversion of a triangular matrix held in RFP format.
*
*     The RFP array is viewed as two triangles, T1 and T2, plus a
*     rectangular block S.  Every storage variant below performs the
*     same four steps, differing only in where the three pieces start,
*     their leading dimension and the side/transpose flags:
*
*        1. CTRTRI inverts T1 in place.
*        2. CTRMM  overwrites S with -op( inv(T1) ) applied to S.
*        3. CTRTRI inverts T2 in place.
*        4. CTRMM  overwrites S with op( inv(T2) ) applied to S.
*
*     On a positive INFO from CTRTRI the routine returns at once.
*     The value from step 3 is first increased by the order of T1,
*     so that it indexes the diagonal of the full matrix A.
*
*     .. Parameters ..
      COMPLEX            CONE
      parameter( cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LOWER, NISODD, NORMALTRANSR
      INTEGER            N1, N2, K
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           ctrmm, ctrtri, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          mod
*     ..
*     .. Executable Statements ..
*
*     Decode the option characters once; both the argument checks
*     and the case selection below rely on these flags.
*
      normaltransr = lsame( transr, 'N' )
      lower = lsame( uplo, 'L' )
*
*     Check the arguments in positional order so that INFO names the
*     first illegal one.
*
      info = 0
      IF( .NOT.( normaltransr .OR. lsame( transr, 'C' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( lower .OR. lsame( uplo, 'U' ) ) ) THEN
         info = -2
      ELSE IF( .NOT.( lsame( diag, 'N' ) .OR. lsame( diag, 'U' ) ) )
     $         THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTFTRI', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty matrix.
*
      IF( n.EQ.0 ) RETURN
*
*     Record the parity of N; K = N/2 is only needed (and only set)
*     when N is even.
*
      nisodd = mod( n, 2 ).NE.0
      IF( .NOT.nisodd ) k = n / 2
*
*     Orders of the two triangles when N is odd: T1 has order N1 and
*     T2 has order N2; the larger one depends on UPLO.
*
      IF( lower ) THEN
         n1 = n - n / 2
         n2 = n / 2
      ELSE
         n1 = n / 2
         n2 = n - n / 2
      END IF
*
*     Dispatch on ( parity of N, TRANSR, UPLO ): eight cases.
*
      IF( nisodd .AND. normaltransr .AND. lower ) THEN
*
*        N odd, TRANSR = 'N', UPLO = 'L'  ( a(0:n-1,0:n1-1) )
*        T1 -> a(0,0), T2 -> a(0,1), S -> a(n1,0)
*        T1 -> a(0), T2 -> a(n), S -> a(n1); lda = n
*
         CALL ctrtri( 'L', diag, n1, a( 0 ), n, info )
         IF( info.GT.0 ) RETURN
         CALL ctrmm( 'R', 'L', 'N', diag, n2, n1, -cone, a( 0 ), n,
     $               a( n1 ), n )
         CALL ctrtri( 'U', diag, n2, a( n ), n, info )
         IF( info.GT.0 ) THEN
            info = info + n1
            RETURN
         END IF
         CALL ctrmm( 'L', 'U', 'C', diag, n2, n1, cone, a( n ), n,
     $               a( n1 ), n )
*
      ELSE IF( nisodd .AND. normaltransr ) THEN
*
*        N odd, TRANSR = 'N', UPLO = 'U'  ( a(0:n-1,0:n2-1) )
*        T1 -> a(n1+1,0), T2 -> a(n1,0), S -> a(0,0)
*        T1 -> a(n2), T2 -> a(n1), S -> a(0); lda = n
*
         CALL ctrtri( 'L', diag, n1, a( n2 ), n, info )
         IF( info.GT.0 ) RETURN
         CALL ctrmm( 'L', 'L', 'C', diag, n1, n2, -cone, a( n2 ), n,
     $               a( 0 ), n )
         CALL ctrtri( 'U', diag, n2, a( n1 ), n, info )
         IF( info.GT.0 ) THEN
            info = info + n1
            RETURN
         END IF
         CALL ctrmm( 'R', 'U', 'N', diag, n1, n2, cone, a( n1 ), n,
     $               a( 0 ), n )
*
      ELSE IF( nisodd .AND. lower ) THEN
*
*        N odd, TRANSR = 'C', UPLO = 'L'
*        T1 -> a(0), T2 -> a(1), S -> a(0+n1*n1); lda = n1
*
         CALL ctrtri( 'U', diag, n1, a( 0 ), n1, info )
         IF( info.GT.0 ) RETURN
         CALL ctrmm( 'L', 'U', 'N', diag, n1, n2, -cone, a( 0 ), n1,
     $               a( n1*n1 ), n1 )
         CALL ctrtri( 'L', diag, n2, a( 1 ), n1, info )
         IF( info.GT.0 ) THEN
            info = info + n1
            RETURN
         END IF
         CALL ctrmm( 'R', 'L', 'C', diag, n1, n2, cone, a( 1 ), n1,
     $               a( n1*n1 ), n1 )
*
      ELSE IF( nisodd ) THEN
*
*        N odd, TRANSR = 'C', UPLO = 'U'
*        T1 -> a(0+n2*n2), T2 -> a(0+n1*n2), S -> a(0); lda = n2
*
         CALL ctrtri( 'U', diag, n1, a( n2*n2 ), n2, info )
         IF( info.GT.0 ) RETURN
         CALL ctrmm( 'R', 'U', 'C', diag, n2, n1, -cone,
     $               a( n2*n2 ), n2, a( 0 ), n2 )
         CALL ctrtri( 'L', diag, n2, a( n1*n2 ), n2, info )
         IF( info.GT.0 ) THEN
            info = info + n1
            RETURN
         END IF
         CALL ctrmm( 'L', 'L', 'N', diag, n2, n1, cone,
     $               a( n1*n2 ), n2, a( 0 ), n2 )
*
      ELSE IF( normaltransr .AND. lower ) THEN
*
*        N even, TRANSR = 'N', UPLO = 'L'  ( a(0:n,0:k-1) )
*        T1 -> a(1,0), T2 -> a(0,0), S -> a(k+1,0)
*        T1 -> a(1), T2 -> a(0), S -> a(k+1); lda = n+1
*
         CALL ctrtri( 'L', diag, k, a( 1 ), n+1, info )
         IF( info.GT.0 ) RETURN
         CALL ctrmm( 'R', 'L', 'N', diag, k, k, -cone, a( 1 ), n+1,
     $               a( k+1 ), n+1 )
         CALL ctrtri( 'U', diag, k, a( 0 ), n+1, info )
         IF( info.GT.0 ) THEN
            info = info + k
            RETURN
         END IF
         CALL ctrmm( 'L', 'U', 'C', diag, k, k, cone, a( 0 ), n+1,
     $               a( k+1 ), n+1 )
*
      ELSE IF( normaltransr ) THEN
*
*        N even, TRANSR = 'N', UPLO = 'U'  ( a(0:n,0:k-1) )
*        T1 -> a(k+1,0), T2 -> a(k,0), S -> a(0,0)
*        T1 -> a(k+1), T2 -> a(k), S -> a(0); lda = n+1
*
         CALL ctrtri( 'L', diag, k, a( k+1 ), n+1, info )
         IF( info.GT.0 ) RETURN
         CALL ctrmm( 'L', 'L', 'C', diag, k, k, -cone, a( k+1 ),
     $               n+1, a( 0 ), n+1 )
         CALL ctrtri( 'U', diag, k, a( k ), n+1, info )
         IF( info.GT.0 ) THEN
            info = info + k
            RETURN
         END IF
         CALL ctrmm( 'R', 'U', 'N', diag, k, k, cone, a( k ), n+1,
     $               a( 0 ), n+1 )
*
      ELSE IF( lower ) THEN
*
*        N even, TRANSR = 'C', UPLO = 'L'  (see paper)
*        T1 -> B(0,1), T2 -> B(0,0), S -> B(0,k+1)
*        T1 -> a(0+k), T2 -> a(0+0), S -> a(0+k*(k+1)); lda = k
*
         CALL ctrtri( 'U', diag, k, a( k ), k, info )
         IF( info.GT.0 ) RETURN
         CALL ctrmm( 'L', 'U', 'N', diag, k, k, -cone, a( k ), k,
     $               a( k*( k+1 ) ), k )
         CALL ctrtri( 'L', diag, k, a( 0 ), k, info )
         IF( info.GT.0 ) THEN
            info = info + k
            RETURN
         END IF
         CALL ctrmm( 'R', 'L', 'C', diag, k, k, cone, a( 0 ), k,
     $               a( k*( k+1 ) ), k )
*
      ELSE
*
*        N even, TRANSR = 'C', UPLO = 'U'  (see paper)
*        T1 -> B(0,k+1), T2 -> B(0,k), S -> B(0,0)
*        T1 -> a(0+k*(k+1)), T2 -> a(0+k*k), S -> a(0+0); lda = k
*
         CALL ctrtri( 'U', diag, k, a( k*( k+1 ) ), k, info )
         IF( info.GT.0 ) RETURN
         CALL ctrmm( 'R', 'U', 'C', diag, k, k, -cone,
     $               a( k*( k+1 ) ), k, a( 0 ), k )
         CALL ctrtri( 'L', diag, k, a( k*k ), k, info )
         IF( info.GT.0 ) THEN
            info = info + k
            RETURN
         END IF
         CALL ctrmm( 'L', 'L', 'N', diag, k, k, cone, a( k*k ), k,
     $               a( 0 ), k )
*
      END IF
*
      RETURN
*
*     End of CTFTRI
*

◆ ctfttp()

subroutine ctfttp	(	character	transr,
		character	uplo,
		integer	n,
		complex, dimension( 0: * )	arf,
		complex, dimension( 0: * )	ap,
		integer	info )

CTFTTP copies a triangular matrix from the rectangular full packed format (TF) to the standard packed format (TP).

Download CTFTTP + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTFTTP copies a triangular matrix A from rectangular full packed
!> format (TF) to standard packed format (TP).
!>

Parameters

[in]	TRANSR	!> TRANSR is CHARACTER*1 !> = 'N': ARF is in Normal format; !> = 'C': ARF is in Conjugate-transpose format; !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	ARF	!> ARF is COMPLEX array, dimension ( N*(N+1)/2 ), !> On entry, the upper or lower triangular matrix A stored in !> RFP format. For a further discussion see Notes below. !>
[out]	AP	!> AP is COMPLEX array, dimension ( N*(N+1)/2 ), !> On exit, the upper or lower triangular matrix A, packed !> columnwise in a linear array. The j-th column of A is stored !> in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  We first consider Standard Packed Format when N is even.
!>  We give an example where N = 6.
!>
!>      AP is Upper             AP is Lower
!>
!>   00 01 02 03 04 05       00
!>      11 12 13 14 15       10 11
!>         22 23 24 25       20 21 22
!>            33 34 35       30 31 32 33
!>               44 45       40 41 42 43 44
!>                  55       50 51 52 53 54 55
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:5,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(4:6,0:2) consists of
!>  conjugate-transpose of the first three columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(1:6,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:2,0:2) consists of
!>  conjugate-transpose of the last three columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N even and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                -- -- --
!>        03 04 05                33 43 53
!>                                   -- --
!>        13 14 15                00 44 54
!>                                      --
!>        23 24 25                10 11 55
!>
!>        33 34 35                20 21 22
!>        --
!>        00 44 45                30 31 32
!>        -- --
!>        01 11 55                40 41 42
!>        -- -- --
!>        02 12 22                50 51 52
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- -- --                -- -- -- -- -- --
!>     03 13 23 33 00 01 02    33 00 10 20 30 40 50
!>     -- -- -- -- --                -- -- -- -- --
!>     04 14 24 34 44 11 12    43 44 11 21 31 41 51
!>     -- -- -- -- -- --                -- -- -- --
!>     05 15 25 35 45 55 22    53 54 55 22 32 42 52
!>
!>
!>  We next  consider Standard Packed Format when N is odd.
!>  We give an example where N = 5.
!>
!>     AP is Upper                 AP is Lower
!>
!>   00 01 02 03 04              00
!>      11 12 13 14              10 11
!>         22 23 24              20 21 22
!>            33 34              30 31 32 33
!>               44              40 41 42 43 44
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:4,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(3:4,0:1) consists of
!>  conjugate-transpose of the first two   columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(0:4,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:1,1:2) consists of
!>  conjugate-transpose of the last two   columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N odd  and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                   -- --
!>        02 03 04                00 33 43
!>                                      --
!>        12 13 14                10 11 44
!>
!>        22 23 24                20 21 22
!>        --
!>        00 33 34                30 31 32
!>        -- --
!>        01 11 44                40 41 42
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- --                   -- -- -- -- --
!>     02 12 22 00 01             00 10 20 30 40
!>     -- -- -- --                   -- -- -- --
!>     03 13 23 33 11             33 11 21 31 41
!>     -- -- -- -- --                   -- -- --
!>     04 14 24 34 44             43 44 22 32 42
!>

Definition at line 207 of file ctfttp.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of CTFTTP.  Every value stored into AP below is read from
*  ARF, either unchanged or through CONJG; ARF is never written.
*  Both arrays are indexed from 0.  AP is filled strictly
*  sequentially (index IJP = 0, 1, 2, ...), while ARF is read
*  either contiguously or with stride LDA depending on the case.
*
*  INFO = 0 on normal return.  If TRANSR, UPLO or N is illegal,
*  INFO is set to -1, -2 or -3 respectively, XERBLA is called and
*  the routine returns before AP is touched.
*
*     .. Scalar Arguments ..
      CHARACTER          TRANSR, UPLO
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      COMPLEX            AP( 0: * ), ARF( 0: * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     ..
*     .. Local Scalars ..
*     LOWER        : UPLO  = 'L'
*     NORMALTRANSR : TRANSR = 'N'
*     NISODD       : N is odd
*     N1, N2       : the two parts N is split into (N1 + N2 = N)
*     K            : N/2, assigned only when N is even
*     NT           : N*(N+1)/2
*     LDA          : LOCAL variable (not an argument): leading
*                    dimension used to index ARF as a 2-D array
*     IJP          : next position to be written in AP
*     IJ           : position being read in ARF
*     JP, JS       : running start offsets into ARF
      LOGICAL            LOWER, NISODD, NORMALTRANSR
      INTEGER            N1, N2, K, NT
      INTEGER            I, J, IJ
      INTEGER            IJP, JP, LDA, JS
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg
*     ..
*     NOTE(review): MOD is also used below but is not named in the
*     INTRINSIC statement above.
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*     The checks are chained, so only the first illegal argument
*     is reported.
*
      info = 0
      normaltransr = lsame( transr, 'N' )
      lower = lsame( uplo, 'L' )
      IF( .NOT.normaltransr .AND. .NOT.lsame( transr, 'C' ) ) THEN
         info = -1
      ELSE IF( .NOT.lower .AND. .NOT.lsame( uplo, 'U' ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTFTTP', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     N = 1: a single element; it is conjugated when TRANSR = 'C'.
*
      IF( n.EQ.1 ) THEN
         IF( normaltransr ) THEN
            ap( 0 ) = arf( 0 )
         ELSE
            ap( 0 ) = conjg( arf( 0 ) )
         END IF
         RETURN
      END IF
*
*     Size of array ARF(0:NT-1)
*     NOTE(review): NT is not referenced again in this routine.
*
      nt = n*( n+1 ) / 2
*
*     Set N1 and N2 depending on LOWER
*     (for odd N the larger half is N1 when LOWER, N2 otherwise)
*
      IF( lower ) THEN
         n2 = n / 2
         n1 = n - n2
      ELSE
         n1 = n / 2
         n2 = n - n1
      END IF
*
*     If N is odd, set NISODD = .TRUE.
*     If N is even, set K = N/2 and NISODD = .FALSE.
*
*     Also set LDA for TRANSR = 'N': N+1 if N is even, N if N is odd.
*
*     set lda of ARF^C; ARF^C is (0:(N+1)/2-1,0:N-noe)
*     where noe = 0 if n is even, noe = 1 if n is odd
*
      IF( mod( n, 2 ).EQ.0 ) THEN
         k = n / 2
         nisodd = .false.
         lda = n + 1
      ELSE
         nisodd = .true.
         lda = n
      END IF
*
*     ARF^C has lda rows and n+1-noe cols
*     (for TRANSR = 'C' the value chosen above is overridden here)
*
      IF( .NOT.normaltransr )
     $   lda = ( n+1 ) / 2
*
*     start execution: there are eight cases
*     ( N odd / even ) x ( TRANSR = 'N' / 'C' ) x ( UPLO = 'L' / 'U' )
*
      IF( nisodd ) THEN
*
*        N is odd
*
         IF( normaltransr ) THEN
*
*           N is odd and TRANSR = 'N'
*
            IF( lower ) THEN
*
*             SRPA for LOWER, NORMAL and N is odd ( a(0:n-1,0:n1-1) )
*             T1 -> a(0,0), T2 -> a(0,1), S -> a(n1,0)
*             T1 -> a(0), T2 -> a(n), S -> a(n1); lda = n
*
*             First pass: for J = 0..N2 copy ARF(J+JP : N-1+JP)
*             unchanged, where JP = J*LDA.
*
               ijp = 0
               jp = 0
               DO j = 0, n2
                  DO i = j, n - 1
                     ij = i + jp
                     ap( ijp ) = arf( ij )
                     ijp = ijp + 1
                  END DO
                  jp = jp + lda
               END DO
*
*             Second pass: for I = 0..N2-1 append CONJG of
*             ARF(I + J*LDA), J = I+1..N2 (stride LDA in ARF).
*
               DO i = 0, n2 - 1
                  DO j = 1 + i, n2
                     ij = i + j*lda
                     ap( ijp ) = conjg( arf( ij ) )
                     ijp = ijp + 1
                  END DO
               END DO
*
            ELSE
*
*             SRPA for UPPER, NORMAL and N is odd ( a(0:n-1,0:n2-1) )
*             T1 -> a(n1+1,0), T2 -> a(n1,0), S -> a(0,0)
*             T1 -> a(n2), T2 -> a(n1), S -> a(0)
*
*             First pass: for J = 0..N1-1 append CONJG of the J+1
*             entries ARF(N2+J), ARF(N2+J+LDA), ... (stride LDA).
*
               ijp = 0
               DO j = 0, n1 - 1
                  ij = n2 + j
                  DO i = 0, j
                     ap( ijp ) = conjg( arf( ij ) )
                     ijp = ijp + 1
                     ij = ij + lda
                  END DO
               END DO
*
*             Second pass: for J = N1..N-1 copy the J+1 contiguous
*             entries ARF(JS : JS+J); JS advances by LDA per J.
*             NOTE(review): the assignment IJ = JS is immediately
*             superseded by the DO loop on IJ that follows it.
*
               js = 0
               DO j = n1, n - 1
                  ij = js
                  DO ij = js, js + j
                     ap( ijp ) = arf( ij )
                     ijp = ijp + 1
                  END DO
                  js = js + lda
               END DO
*
            END IF
*
         ELSE
*
*           N is odd and TRANSR = 'C'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, TRANSPOSE and N is odd
*              T1 -> A(0,0) , T2 -> A(1,0) , S -> A(0,n1)
*              T1 -> a(0+0) , T2 -> a(1+0) , S -> a(0+n1*n1); lda=n1
*
*              First pass: for I = 0..N2 append CONJG of
*              ARF(I*(LDA+1)), ARF(I*(LDA+1)+LDA), ... up to index
*              N*LDA-1 (stride LDA).
*
               ijp = 0
               DO i = 0, n2
                  DO ij = i*( lda+1 ), n*lda - 1, lda
                     ap( ijp ) = conjg( arf( ij ) )
                     ijp = ijp + 1
                  END DO
               END DO
*
*              Second pass: for J = 0..N2-1 copy the N2-J contiguous
*              entries starting at JS; JS starts at 1 and advances
*              by LDA+1 per J.
*
               js = 1
               DO j = 0, n2 - 1
                  DO ij = js, js + n2 - j - 1
                     ap( ijp ) = arf( ij )
                     ijp = ijp + 1
                  END DO
                  js = js + lda + 1
               END DO
*
            ELSE
*
*              SRPA for UPPER, TRANSPOSE and N is odd
*              T1 -> A(0,n1+1), T2 -> A(0,n1), S -> A(0,0)
*              T1 -> a(n2*n2), T2 -> a(n1*n2), S -> a(0); lda = n2
*
*              First pass: for J = 0..N1-1 copy the J+1 contiguous
*              entries ARF(JS : JS+J); JS starts at N2*LDA and
*              advances by LDA per J.
*
               ijp = 0
               js = n2*lda
               DO j = 0, n1 - 1
                  DO ij = js, js + j
                     ap( ijp ) = arf( ij )
                     ijp = ijp + 1
                  END DO
                  js = js + lda
               END DO
*
*              Second pass: for I = 0..N1 append CONJG of
*              ARF(I), ARF(I+LDA), ..., ARF(I+(N1+I)*LDA).
*
               DO i = 0, n1
                  DO ij = i, i + ( n1+i )*lda, lda
                     ap( ijp ) = conjg( arf( ij ) )
                     ijp = ijp + 1
                  END DO
               END DO
*
            END IF
*
         END IF
*
      ELSE
*
*        N is even
*
         IF( normaltransr ) THEN
*
*           N is even and TRANSR = 'N'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, NORMAL, and N is even ( a(0:n,0:k-1) )
*              T1 -> a(1,0), T2 -> a(0,0), S -> a(k+1,0)
*              T1 -> a(1), T2 -> a(0), S -> a(k+1)
*
*              First pass: for J = 0..K-1 copy ARF(1+J+JP : N+JP)
*              unchanged, where JP = J*LDA (note the offset of 1).
*
               ijp = 0
               jp = 0
               DO j = 0, k - 1
                  DO i = j, n - 1
                     ij = 1 + i + jp
                     ap( ijp ) = arf( ij )
                     ijp = ijp + 1
                  END DO
                  jp = jp + lda
               END DO
*
*              Second pass: for I = 0..K-1 append CONJG of
*              ARF(I + J*LDA), J = I..K-1 (stride LDA in ARF).
*
               DO i = 0, k - 1
                  DO j = i, k - 1
                     ij = i + j*lda
                     ap( ijp ) = conjg( arf( ij ) )
                     ijp = ijp + 1
                  END DO
               END DO
*
            ELSE
*
*              SRPA for UPPER, NORMAL, and N is even ( a(0:n,0:k-1) )
*              T1 -> a(k+1,0) ,  T2 -> a(k,0),   S -> a(0,0)
*              T1 -> a(k+1), T2 -> a(k), S -> a(0)
*
*              First pass: for J = 0..K-1 append CONJG of the J+1
*              entries ARF(K+1+J), ARF(K+1+J+LDA), ... (stride LDA).
*
               ijp = 0
               DO j = 0, k - 1
                  ij = k + 1 + j
                  DO i = 0, j
                     ap( ijp ) = conjg( arf( ij ) )
                     ijp = ijp + 1
                     ij = ij + lda
                  END DO
               END DO
*
*              Second pass: for J = K..N-1 copy the J+1 contiguous
*              entries ARF(JS : JS+J); JS advances by LDA per J.
*              NOTE(review): the assignment IJ = JS is immediately
*              superseded by the DO loop on IJ that follows it.
*
               js = 0
               DO j = k, n - 1
                  ij = js
                  DO ij = js, js + j
                     ap( ijp ) = arf( ij )
                     ijp = ijp + 1
                  END DO
                  js = js + lda
               END DO
*
            END IF
*
         ELSE
*
*           N is even and TRANSR = 'C'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, TRANSPOSE and N is even (see paper)
*              T1 -> B(0,1), T2 -> B(0,0), S -> B(0,k+1)
*              T1 -> a(0+k), T2 -> a(0+0), S -> a(0+k*(k+1)); lda=k
*
*              First pass: for I = 0..K-1 append CONJG of
*              ARF(I+(I+1)*LDA), then every LDA-th entry up to
*              index (N+1)*LDA-1.
*
               ijp = 0
               DO i = 0, k - 1
                  DO ij = i + ( i+1 )*lda, ( n+1 )*lda - 1, lda
                     ap( ijp ) = conjg( arf( ij ) )
                     ijp = ijp + 1
                  END DO
               END DO
*
*              Second pass: for J = 0..K-1 copy the K-J contiguous
*              entries starting at JS; JS starts at 0 and advances
*              by LDA+1 per J.
*
               js = 0
               DO j = 0, k - 1
                  DO ij = js, js + k - j - 1
                     ap( ijp ) = arf( ij )
                     ijp = ijp + 1
                  END DO
                  js = js + lda + 1
               END DO
*
            ELSE
*
*              SRPA for UPPER, TRANSPOSE and N is even (see paper)
*              T1 -> B(0,k+1),     T2 -> B(0,k),   S -> B(0,0)
*              T1 -> a(0+k*(k+1)), T2 -> a(0+k*k), S -> a(0+0)); lda=k
*
*              First pass: for J = 0..K-1 copy the J+1 contiguous
*              entries ARF(JS : JS+J); JS starts at (K+1)*LDA and
*              advances by LDA per J.
*
               ijp = 0
               js = ( k+1 )*lda
               DO j = 0, k - 1
                  DO ij = js, js + j
                     ap( ijp ) = arf( ij )
                     ijp = ijp + 1
                  END DO
                  js = js + lda
               END DO
*
*              Second pass: for I = 0..K-1 append CONJG of
*              ARF(I), ARF(I+LDA), ..., ARF(I+(K+I)*LDA).
*
               DO i = 0, k - 1
                  DO ij = i, i + ( k+i )*lda, lda
                     ap( ijp ) = conjg( arf( ij ) )
                     ijp = ijp + 1
                  END DO
               END DO
*
            END IF
*
         END IF
*
      END IF
*
      RETURN
*
*     End of CTFTTP
*

◆ ctfttr()

subroutine ctfttr	(	character	transr,
		character	uplo,
		integer	n,
		complex, dimension( 0: * )	arf,
		complex, dimension( 0: lda-1, 0: * )	a,
		integer	lda,
		integer	info )

CTFTTR copies a triangular matrix from the rectangular full packed format (TF) to the standard full format (TR).

Download CTFTTR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTFTTR copies a triangular matrix A from rectangular full packed
!> format (TF) to standard full format (TR).
!>

Parameters

[in]	TRANSR	!> TRANSR is CHARACTER*1 !> = 'N': ARF is in Normal format; !> = 'C': ARF is in Conjugate-transpose format; !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	ARF	!> ARF is COMPLEX array, dimension ( N*(N+1)/2 ), !> On entry, the upper or lower triangular matrix A stored in !> RFP format. For a further discussion see Notes below. !>
[out]	A	!> A is COMPLEX array, dimension ( LDA, N ) !> On exit, the triangular matrix A. If UPLO = 'U', the !> leading N-by-N upper triangular part of the array A contains !> the upper triangular matrix, and the strictly lower !> triangular part of A is not referenced. If UPLO = 'L', the !> leading N-by-N lower triangular part of the array A contains !> the lower triangular matrix, and the strictly upper !> triangular part of A is not referenced. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  We first consider Standard Packed Format when N is even.
!>  We give an example where N = 6.
!>
!>      AP is Upper             AP is Lower
!>
!>   00 01 02 03 04 05       00
!>      11 12 13 14 15       10 11
!>         22 23 24 25       20 21 22
!>            33 34 35       30 31 32 33
!>               44 45       40 41 42 43 44
!>                  55       50 51 52 53 54 55
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:5,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(4:6,0:2) consists of
!>  conjugate-transpose of the first three columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(1:6,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:2,0:2) consists of
!>  conjugate-transpose of the last three columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N even and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                -- -- --
!>        03 04 05                33 43 53
!>                                   -- --
!>        13 14 15                00 44 54
!>                                      --
!>        23 24 25                10 11 55
!>
!>        33 34 35                20 21 22
!>        --
!>        00 44 45                30 31 32
!>        -- --
!>        01 11 55                40 41 42
!>        -- -- --
!>        02 12 22                50 51 52
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- -- --                -- -- -- -- -- --
!>     03 13 23 33 00 01 02    33 00 10 20 30 40 50
!>     -- -- -- -- --                -- -- -- -- --
!>     04 14 24 34 44 11 12    43 44 11 21 31 41 51
!>     -- -- -- -- -- --                -- -- -- --
!>     05 15 25 35 45 55 22    53 54 55 22 32 42 52
!>
!>
!>  We next  consider Standard Packed Format when N is odd.
!>  We give an example where N = 5.
!>
!>     AP is Upper                 AP is Lower
!>
!>   00 01 02 03 04              00
!>      11 12 13 14              10 11
!>         22 23 24              20 21 22
!>            33 34              30 31 32 33
!>               44              40 41 42 43 44
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:4,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(3:4,0:1) consists of
!>  conjugate-transpose of the first two   columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(0:4,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:1,1:2) consists of
!>  conjugate-transpose of the last two   columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N odd  and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                   -- --
!>        02 03 04                00 33 43
!>                                      --
!>        12 13 14                10 11 44
!>
!>        22 23 24                20 21 22
!>        --
!>        00 33 34                30 31 32
!>        -- --
!>        01 11 44                40 41 42
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- --                   -- -- -- -- --
!>     02 12 22 00 01             00 10 20 30 40
!>     -- -- -- --                   -- -- -- --
!>     03 13 23 33 11             33 11 21 31 41
!>     -- -- -- -- --                   -- -- --
!>     04 14 24 34 44             43 44 22 32 42
!>

Definition at line 215 of file ctfttr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of CTFTTR.  Every value stored into A below is read from
*  ARF, either unchanged or through CONJG; ARF is never written.
*  A is indexed A(0:LDA-1,0:*) and ARF from 0.  ARF is traversed
*  through the single running index IJ, which is advanced by one
*  after each element read.
*
*  INFO = 0 on normal return.  If TRANSR, UPLO, N or LDA is
*  illegal, INFO is set to -1, -2, -3 or -6 respectively, XERBLA
*  is called and the routine returns before A is touched.
*
*     .. Scalar Arguments ..
      CHARACTER          TRANSR, UPLO
      INTEGER            INFO, N, LDA
*     ..
*     .. Array Arguments ..
      COMPLEX            A( 0: LDA-1, 0: * ), ARF( 0: * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     ..
*     .. Local Scalars ..
*     LOWER        : UPLO  = 'L'
*     NORMALTRANSR : TRANSR = 'N'
*     NISODD       : N is odd
*     N1, N2       : the two parts N is split into (N1 + N2 = N)
*     K            : N/2, assigned only when N is even
*     NT           : N*(N+1)/2
*     NX2          : 2*N,   assigned only for odd  N and UPLO = 'U'
*     NP1X2        : 2*N+2, assigned only for even N and UPLO = 'U'
*     IJ           : position being read in ARF
      LOGICAL            LOWER, NISODD, NORMALTRANSR
      INTEGER            N1, N2, K, NT, NX2, NP1X2
      INTEGER            I, J, L, IJ
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max, mod
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*     The checks are chained, so only the first illegal argument
*     is reported.
*
      info = 0
      normaltransr = lsame( transr, 'N' )
      lower = lsame( uplo, 'L' )
      IF( .NOT.normaltransr .AND. .NOT.lsame( transr, 'C' ) ) THEN
         info = -1
      ELSE IF( .NOT.lower .AND. .NOT.lsame( uplo, 'U' ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -6
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTFTTR', -info )
         RETURN
      END IF
*
*     Quick return if possible
*     (N = 0: nothing to do;  N = 1: a single element, which is
*     conjugated when TRANSR = 'C')
*
      IF( n.LE.1 ) THEN
         IF( n.EQ.1 ) THEN
            IF( normaltransr ) THEN
               a( 0, 0 ) = arf( 0 )
            ELSE
               a( 0, 0 ) = conjg( arf( 0 ) )
            END IF
         END IF
         RETURN
      END IF
*
*     Size of array ARF(0:nt-1)
*
      nt = n*( n+1 ) / 2
*
*     set N1 and N2 depending on LOWER: for N even N1=N2=K
*
      IF( lower ) THEN
         n2 = n / 2
         n1 = n - n2
      ELSE
         n1 = n / 2
         n2 = n - n1
      END IF
*
*     If N is odd, set NISODD = .TRUE. and, for UPLO = 'U' only,
*     NX2 = 2*N.
*     If N is even, set K = N/2 and NISODD = .FALSE. and, for
*     UPLO = 'U' only, NP1X2 = 2*N+2.
*     NX2 / NP1X2 are the amounts by which IJ is moved backwards
*     after each column in the two UPPER, NORMAL cases below.
*     The argument LDA is not modified here.
*
      IF( mod( n, 2 ).EQ.0 ) THEN
         k = n / 2
         nisodd = .false.
         IF( .NOT.lower )
     $      np1x2 = n + n + 2
      ELSE
         nisodd = .true.
         IF( .NOT.lower )
     $      nx2 = n + n
      END IF
*
*     NOTE(review): in the case headers below, "lda=..." presumably
*     refers to the leading dimension of the RFP array, not to the
*     LDA argument of this routine - confirm.
*
      IF( nisodd ) THEN
*
*        N is odd
*
         IF( normaltransr ) THEN
*
*           N is odd and TRANSR = 'N'
*
            IF( lower ) THEN
*
*             SRPA for LOWER, NORMAL and N is odd ( a(0:n-1,0:n1-1) )
*             T1 -> a(0,0), T2 -> a(0,1), S -> a(n1,0)
*             T1 -> a(0), T2 -> a(n), S -> a(n1); lda=n
*
*             For each J = 0..N2, ARF supplies first the conjugated
*             entries of row N2+J of A (columns N1..N2+J; none when
*             J = 0), then column J of A (rows J..N-1) unchanged.
*
               ij = 0
               DO j = 0, n2
                  DO i = n1, n2 + j
                     a( n2+j, i ) = conjg( arf( ij ) )
                     ij = ij + 1
                  END DO
                  DO i = j, n - 1
                     a( i, j ) = arf( ij )
                     ij = ij + 1
                  END DO
               END DO
*
            ELSE
*
*             SRPA for UPPER, NORMAL and N is odd ( a(0:n-1,0:n2-1) )
*             T1 -> a(n1+1,0), T2 -> a(n1,0), S -> a(0,0)
*             T1 -> a(n2), T2 -> a(n1), S -> a(0); lda=n
*
*             Columns are processed from J = N-1 down to N1, starting
*             at IJ = NT-N.  Each pass reads column J of A (rows
*             0..J) unchanged, then the conjugated entries of row
*             J-N1 of A (columns J-N1..N1-1).  That is N entries in
*             total, so stepping back by NX2 = 2*N leaves IJ at the
*             start of the preceding group of N entries.
*
               ij = nt - n
               DO j = n - 1, n1, -1
                  DO i = 0, j
                     a( i, j ) = arf( ij )
                     ij = ij + 1
                  END DO
                  DO l = j - n1, n1 - 1
                     a( j-n1, l ) = conjg( arf( ij ) )
                     ij = ij + 1
                  END DO
                  ij = ij - nx2
               END DO
*
            END IF
*
         ELSE
*
*           N is odd and TRANSR = 'C'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, TRANSPOSE and N is odd
*              T1 -> A(0,0) , T2 -> A(1,0) , S -> A(0,n1)
*              T1 -> A(0+0) , T2 -> A(1+0) , S -> A(0+n1*n1); lda=n1
*
*              For each J = 0..N2-1, ARF supplies the conjugated
*              entries of row J of A (columns 0..J), then column
*              N1+J of A (rows N1+J..N-1) unchanged.
*
               ij = 0
               DO j = 0, n2 - 1
                  DO i = 0, j
                     a( j, i ) = conjg( arf( ij ) )
                     ij = ij + 1
                  END DO
                  DO i = n1 + j, n - 1
                     a( i, n1+j ) = arf( ij )
                     ij = ij + 1
                  END DO
               END DO
*
*              The remaining entries are the conjugates of rows
*              N2..N-1 of A, columns 0..N1-1.
*
               DO j = n2, n - 1
                  DO i = 0, n1 - 1
                     a( j, i ) = conjg( arf( ij ) )
                     ij = ij + 1
                  END DO
               END DO
*
            ELSE
*
*              SRPA for UPPER, TRANSPOSE and N is odd
*              T1 -> A(0,n1+1), T2 -> A(0,n1), S -> A(0,0)
*              T1 -> A(n2*n2), T2 -> A(n1*n2), S -> A(0); lda = n2
*
*              The leading entries of ARF are the conjugates of rows
*              0..N1 of A, columns N1..N-1.
*
               ij = 0
               DO j = 0, n1
                  DO i = n1, n - 1
                     a( j, i ) = conjg( arf( ij ) )
                     ij = ij + 1
                  END DO
               END DO
*
*              Then, for each J = 0..N1-1: column J of A (rows 0..J)
*              unchanged, followed by the conjugated entries of row
*              N2+J of A (columns N2+J..N-1).
*
               DO j = 0, n1 - 1
                  DO i = 0, j
                     a( i, j ) = arf( ij )
                     ij = ij + 1
                  END DO
                  DO l = n2 + j, n - 1
                     a( n2+j, l ) = conjg( arf( ij ) )
                     ij = ij + 1
                  END DO
               END DO
*
            END IF
*
         END IF
*
      ELSE
*
*        N is even
*
         IF( normaltransr ) THEN
*
*           N is even and TRANSR = 'N'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, NORMAL, and N is even ( a(0:n,0:k-1) )
*              T1 -> a(1,0), T2 -> a(0,0), S -> a(k+1,0)
*              T1 -> a(1), T2 -> a(0), S -> a(k+1); lda=n+1
*
*              For each J = 0..K-1, ARF supplies the conjugated
*              entries of row K+J of A (columns K..K+J), then column
*              J of A (rows J..N-1) unchanged.
*
               ij = 0
               DO j = 0, k - 1
                  DO i = k, k + j
                     a( k+j, i ) = conjg( arf( ij ) )
                     ij = ij + 1
                  END DO
                  DO i = j, n - 1
                     a( i, j ) = arf( ij )
                     ij = ij + 1
                  END DO
               END DO
*
            ELSE
*
*              SRPA for UPPER, NORMAL, and N is even ( a(0:n,0:k-1) )
*              T1 -> a(k+1,0) ,  T2 -> a(k,0),   S -> a(0,0)
*              T1 -> a(k+1), T2 -> a(k), S -> a(0); lda=n+1
*
*              Columns are processed from J = N-1 down to K, starting
*              at IJ = NT-N-1.  Each pass reads column J of A (rows
*              0..J) unchanged, then the conjugated entries of row
*              J-K of A (columns J-K..K-1).  That is N+1 entries in
*              total, so stepping back by NP1X2 = 2*N+2 leaves IJ at
*              the start of the preceding group of N+1 entries.
*
               ij = nt - n - 1
               DO j = n - 1, k, -1
                  DO i = 0, j
                     a( i, j ) = arf( ij )
                     ij = ij + 1
                  END DO
                  DO l = j - k, k - 1
                     a( j-k, l ) = conjg( arf( ij ) )
                     ij = ij + 1
                  END DO
                  ij = ij - np1x2
               END DO
*
            END IF
*
         ELSE
*
*           N is even and TRANSR = 'C'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, TRANSPOSE and N is even (see paper, A=B)
*              T1 -> A(0,1) , T2 -> A(0,0) , S -> A(0,k+1) :
*              T1 -> A(0+k) , T2 -> A(0+0) , S -> A(0+k*(k+1)); lda=k
*
*              The first K entries of ARF are column K of A, rows
*              K..N-1, unchanged.
*
               ij = 0
               j = k
               DO i = k, n - 1
                  a( i, j ) = arf( ij )
                  ij = ij + 1
               END DO
*
*              Then, for each J = 0..K-2: the conjugated entries of
*              row J of A (columns 0..J), followed by column K+1+J
*              of A (rows K+1+J..N-1) unchanged.
*
               DO j = 0, k - 2
                  DO i = 0, j
                     a( j, i ) = conjg( arf( ij ) )
                     ij = ij + 1
                  END DO
                  DO i = k + 1 + j, n - 1
                     a( i, k+1+j ) = arf( ij )
                     ij = ij + 1
                  END DO
               END DO
*
*              The remaining entries are the conjugates of rows
*              K-1..N-1 of A, columns 0..K-1.
*
               DO j = k - 1, n - 1
                  DO i = 0, k - 1
                     a( j, i ) = conjg( arf( ij ) )
                     ij = ij + 1
                  END DO
               END DO
*
            ELSE
*
*              SRPA for UPPER, TRANSPOSE and N is even (see paper, A=B)
*              T1 -> A(0,k+1) , T2 -> A(0,k) , S -> A(0,0)
*              T1 -> A(0+k*(k+1)) , T2 -> A(0+k*k) , S -> A(0+0)); lda=k
*
*              The leading entries of ARF are the conjugates of rows
*              0..K of A, columns K..N-1.
*
               ij = 0
               DO j = 0, k
                  DO i = k, n - 1
                     a( j, i ) = conjg( arf( ij ) )
                     ij = ij + 1
                  END DO
               END DO
*
*              Then, for each J = 0..K-2: column J of A (rows 0..J)
*              unchanged, followed by the conjugated entries of row
*              K+1+J of A (columns K+1+J..N-1).
*
               DO j = 0, k - 2
                  DO i = 0, j
                     a( i, j ) = arf( ij )
                     ij = ij + 1
                  END DO
                  DO l = k + 1 + j, n - 1
                     a( k+1+j, l ) = conjg( arf( ij ) )
                     ij = ij + 1
                  END DO
               END DO
*
*              Note that here J = K-1
*              (the DO variable keeps the value it had when the loop
*              above terminated; the loop below relies on this to
*              copy the last column, A(0:K-1,K-1), unchanged)
*
               DO i = 0, j
                  a( i, j ) = arf( ij )
                  ij = ij + 1
               END DO
*
            END IF
*
         END IF
*
      END IF
*
      RETURN
*
*     End of CTFTTR
*

◆ ctgsen()

subroutine ctgsen	(	integer	ijob,
		logical	wantq,
		logical	wantz,
		logical, dimension( * )	select,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( * )	alpha,
		complex, dimension( * )	beta,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		complex, dimension( ldz, * )	z,
		integer	ldz,
		integer	m,
		real	pl,
		real	pr,
		real, dimension( * )	dif,
		complex, dimension( * )	work,
		integer	lwork,
		integer, dimension( * )	iwork,
		integer	liwork,
		integer	info )

CTGSEN

Download CTGSEN + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTGSEN reorders the generalized Schur decomposition of a complex
!> matrix pair (A, B) (in terms of a unitary equivalence trans-
!> formation Q**H * (A, B) * Z), so that a selected cluster of eigenvalues
!> appears in the leading diagonal blocks of the pair (A,B). The leading
!> columns of Q and Z form unitary bases of the corresponding left and
!> right eigenspaces (deflating subspaces). (A, B) must be in
!> generalized Schur canonical form, that is, A and B are both upper
!> triangular.
!>
!> CTGSEN also computes the generalized eigenvalues
!>
!>          w(j)= ALPHA(j) / BETA(j)
!>
!> of the reordered matrix pair (A, B).
!>
!> Optionally, the routine computes estimates of reciprocal condition
!> numbers for eigenvalues and eigenspaces. These are Difu[(A11,B11),
!> (A22,B22)] and Difl[(A11,B11), (A22,B22)], i.e. the separation(s)
!> between the matrix pairs (A11, B11) and (A22,B22) that correspond to
!> the selected cluster and the eigenvalues outside the cluster, resp.,
!> and norms of "projections" onto left and right eigenspaces w.r.t.
!> the selected cluster in the (1,1)-block.
!>
!>

Parameters

[in]	IJOB	!> IJOB is INTEGER !> Specifies whether condition numbers are required for the !> cluster of eigenvalues (PL and PR) or the deflating subspaces !> (Difu and Difl): !> =0: Only reorder w.r.t. SELECT. No extras. !> =1: Reciprocal of norms of "projections" onto left and right !> eigenspaces w.r.t. the selected cluster (PL and PR). !> =2: Upper bounds on Difu and Difl. F-norm-based estimate !> (DIF(1:2)). !> =3: Estimate of Difu and Difl. 1-norm-based estimate !> (DIF(1:2)). !> About 5 times as expensive as IJOB = 2. !> =4: Compute PL, PR and DIF (i.e. 0, 1 and 2 above): Economic !> version to get it all. !> =5: Compute PL, PR and DIF (i.e. 0, 1 and 3 above) !>
[in]	WANTQ	!> WANTQ is LOGICAL !> .TRUE. : update the left transformation matrix Q; !> .FALSE.: do not update Q. !>
[in]	WANTZ	!> WANTZ is LOGICAL !> .TRUE. : update the right transformation matrix Z; !> .FALSE.: do not update Z. !>
[in]	SELECT	!> SELECT is LOGICAL array, dimension (N) !> SELECT specifies the eigenvalues in the selected cluster. To !> select an eigenvalue w(j), SELECT(j) must be set to !> .TRUE.. !>
[in]	N	!> N is INTEGER !> The order of the matrices A and B. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension(LDA,N) !> On entry, the upper triangular matrix A, in generalized !> Schur canonical form. !> On exit, A is overwritten by the reordered matrix A. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[in,out]	B	!> B is COMPLEX array, dimension(LDB,N) !> On entry, the upper triangular matrix B, in generalized !> Schur canonical form. !> On exit, B is overwritten by the reordered matrix B. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[out]	ALPHA	!> ALPHA is COMPLEX array, dimension (N) !>
[out]	BETA	!> BETA is COMPLEX array, dimension (N) !> !> The diagonal elements of A and B, respectively, !> when the pair (A,B) has been reduced to generalized Schur !> form. ALPHA(i)/BETA(i) i=1,...,N are the generalized !> eigenvalues. !>
[in,out]	Q	!> Q is COMPLEX array, dimension (LDQ,N) !> On entry, if WANTQ = .TRUE., Q is an N-by-N matrix. !> On exit, Q has been postmultiplied by the left unitary !> transformation matrix which reorder (A, B); The leading M !> columns of Q form orthonormal bases for the specified pair of !> left eigenspaces (deflating subspaces). !> If WANTQ = .FALSE., Q is not referenced. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= 1. !> If WANTQ = .TRUE., LDQ >= N. !>
[in,out]	Z	!> Z is COMPLEX array, dimension (LDZ,N) !> On entry, if WANTZ = .TRUE., Z is an N-by-N matrix. !> On exit, Z has been postmultiplied by the right unitary !> transformation matrix which reorders (A, B); The leading M !> columns of Z form orthonormal bases for the specified pair of !> right eigenspaces (deflating subspaces). !> If WANTZ = .FALSE., Z is not referenced. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. LDZ >= 1. !> If WANTZ = .TRUE., LDZ >= N. !>
[out]	M	!> M is INTEGER !> The dimension of the specified pair of left and right !> eigenspaces, (deflating subspaces) 0 <= M <= N. !>
[out]	PL	!> PL is REAL !>
[out]	PR	!> PR is REAL !> !> If IJOB = 1, 4 or 5, PL, PR are lower bounds on the !> reciprocal of the norm of "projections" onto left and right !> eigenspace with respect to the selected cluster. !> 0 < PL, PR <= 1. !> If M = 0 or M = N, PL = PR = 1. !> If IJOB = 0, 2 or 3 PL, PR are not referenced. !>
[out]	DIF	!> DIF is REAL array, dimension (2). !> If IJOB >= 2, DIF(1:2) store the estimates of Difu and Difl. !> If IJOB = 2 or 4, DIF(1:2) are F-norm-based upper bounds on !> Difu and Difl. If IJOB = 3 or 5, DIF(1:2) are 1-norm-based !> estimates of Difu and Difl, computed using reversed !> communication with CLACN2. !> If M = 0 or N, DIF(1:2) = F-norm([A, B]). !> If IJOB = 0 or 1, DIF is not referenced. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= 1 !> If IJOB = 1, 2 or 4, LWORK >= 2M(N-M) !> If IJOB = 3 or 5, LWORK >= 4M(N-M) !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (MAX(1,LIWORK)) !> On exit, if INFO = 0, IWORK(1) returns the optimal LIWORK. !>
[in]	LIWORK	!> LIWORK is INTEGER !> The dimension of the array IWORK. LIWORK >= 1. !> If IJOB = 1, 2 or 4, LIWORK >= N+2; !> If IJOB = 3 or 5, LIWORK >= MAX(N+2, 2M(N-M)); !> !> If LIWORK = -1, then a workspace query is assumed; the !> routine only calculates the optimal size of the IWORK array, !> returns this value as the first entry of the IWORK array, and !> no error message related to LIWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> =0: Successful exit. !> <0: If INFO = -i, the i-th argument had an illegal value. !> =1: Reordering of (A, B) failed because the transformed !> matrix pair (A, B) would be too far from generalized !> Schur form; the problem is very ill-conditioned. !> (A, B) may have been partially reordered. !> If requested, 0 is returned in DIF(*), PL and PR. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  CTGSEN first collects the selected eigenvalues by computing unitary
!>  U and W that move them to the top left corner of (A, B). In other
!>  words, the selected eigenvalues are the eigenvalues of (A11, B11) in
!>
!>              U**H*(A, B)*W = (A11 A12) (B11 B12) n1
!>                              ( 0  A22),( 0  B22) n2
!>                                n1  n2    n1  n2
!>
!>  where N = n1+n2 and U**H means the conjugate transpose of U. The first
!>  n1 columns of U and W span the specified pair of left and right
!>  eigenspaces (deflating subspaces) of (A, B).
!>
!>  If (A, B) has been obtained from the generalized Schur
!>  decomposition of a matrix pair (C, D) = Q*(A, B)*Z**H, then the
!>  reordered generalized Schur form of (C, D) is given by
!>
!>           (C, D) = (Q*U)*(U**H *(A, B)*W)*(Z*W)**H,
!>
!>  and the first n1 columns of Q*U and Z*W span the corresponding
!>  deflating subspaces of (C, D) (Q and Z store Q*U and Z*W, resp.).
!>
!>  Note that if the selected eigenvalue is sufficiently ill-conditioned,
!>  then its value may differ significantly from its value before
!>  reordering.
!>
!>  The reciprocal condition numbers of the left and right eigenspaces
!>  spanned by the first n1 columns of U and W (or Q*U and Z*W) may
!>  be returned in DIF(1:2), corresponding to Difu and Difl, resp.
!>
!>  The Difu and Difl are defined as:
!>
!>       Difu[(A11, B11), (A22, B22)] = sigma-min( Zu )
!>  and
!>       Difl[(A11, B11), (A22, B22)] = Difu[(A22, B22), (A11, B11)],
!>
!>  where sigma-min(Zu) is the smallest singular value of the
!>  (2*n1*n2)-by-(2*n1*n2) matrix
!>
!>       Zu = [ kron(In2, A11)  -kron(A22**H, In1) ]
!>            [ kron(In2, B11)  -kron(B22**H, In1) ].
!>
!>  Here, Inx is the identity matrix of size nx and A22**H is the
!>  conjugate transpose of A22. kron(X, Y) is the Kronecker product between
!>  the matrices X and Y.
!>
!>  When DIF(2) is small, small changes in (A, B) can cause large changes
!>  in the deflating subspace. An approximate (asymptotic) bound on the
!>  maximum angular error in the computed deflating subspaces is
!>
!>       EPS * norm((A, B)) / DIF(2),
!>
!>  where EPS is the machine precision.
!>
!>  The reciprocal norm of the projectors on the left and right
!>  eigenspaces associated with (A11, B11) may be returned in PL and PR.
!>  They are computed as follows. First we compute L and R so that
!>  P*(A, B)*Q is block diagonal, where
!>
!>       P = ( I -L ) n1           Q = ( I R ) n1
!>           ( 0  I ) n2    and        ( 0 I ) n2
!>             n1 n2                    n1 n2
!>
!>  and (L, R) is the solution to the generalized Sylvester equation
!>
!>       A11*R - L*A22 = -A12
!>       B11*R - L*B22 = -B12
!>
!>  Then PL = (F-norm(L)**2+1)**(-1/2) and PR = (F-norm(R)**2+1)**(-1/2).
!>  An approximate (asymptotic) bound on the average absolute error of
!>  the selected eigenvalues is
!>
!>       EPS * norm((A, B)) / PL.
!>
!>  There are also global error bounds which are valid for perturbations
!>  up to a certain restriction:  A lower bound (x) on the smallest
!>  F-norm(E,F) for which an eigenvalue of (A11, B11) may move and
!>  coalesce with an eigenvalue of (A22, B22) under perturbation (E,F),
!>  (i.e. (A + E, B + F)), is
!>
!>   x = min(Difu,Difl)/((1/(PL*PL)+1/(PR*PR))**(1/2)+2*max(1/PL,1/PR)).
!>
!>  An approximate bound on x can be computed from DIF(1:2), PL and PR.
!>
!>  If y = ( F-norm(E,F) / x) <= 1, the angles between the perturbed
!>  (L', R') and unperturbed (L, R) left and right deflating subspaces
!>  associated with the selected cluster in the (1,1)-blocks can be
!>  bounded as
!>
!>   max-angle(L, L') <= arctan( y * PL / (1 - y * (1 - PL * PL)**(1/2)) )
!>   max-angle(R, R') <= arctan( y * PR / (1 - y * (1 - PR * PR)**(1/2)) )
!>
!>  See LAPACK User's Guide section 4.11 or the following references
!>  for more information.
!>
!>  Note that if the default method for computing the Frobenius-norm-
!>  based estimate DIF is not wanted (see CLATDF), then the parameter
!>  IDIFJB (see below) should be changed from 3 to 4 (routine CLATDF
!>  (IJOB = 2 will be used)). See CTGSYL for more details.
!>

Contributors:: Bo Kagstrom and Peter Poromaa, Department of Computing Science, Umea University, S-901 87 Umea, Sweden.

References:: [1] B. Kagstrom; A Direct Method for Reordering Eigenvalues in the Generalized Real Schur Form of a Regular Matrix Pair (A, B), in M.S. Moonen et al (eds), Linear Algebra for Large Scale and Real-Time Applications, Kluwer Academic Publ. 1993, pp 195-218.
[2] B. Kagstrom and P. Poromaa; Computing Eigenspaces with Specified Eigenvalues of a Regular Matrix Pair (A, B) and Condition Estimation: Theory, Algorithms and Software, Report UMINF - 94.04, Department of Computing Science, Umea University, S-901 87 Umea, Sweden, 1994. Also as LAPACK Working Note 87. To appear in Numerical Algorithms, 1996.
[3] B. Kagstrom and P. Poromaa, LAPACK-Style Algorithms and Software for Solving the Generalized Sylvester Equation and Estimating the Separation between Regular Matrix Pairs, Report UMINF - 93.23, Department of Computing Science, Umea University, S-901 87 Umea, Sweden, December 1993, Revised April 1994, Also as LAPACK working Note 75. To appear in ACM Trans. on Math. Software, Vol 22, No 1, 1996.

Definition at line 430 of file ctgsen.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      LOGICAL            WANTQ, WANTZ
      INTEGER            IJOB, INFO, LDA, LDB, LDQ, LDZ, LIWORK, LWORK,
     $                   M, N
      REAL               PL, PR
*     ..
*     .. Array Arguments ..
      LOGICAL            SELECT( * )
      INTEGER            IWORK( * )
      REAL               DIF( * )
      COMPLEX            A( LDA, * ), ALPHA( * ), B( LDB, * ),
     $                   BETA( * ), Q( LDQ, * ), WORK( * ), Z( LDZ, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     IDIFJB is the IJOB value passed to CTGSYL when the
*     Frobenius-norm-based DIF estimates are requested (WANTD1).
      INTEGER            IDIFJB
      parameter( idifjb = 3 )
      REAL               ZERO, ONE
      parameter( zero = 0.0e+0, one = 1.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            LQUERY, SWAP, WANTD, WANTD1, WANTD2, WANTP
      INTEGER            I, IERR, IJB, K, KASE, KS, LIWMIN, LWMIN, MN2,
     $                   N1, N2
      REAL               DSCALE, DSUM, RDSCAL, SAFMIN
      COMPLEX            TEMP1, TEMP2
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Subroutines ..
      REAL               SLAMCH
      EXTERNAL           clacn2, clacpy, classq, cscal, ctgexc, ctgsyl,
     $                   slamch, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, cmplx, conjg, max, sqrt
*     ..
*     .. Executable Statements ..
*
*     Outline of this routine body:
*       1. Check IJOB, N and the leading dimensions.
*       2. Count the .TRUE. entries of SELECT into M and copy the
*          diagonals of A and B into ALPHA and BETA.
*       3. Derive the minimal workspace sizes from IJOB, M and N,
*          report them in WORK(1) and IWORK(1), and return early for
*          a workspace query.
*       4. Quick return when M = 0 or M = N.
*       5. Move the selected diagonal entries to the leading
*          positions with CTGEXC.
*       6. Optionally compute PL and PR (WANTP) and DIF(1:2) (WANTD)
*          from generalized Sylvester solves done by CTGSYL.
*       7. Make the diagonal of B real and nonnegative and store the
*          final ALPHA and BETA.
*
*     Decode and test the input parameters
*
      info = 0
*
*     A value of -1 in either LWORK or LIWORK requests a workspace
*     query.
*
      lquery = ( lwork.EQ.-1 .OR. liwork.EQ.-1 )
*
      IF( ijob.LT.0 .OR. ijob.GT.5 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -5
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -7
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -9
      ELSE IF( ldq.LT.1 .OR. ( wantq .AND. ldq.LT.n ) ) THEN
         info = -13
      ELSE IF( ldz.LT.1 .OR. ( wantz .AND. ldz.LT.n ) ) THEN
         info = -15
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTGSEN', -info )
         RETURN
      END IF
*
      ierr = 0
*
*     WANTP  : PL and PR are requested          (IJOB = 1, 4 or 5).
*     WANTD1 : Frobenius-norm-based DIF(1:2)    (IJOB = 2 or 4).
*     WANTD2 : 1-norm-based DIF(1:2)            (IJOB = 3 or 5).
*
      wantp = ijob.EQ.1 .OR. ijob.GE.4
      wantd1 = ijob.EQ.2 .OR. ijob.EQ.4
      wantd2 = ijob.EQ.3 .OR. ijob.EQ.5
      wantd = wantd1 .OR. wantd2
*
*     Set M to the dimension of the specified pair of deflating
*     subspaces.
*
*     The scan is skipped only for a workspace query with IJOB = 0,
*     in which case M stays 0. Both branches of the inner IF test
*     SELECT(K) (K = N in the ELSE branch).
*
      m = 0
      IF( .NOT.lquery .OR. ijob.NE.0 ) THEN
      DO 10 k = 1, n
         alpha( k ) = a( k, k )
         beta( k ) = b( k, k )
         IF( k.LT.n ) THEN
            IF( SELECT( k ) )
     $         m = m + 1
         ELSE
            IF( SELECT( n ) )
     $         m = m + 1
         END IF
   10 CONTINUE
      END IF
*
*     Minimal workspace sizes as a function of IJOB, M and N.
*
      IF( ijob.EQ.1 .OR. ijob.EQ.2 .OR. ijob.EQ.4 ) THEN
         lwmin = max( 1, 2*m*(n-m) )
         liwmin = max( 1, n+2 )
      ELSE IF( ijob.EQ.3 .OR. ijob.EQ.5 ) THEN
         lwmin = max( 1, 4*m*(n-m) )
         liwmin = max( 1, 2*m*(n-m), n+2 )
      ELSE
         lwmin = 1
         liwmin = 1
      END IF
*
      work( 1 ) = lwmin
      iwork( 1 ) = liwmin
*
      IF( lwork.LT.lwmin .AND. .NOT.lquery ) THEN
         info = -21
      ELSE IF( liwork.LT.liwmin .AND. .NOT.lquery ) THEN
         info = -23
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTGSEN', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible.
*
*     Nothing has to be reordered. PL = PR = 1, and DIF(1:2) is set
*     to DSCALE*SQRT(DSUM), where CLASSQ accumulates DSCALE and DSUM
*     over the first N entries of every column of A and of B.
*
      IF( m.EQ.n .OR. m.EQ.0 ) THEN
         IF( wantp ) THEN
            pl = one
            pr = one
         END IF
         IF( wantd ) THEN
            dscale = zero
            dsum = one
            DO 20 i = 1, n
               CALL classq( n, a( 1, i ), 1, dscale, dsum )
               CALL classq( n, b( 1, i ), 1, dscale, dsum )
   20       CONTINUE
            dif( 1 ) = dscale*sqrt( dsum )
            dif( 2 ) = dif( 1 )
         END IF
         GO TO 70
      END IF
*
*     Get machine constant
*
      safmin = slamch( 'S' )
*
*     Collect the selected blocks at the top-left corner of (A, B).
*
      ks = 0
      DO 30 k = 1, n
         swap = SELECT( k )
         IF( swap ) THEN
            ks = ks + 1
*
*           Swap the K-th block to position KS. Compute unitary Q
*           and Z that will swap adjacent diagonal blocks in (A, B).
*
            IF( k.NE.ks )
     $         CALL ctgexc( wantq, wantz, n, a, lda, b, ldb, q, ldq, z,
     $                      ldz, k, ks, ierr )
*
            IF( ierr.GT.0 ) THEN
*
*              Swap is rejected: exit.
*              The requested outputs are zeroed and the final
*              normalization loop is skipped.
*
               info = 1
               IF( wantp ) THEN
                  pl = zero
                  pr = zero
               END IF
               IF( wantd ) THEN
                  dif( 1 ) = zero
                  dif( 2 ) = zero
               END IF
               GO TO 70
            END IF
         END IF
   30 CONTINUE
      IF( wantp ) THEN
*
*        Solve generalized Sylvester equation for R and L:
*                   A11 * R - L * A22 = A12
*                   B11 * R - L * B22 = B12
*
*        WORK(1:N1*N2) receives a copy of A12 and
*        WORK(N1*N2+1:2*N1*N2) a copy of B12; CTGSYL is given these
*        as its right-hand-side arguments and the remainder of WORK
*        as its workspace.
*
         n1 = m
         n2 = n - m
         i = n1 + 1
         CALL clacpy( 'Full', n1, n2, a( 1, i ), lda, work, n1 )
         CALL clacpy( 'Full', n1, n2, b( 1, i ), ldb, work( n1*n2+1 ),
     $                n1 )
         ijb = 0
         CALL ctgsyl( 'N', ijb, n1, n2, a, lda, a( i, i ), lda, work,
     $                n1, b, ldb, b( i, i ), ldb, work( n1*n2+1 ), n1,
     $                dscale, dif( 1 ), work( n1*n2*2+1 ),
     $                lwork-2*n1*n2, iwork, ierr )
*
*        Estimate the reciprocal of norms of "projections" onto
*        left and right eigenspaces
*
*        With X = RDSCAL*SQRT(DSUM) taken from CLASSQ, the expression
*        below is algebraically DSCALE / SQRT( DSCALE**2 + X**2 ).
*
         rdscal = zero
         dsum = one
         CALL classq( n1*n2, work, 1, rdscal, dsum )
         pl = rdscal*sqrt( dsum )
         IF( pl.EQ.zero ) THEN
            pl = one
         ELSE
            pl = dscale / ( sqrt( dscale*dscale / pl+pl )*sqrt( pl ) )
         END IF
         rdscal = zero
         dsum = one
         CALL classq( n1*n2, work( n1*n2+1 ), 1, rdscal, dsum )
         pr = rdscal*sqrt( dsum )
         IF( pr.EQ.zero ) THEN
            pr = one
         ELSE
            pr = dscale / ( sqrt( dscale*dscale / pr+pr )*sqrt( pr ) )
         END IF
      END IF
      IF( wantd ) THEN
*
*        Compute estimates Difu and Difl.
*
         IF( wantd1 ) THEN
            n1 = m
            n2 = n - m
            i = n1 + 1
            ijb = idifjb
*
*           Frobenius norm-based Difu estimate.
*
            CALL ctgsyl( 'N', ijb, n1, n2, a, lda, a( i, i ), lda, work,
     $                   n1, b, ldb, b( i, i ), ldb, work( n1*n2+1 ),
     $                   n1, dscale, dif( 1 ), work( n1*n2*2+1 ),
     $                   lwork-2*n1*n2, iwork, ierr )
*
*           Frobenius norm-based Difl estimate.
*           Same call with the roles of the (1,1) and (2,2) blocks
*           exchanged.
*
            CALL ctgsyl( 'N', ijb, n2, n1, a( i, i ), lda, a, lda, work,
     $                   n2, b( i, i ), ldb, b, ldb, work( n1*n2+1 ),
     $                   n2, dscale, dif( 2 ), work( n1*n2*2+1 ),
     $                   lwork-2*n1*n2, iwork, ierr )
         ELSE
*
*           Compute 1-norm-based estimates of Difu and Difl using
*           reversed communication with CLACN2. In each step a
*           generalized Sylvester equation or a transposed variant
*           is solved.
*
*           CLACN2 is re-entered until it returns KASE = 0. KASE = 1
*           selects the solve with TRANS = 'N', any other nonzero
*           value the solve with TRANS = 'C'.
*
            kase = 0
            n1 = m
            n2 = n - m
            i = n1 + 1
            ijb = 0
            mn2 = 2*n1*n2
*
*           1-norm-based estimate of Difu.
*
   40       CONTINUE
            CALL clacn2( mn2, work( mn2+1 ), work, dif( 1 ), kase,
     $                   isave )
            IF( kase.NE.0 ) THEN
               IF( kase.EQ.1 ) THEN
*
*                 Solve generalized Sylvester equation
*
                  CALL ctgsyl( 'N', ijb, n1, n2, a, lda, a( i, i ), lda,
     $                         work, n1, b, ldb, b( i, i ), ldb,
     $                         work( n1*n2+1 ), n1, dscale, dif( 1 ),
     $                         work( n1*n2*2+1 ), lwork-2*n1*n2, iwork,
     $                         ierr )
               ELSE
*
*                 Solve the transposed variant.
*
                  CALL ctgsyl( 'C', ijb, n1, n2, a, lda, a( i, i ), lda,
     $                         work, n1, b, ldb, b( i, i ), ldb,
     $                         work( n1*n2+1 ), n1, dscale, dif( 1 ),
     $                         work( n1*n2*2+1 ), lwork-2*n1*n2, iwork,
     $                         ierr )
               END IF
               GO TO 40
            END IF
            dif( 1 ) = dscale / dif( 1 )
*
*           1-norm-based estimate of Difl.
*
   50       CONTINUE
            CALL clacn2( mn2, work( mn2+1 ), work, dif( 2 ), kase,
     $                   isave )
            IF( kase.NE.0 ) THEN
               IF( kase.EQ.1 ) THEN
*
*                 Solve generalized Sylvester equation
*
                  CALL ctgsyl( 'N', ijb, n2, n1, a( i, i ), lda, a, lda,
     $                         work, n2, b( i, i ), ldb, b, ldb,
     $                         work( n1*n2+1 ), n2, dscale, dif( 2 ),
     $                         work( n1*n2*2+1 ), lwork-2*n1*n2, iwork,
     $                         ierr )
               ELSE
*
*                 Solve the transposed variant. The matrix arguments
*                 are the same as in the non-transposed solve above
*                 (the N2-by-N2 block B(I,I) first, then the leading
*                 N1-by-N1 block of B); only TRANS differs.
*
                  CALL ctgsyl( 'C', ijb, n2, n1, a( i, i ), lda, a, lda,
     $                         work, n2, b( i, i ), ldb, b, ldb,
     $                         work( n1*n2+1 ), n2, dscale, dif( 2 ),
     $                         work( n1*n2*2+1 ), lwork-2*n1*n2, iwork,
     $                         ierr )
               END IF
               GO TO 50
            END IF
            dif( 2 ) = dscale / dif( 2 )
         END IF
      END IF
*
*     If B(K,K) is complex, make it real and positive (normalization
*     of the generalized Schur form) and store the generalized
*     eigenvalues of reordered pair (A, B)
*
*     Row K of A and of B is scaled by CONJG( B(K,K) ) / ABS( B(K,K) )
*     and, if WANTQ, column K of Q by B(K,K) / ABS( B(K,K) ). A
*     diagonal entry with ABS( B(K,K) ) <= SAFMIN is set to zero.
*
      DO 60 k = 1, n
         dscale = abs( b( k, k ) )
         IF( dscale.GT.safmin ) THEN
            temp1 = conjg( b( k, k ) / dscale )
            temp2 = b( k, k ) / dscale
            b( k, k ) = dscale
            CALL cscal( n-k, temp1, b( k, k+1 ), ldb )
            CALL cscal( n-k+1, temp1, a( k, k ), lda )
            IF( wantq )
     $         CALL cscal( n, temp2, q( 1, k ), 1 )
         ELSE
            b( k, k ) = cmplx( zero, zero )
         END IF
*
         alpha( k ) = a( k, k )
         beta( k ) = b( k, k )
*
   60 CONTINUE
*
   70 CONTINUE
*
*     Report the minimal workspace sizes on every exit through
*     label 70.
*
      work( 1 ) = lwmin
      iwork( 1 ) = liwmin
*
      RETURN
*
*     End of CTGSEN
*

◆ ctgsja()

subroutine ctgsja	(	character	jobu,
		character	jobv,
		character	jobq,
		integer	m,
		integer	p,
		integer	n,
		integer	k,
		integer	l,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		real	tola,
		real	tolb,
		real, dimension( * )	alpha,
		real, dimension( * )	beta,
		complex, dimension( ldu, * )	u,
		integer	ldu,
		complex, dimension( ldv, * )	v,
		integer	ldv,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		complex, dimension( * )	work,
		integer	ncycle,
		integer	info )

CTGSJA

Download CTGSJA + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTGSJA computes the generalized singular value decomposition (GSVD)
!> of two complex upper triangular (or trapezoidal) matrices A and B.
!>
!> On entry, it is assumed that matrices A and B have the following
!> forms, which may be obtained by the preprocessing subroutine CGGSVP
!> from a general M-by-N matrix A and P-by-N matrix B:
!>
!>              N-K-L  K    L
!>    A =    K ( 0    A12  A13 ) if M-K-L >= 0;
!>           L ( 0     0   A23 )
!>       M-K-L ( 0     0    0  )
!>
!>            N-K-L  K    L
!>    A =  K ( 0    A12  A13 ) if M-K-L < 0;
!>       M-K ( 0     0   A23 )
!>
!>            N-K-L  K    L
!>    B =  L ( 0     0   B13 )
!>       P-L ( 0     0    0  )
!>
!> where the K-by-K matrix A12 and L-by-L matrix B13 are nonsingular
!> upper triangular; A23 is L-by-L upper triangular if M-K-L >= 0,
!> otherwise A23 is (M-K)-by-L upper trapezoidal.
!>
!> On exit,
!>
!>        U**H *A*Q = D1*( 0 R ),    V**H *B*Q = D2*( 0 R ),
!>
!> where U, V and Q are unitary matrices.
!> R is a nonsingular upper triangular matrix, and D1
!> and D2 are ``diagonal'' matrices, which are of the following
!> structures:
!>
!> If M-K-L >= 0,
!>
!>                     K  L
!>        D1 =     K ( I  0 )
!>                 L ( 0  C )
!>             M-K-L ( 0  0 )
!>
!>                    K  L
!>        D2 = L   ( 0  S )
!>             P-L ( 0  0 )
!>
!>                N-K-L  K    L
!>   ( 0 R ) = K (  0   R11  R12 ) K
!>             L (  0    0   R22 ) L
!>
!> where
!>
!>   C = diag( ALPHA(K+1), ... , ALPHA(K+L) ),
!>   S = diag( BETA(K+1),  ... , BETA(K+L) ),
!>   C**2 + S**2 = I.
!>
!>   R is stored in A(1:K+L,N-K-L+1:N) on exit.
!>
!> If M-K-L < 0,
!>
!>                K M-K K+L-M
!>     D1 =   K ( I  0    0   )
!>          M-K ( 0  C    0   )
!>
!>                  K M-K K+L-M
!>     D2 =   M-K ( 0  S    0   )
!>          K+L-M ( 0  0    I   )
!>            P-L ( 0  0    0   )
!>
!>                N-K-L  K   M-K  K+L-M
!> ( 0 R ) =    K ( 0    R11  R12  R13  )
!>           M-K ( 0     0   R22  R23  )
!>         K+L-M ( 0     0    0   R33  )
!>
!> where
!> C = diag( ALPHA(K+1), ... , ALPHA(M) ),
!> S = diag( BETA(K+1),  ... , BETA(M) ),
!> C**2 + S**2 = I.
!>
!> R = ( R11 R12 R13 ) is stored in A(1:M, N-K-L+1:N) and R33 is stored
!>     (  0  R22 R23 )
!> in B(M-K+1:L,N+M-K-L+1:N) on exit.
!>
!> The computation of the unitary transformation matrices U, V or Q
!> is optional.  These matrices may either be formed explicitly, or they
!> may be postmultiplied into input matrices U1, V1, or Q1.
!>

Parameters

[in]	JOBU	!> JOBU is CHARACTER*1 !> = 'U': U must contain a unitary matrix U1 on entry, and !> the product U1*U is returned; !> = 'I': U is initialized to the unit matrix, and the !> unitary matrix U is returned; !> = 'N': U is not computed. !>
[in]	JOBV	!> JOBV is CHARACTER*1 !> = 'V': V must contain a unitary matrix V1 on entry, and !> the product V1*V is returned; !> = 'I': V is initialized to the unit matrix, and the !> unitary matrix V is returned; !> = 'N': V is not computed. !>
[in]	JOBQ	!> JOBQ is CHARACTER*1 !> = 'Q': Q must contain a unitary matrix Q1 on entry, and !> the product Q1*Q is returned; !> = 'I': Q is initialized to the unit matrix, and the !> unitary matrix Q is returned; !> = 'N': Q is not computed. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	P	!> P is INTEGER !> The number of rows of the matrix B. P >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrices A and B. N >= 0. !>
[in]	K	!> K is INTEGER !>
[in]	L	!> L is INTEGER !> !> K and L specify the subblocks in the input matrices A and B: !> A23 = A(K+1:MIN(K+L,M),N-L+1:N) and B13 = B(1:L,N-L+1:N) !> of A and B, whose GSVD is going to be computed by CTGSJA. !> See Further Details. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the M-by-N matrix A. !> On exit, A(1:MIN(K+L,M),N-K-L+1:N) contains the triangular !> matrix R or part of R. See Purpose for details. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,N) !> On entry, the P-by-N matrix B. !> On exit, if necessary, B(M-K+1:L,N+M-K-L+1:N) contains !> a part of R. See Purpose for details. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,P). !>
[in]	TOLA	!> TOLA is REAL !>
[in]	TOLB	!> TOLB is REAL !> !> TOLA and TOLB are the convergence criteria for the Jacobi- !> Kogbetliantz iteration procedure. Generally, they are the !> same as used in the preprocessing step, say !> TOLA = MAX(M,N)*norm(A)*MACHEPS, !> TOLB = MAX(P,N)*norm(B)*MACHEPS. !>
[out]	ALPHA	!> ALPHA is REAL array, dimension (N) !>
[out]	BETA	!> BETA is REAL array, dimension (N) !> !> On exit, ALPHA and BETA contain the generalized singular !> value pairs of A and B; !> ALPHA(1:K) = 1, !> BETA(1:K) = 0, !> and if M-K-L >= 0, !> ALPHA(K+1:K+L) = diag(C), !> BETA(K+1:K+L) = diag(S), !> or if M-K-L < 0, !> ALPHA(K+1:M)= C, ALPHA(M+1:K+L)= 0 !> BETA(K+1:M) = S, BETA(M+1:K+L) = 1. !> Furthermore, if K+L < N, !> ALPHA(K+L+1:N) = 0 !> BETA(K+L+1:N) = 0. !>
[in,out]	U	!> U is COMPLEX array, dimension (LDU,M) !> On entry, if JOBU = 'U', U must contain a matrix U1 (usually !> the unitary matrix returned by CGGSVP). !> On exit, !> if JOBU = 'I', U contains the unitary matrix U; !> if JOBU = 'U', U contains the product U1*U. !> If JOBU = 'N', U is not referenced. !>
[in]	LDU	!> LDU is INTEGER !> The leading dimension of the array U. LDU >= max(1,M) if !> JOBU = 'U' or 'I'; LDU >= 1 otherwise. !>
[in,out]	V	!> V is COMPLEX array, dimension (LDV,P) !> On entry, if JOBV = 'V', V must contain a matrix V1 (usually !> the unitary matrix returned by CGGSVP). !> On exit, !> if JOBV = 'I', V contains the unitary matrix V; !> if JOBV = 'V', V contains the product V1*V. !> If JOBV = 'N', V is not referenced. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of the array V. LDV >= max(1,P) if !> JOBV = 'V' or 'I'; LDV >= 1 otherwise. !>
[in,out]	Q	!> Q is COMPLEX array, dimension (LDQ,N) !> On entry, if JOBQ = 'Q', Q must contain a matrix Q1 (usually !> the unitary matrix returned by CGGSVP). !> On exit, !> if JOBQ = 'I', Q contains the unitary matrix Q; !> if JOBQ = 'Q', Q contains the product Q1*Q. !> If JOBQ = 'N', Q is not referenced. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N) if !> JOBQ = 'Q' or 'I'; LDQ >= 1 otherwise. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	NCYCLE	!> NCYCLE is INTEGER !> The number of cycles required for convergence. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value. !> = 1: the procedure does not converge after MAXIT cycles. !>

Internal Parameters:

!>  MAXIT   INTEGER
!>          MAXIT specifies the total loops that the iterative procedure
!>          may take. If after MAXIT cycles, the routine fails to
!>          converge, we return INFO = 1.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  CTGSJA essentially uses a variant of Kogbetliantz algorithm to reduce
!>  min(L,M-K)-by-L triangular (or trapezoidal) matrix A23 and L-by-L
!>  matrix B13 to the form:
!>
!>           U1**H *A23*Q1 = C1*R1; V1**H *B13*Q1 = S1*R1,
!>
!>  where U1, V1 and Q1 are unitary matrices.
!>  C1 and S1 are diagonal matrices satisfying
!>
!>                C1**2 + S1**2 = I,
!>
!>  and R1 is an L-by-L nonsingular upper triangular matrix.
!>

Definition at line 376 of file ctgsja.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          JOBQ, JOBU, JOBV
      INTEGER            INFO, K, L, LDA, LDB, LDQ, LDU, LDV, M, N,
     $                   NCYCLE, P
      REAL               TOLA, TOLB
*     ..
*     .. Array Arguments ..
      REAL               ALPHA( * ), BETA( * )
      COMPLEX            A( LDA, * ), B( LDB, * ), Q( LDQ, * ),
     $                   U( LDU, * ), V( LDV, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     MAXIT bounds the number of sweeps of the cycle loop.
      INTEGER            MAXIT
      parameter( maxit = 40 )
      REAL               ZERO, ONE, HUGENUM
      parameter( zero = 0.0e+0, one = 1.0e+0 )
      COMPLEX            CZERO, CONE
      parameter( czero = ( 0.0e+0, 0.0e+0 ),
     $                   cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
*
*     IROW/JROW are the rows K+I and K+J of A, ICOL/JCOL the columns
*     N-L+I and N-L+J, LCOL1 the column N-L+1. HASI/HASJ tell
*     whether rows K+I and K+J lie inside the M rows of A.
*
      LOGICAL            HASI, HASJ, INITQ, INITU, INITV, UPPER, WANTQ,
     $                   WANTU, WANTV
      INTEGER            I, ICOL, IROW, J, JCOL, JROW, KCYCLE, LCOL1,
     $                   NTAIL
      REAL               A1, A3, B1, B3, CSQ, CSU, CSV, DEVMAX, RATIO,
     $                   RTMP, SMIN
      COMPLEX            A2, B2, SNQ, SNU, SNV
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           ccopy, clags2, clapll, claset, crot, csscal,
     $                   slartg, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, conjg, max, min, real, huge
      parameter( hugenum = huge(zero) )
*     ..
*     .. Executable Statements ..
*
*     Decode the job options. The 'I' option both initializes and
*     accumulates, so each WANTx flag is also set when INITx is.
*
      initu = lsame( jobu, 'I' )
      initv = lsame( jobv, 'I' )
      initq = lsame( jobq, 'I' )
      wantu = initu .OR. lsame( jobu, 'U' )
      wantv = initv .OR. lsame( jobv, 'V' )
      wantq = initq .OR. lsame( jobq, 'Q' )
*
*     Test the input parameters; INFO = -i marks the first argument
*     found to be illegal.
*
      info = 0
      IF( .NOT.( wantu .OR. lsame( jobu, 'N' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( wantv .OR. lsame( jobv, 'N' ) ) ) THEN
         info = -2
      ELSE IF( .NOT.( wantq .OR. lsame( jobq, 'N' ) ) ) THEN
         info = -3
      ELSE IF( m.LT.0 ) THEN
         info = -4
      ELSE IF( p.LT.0 ) THEN
         info = -5
      ELSE IF( n.LT.0 ) THEN
         info = -6
      ELSE IF( lda.LT.1 .OR. lda.LT.m ) THEN
         info = -10
      ELSE IF( ldb.LT.1 .OR. ldb.LT.p ) THEN
         info = -12
      ELSE IF( ldu.LT.1 .OR. ( wantu .AND. ldu.LT.m ) ) THEN
         info = -18
      ELSE IF( ldv.LT.1 .OR. ( wantv .AND. ldv.LT.p ) ) THEN
         info = -20
      ELSE IF( ldq.LT.1 .OR. ( wantq .AND. ldq.LT.n ) ) THEN
         info = -22
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTGSJA', -info )
         RETURN
      END IF
*
*     Start U, V and Q from the identity when the 'I' option is set.
*
      IF( initu ) THEN
         CALL claset( 'Full', m, m, czero, cone, u, ldu )
      END IF
      IF( initv ) THEN
         CALL claset( 'Full', p, p, czero, cone, v, ldv )
      END IF
      IF( initq ) THEN
         CALL claset( 'Full', n, n, czero, cone, q, ldq )
      END IF
*
*     Cycle loop. UPPER alternates on every cycle, starting with
*     .TRUE.; convergence is tested only after a cycle that ran with
*     UPPER = .FALSE..
*
      lcol1 = n - l + 1
      upper = .false.
      DO kcycle = 1, maxit
*
         upper = .NOT.upper
*
         DO i = 1, l - 1
            irow = k + i
            icol = n - l + i
            hasi = irow.LE.m
            DO j = i + 1, l
               jrow = k + j
               jcol = n - l + j
               hasj = jrow.LE.m
*
*              Gather the 2-by-2 entries of A and B for the pivot
*              pair (I,J). Entries of A in rows beyond M are taken
*              as zero.
*
               IF( hasi ) THEN
                  a1 = real( a( irow, icol ) )
               ELSE
                  a1 = zero
               END IF
               IF( hasj ) THEN
                  a3 = real( a( jrow, jcol ) )
               ELSE
                  a3 = zero
               END IF
               b1 = real( b( i, icol ) )
               b3 = real( b( j, jcol ) )
*
               a2 = czero
               IF( upper ) THEN
                  IF( hasi ) a2 = a( irow, jcol )
                  b2 = b( i, jcol )
               ELSE
                  IF( hasj ) a2 = a( jrow, icol )
                  b2 = b( j, icol )
               END IF
*
               CALL clags2( upper, a1, a2, a3, b1, b2, b3, csu, snu,
     $                      csv, snv, csq, snq )
*
*              Rows K+I and K+J of A: U**H *A
*
               IF( hasj ) THEN
                  CALL crot( l, a( jrow, lcol1 ), lda,
     $                       a( irow, lcol1 ), lda, csu,
     $                       conjg( snu ) )
               END IF
*
*              Rows I and J of B: V**H *B
*
               CALL crot( l, b( j, lcol1 ), ldb, b( i, lcol1 ), ldb,
     $                    csv, conjg( snv ) )
*
*              Columns N-L+I and N-L+J of A and B: A*Q and B*Q
*
               CALL crot( min( k+l, m ), a( 1, jcol ), 1,
     $                    a( 1, icol ), 1, csq, snq )
               CALL crot( l, b( 1, jcol ), 1, b( 1, icol ), 1, csq,
     $                    snq )
*
*              Set the off-diagonal entry of the pivot pair to zero.
*
               IF( upper ) THEN
                  IF( hasi ) a( irow, jcol ) = czero
                  b( i, jcol ) = czero
               ELSE
                  IF( hasj ) a( jrow, icol ) = czero
                  b( j, icol ) = czero
               END IF
*
*              Drop the imaginary parts of the diagonal entries.
*
               IF( hasi ) a( irow, icol ) = real( a( irow, icol ) )
               IF( hasj ) a( jrow, jcol ) = real( a( jrow, jcol ) )
               b( i, icol ) = real( b( i, icol ) )
               b( j, jcol ) = real( b( j, jcol ) )
*
*              Apply the same rotations to U, V and Q when wanted.
*
               IF( wantu .AND. hasj ) THEN
                  CALL crot( m, u( 1, jrow ), 1, u( 1, irow ), 1, csu,
     $                       snu )
               END IF
               IF( wantv ) THEN
                  CALL crot( p, v( 1, j ), 1, v( 1, i ), 1, csv, snv )
               END IF
               IF( wantq ) THEN
                  CALL crot( n, q( 1, jcol ), 1, q( 1, icol ), 1, csq,
     $                       snq )
               END IF
*
            END DO
         END DO
*
         IF( .NOT.upper ) THEN
*
*           Convergence test: for each row I, the trailing parts of
*           row K+I of A and row I of B are copied into the two
*           halves of WORK and handed to CLAPLL; DEVMAX keeps the
*           largest SMIN returned.
*
            devmax = zero
            DO i = 1, min( l, m-k )
               ntail = l - i + 1
               CALL ccopy( ntail, a( k+i, n-l+i ), lda, work, 1 )
               CALL ccopy( ntail, b( i, n-l+i ), ldb, work( l+1 ), 1 )
               CALL clapll( ntail, work, 1, work( l+1 ), 1, smin )
               devmax = max( devmax, smin )
            END DO
*
            IF( abs( devmax ).LE.min( tola, tolb ) ) GO TO 50
         END IF
*
      END DO
*
*     All MAXIT cycles ran without meeting the tolerance.
*
      info = 1
      GO TO 100
*
   50 CONTINUE
*
*     Converged: fill ALPHA and BETA and store the rows of the
*     triangular matrix R in A.
*
      DO i = 1, k
         alpha( i ) = one
         beta( i ) = zero
      END DO
*
      DO i = 1, min( l, m-k )
         irow = k + i
         icol = n - l + i
         ntail = l - i + 1
*
         a1 = real( a( irow, icol ) )
         b1 = real( b( i, icol ) )
         ratio = b1 / a1
*
*        The test is true only when RATIO lies within
*        [-HUGENUM, HUGENUM]; any other value takes the ELSE branch.
*
         IF( (ratio.LE.hugenum).AND.(ratio.GE.-hugenum) ) THEN
*
*           Flip the sign of row I of B (and column I of V) when
*           RATIO is negative.
*
            IF( ratio.LT.zero ) THEN
               CALL csscal( ntail, -one, b( i, icol ), ldb )
               IF( wantv ) CALL csscal( p, -one, v( 1, i ), 1 )
            END IF
*
            CALL slartg( abs( ratio ), one, beta( irow ),
     $                   alpha( irow ), rtmp )
*
*           Scale by the reciprocal of the larger of ALPHA and BETA;
*           in the BETA case the scaled row of B is copied into A.
*
            IF( alpha( irow ).GE.beta( irow ) ) THEN
               CALL csscal( ntail, one / alpha( irow ),
     $                      a( irow, icol ), lda )
            ELSE
               CALL csscal( ntail, one / beta( irow ), b( i, icol ),
     $                      ldb )
               CALL ccopy( ntail, b( i, icol ), ldb, a( irow, icol ),
     $                     lda )
            END IF
*
         ELSE
            alpha( irow ) = zero
            beta( irow ) = one
            CALL ccopy( ntail, b( i, icol ), ldb, a( irow, icol ),
     $                  lda )
         END IF
      END DO
*
*     Post-assignment of the remaining entries of ALPHA and BETA.
*
      DO i = m + 1, k + l
         alpha( i ) = zero
         beta( i ) = one
      END DO
*
      DO i = k + l + 1, n
         alpha( i ) = zero
         beta( i ) = zero
      END DO
*
  100 CONTINUE
*
*     NCYCLE receives the cycle-loop counter: the cycle at which the
*     convergence test succeeded, or MAXIT+1 when the loop ran to
*     completion.
*
      ncycle = kcycle
*
      RETURN
*
*     End of CTGSJA
*

◆ ctgsna()

subroutine ctgsna	(	character	job,
		character	howmny,
		logical, dimension( * )	select,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldvl, * )	vl,
		integer	ldvl,
		complex, dimension( ldvr, * )	vr,
		integer	ldvr,
		real, dimension( * )	s,
		real, dimension( * )	dif,
		integer	mm,
		integer	m,
		complex, dimension( * )	work,
		integer	lwork,
		integer, dimension( * )	iwork,
		integer	info )

CTGSNA

Download CTGSNA + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTGSNA estimates reciprocal condition numbers for specified
!> eigenvalues and/or eigenvectors of a matrix pair (A, B).
!>
!> (A, B) must be in generalized Schur canonical form, that is, A and
!> B are both upper triangular.
!>

Parameters

[in]	JOB	!> JOB is CHARACTER*1 !> Specifies whether condition numbers are required for !> eigenvalues (S) or eigenvectors (DIF): !> = 'E': for eigenvalues only (S); !> = 'V': for eigenvectors only (DIF); !> = 'B': for both eigenvalues and eigenvectors (S and DIF). !>
[in]	HOWMNY	!> HOWMNY is CHARACTER*1 !> = 'A': compute condition numbers for all eigenpairs; !> = 'S': compute condition numbers for selected eigenpairs !> specified by the array SELECT. !>
[in]	SELECT	!> SELECT is LOGICAL array, dimension (N) !> If HOWMNY = 'S', SELECT specifies the eigenpairs for which !> condition numbers are required. To select condition numbers !> for the corresponding j-th eigenvalue and/or eigenvector, !> SELECT(j) must be set to .TRUE.. !> If HOWMNY = 'A', SELECT is not referenced. !>
[in]	N	!> N is INTEGER !> The order of the square matrix pair (A, B). N >= 0. !>
[in]	A	!> A is COMPLEX array, dimension (LDA,N) !> The upper triangular matrix A in the pair (A,B). !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[in]	B	!> B is COMPLEX array, dimension (LDB,N) !> The upper triangular matrix B in the pair (A, B). !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[in]	VL	!> VL is COMPLEX array, dimension (LDVL,M) !> IF JOB = 'E' or 'B', VL must contain left eigenvectors of !> (A, B), corresponding to the eigenpairs specified by HOWMNY !> and SELECT. The eigenvectors must be stored in consecutive !> columns of VL, as returned by CTGEVC. !> If JOB = 'V', VL is not referenced. !>
[in]	LDVL	!> LDVL is INTEGER !> The leading dimension of the array VL. LDVL >= 1; and !> If JOB = 'E' or 'B', LDVL >= N. !>
[in]	VR	!> VR is COMPLEX array, dimension (LDVR,M) !> IF JOB = 'E' or 'B', VR must contain right eigenvectors of !> (A, B), corresponding to the eigenpairs specified by HOWMNY !> and SELECT. The eigenvectors must be stored in consecutive !> columns of VR, as returned by CTGEVC. !> If JOB = 'V', VR is not referenced. !>
[in]	LDVR	!> LDVR is INTEGER !> The leading dimension of the array VR. LDVR >= 1; !> If JOB = 'E' or 'B', LDVR >= N. !>
[out]	S	!> S is REAL array, dimension (MM) !> If JOB = 'E' or 'B', the reciprocal condition numbers of the !> selected eigenvalues, stored in consecutive elements of the !> array. !> If JOB = 'V', S is not referenced. !>
[out]	DIF	!> DIF is REAL array, dimension (MM) !> If JOB = 'V' or 'B', the estimated reciprocal condition !> numbers of the selected eigenvectors, stored in consecutive !> elements of the array. !> If the eigenvalues cannot be reordered to compute DIF(j), !> DIF(j) is set to 0; this can only occur when the true value !> would be very small anyway. !> For each eigenvalue/vector specified by SELECT, DIF stores !> a Frobenius norm-based estimate of Difl. !> If JOB = 'E', DIF is not referenced. !>
[in]	MM	!> MM is INTEGER !> The number of elements in the arrays S and DIF. MM >= M. !>
[out]	M	!> M is INTEGER !> The number of elements of the arrays S and DIF used to store !> the specified condition numbers; for each selected eigenvalue !> one element is used. If HOWMNY = 'A', M is set to N. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,N). !> If JOB = 'V' or 'B', LWORK >= max(1,2*N*N). !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (N+2) !> If JOB = 'E', IWORK is not referenced. !>
[out]	INFO	!> INFO is INTEGER !> = 0: Successful exit !> < 0: If INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The reciprocal of the condition number of the i-th generalized
!>  eigenvalue w = (a, b) is defined as
!>
!>          S(I) = (|v**HAu|**2 + |v**HBu|**2)**(1/2) / (norm(u)*norm(v))
!>
!>  where u and v are the right and left eigenvectors of (A, B)
!>  corresponding to w; |z| denotes the absolute value of the complex
!>  number, and norm(u) denotes the 2-norm of the vector u. The pair
!>  (a, b) corresponds to an eigenvalue w = a/b (= v**HAu/v**HBu) of the
!>  matrix pair (A, B). If both a and b equal zero, then (A,B) is
!>  singular and S(I) = -1 is returned.
!>
!>  An approximate error bound on the chordal distance between the i-th
!>  computed generalized eigenvalue w and the corresponding exact
!>  eigenvalue lambda is
!>
!>          chord(w, lambda) <=   EPS * norm(A, B) / S(I),
!>
!>  where EPS is the machine precision.
!>
!>  The reciprocal of the condition number of the right eigenvector u
!>  and left eigenvector v corresponding to the generalized eigenvalue w
!>  is defined as follows. Suppose
!>
!>                   (A, B) = ( a   *  ) ( b  *  )  1
!>                            ( 0  A22 ),( 0 B22 )  n-1
!>                              1  n-1     1 n-1
!>
!>  Then the reciprocal condition number DIF(I) is
!>
!>          Difl[(a, b), (A22, B22)]  = sigma-min( Zl )
!>
!>  where sigma-min(Zl) denotes the smallest singular value of
!>
!>         Zl = [ kron(a, In-1) -kron(1, A22) ]
!>              [ kron(b, In-1) -kron(1, B22) ].
!>
!>  Here In-1 is the identity matrix of size n-1 and X**H is the conjugate
!>  transpose of X. kron(X, Y) is the Kronecker product between the
!>  matrices X and Y.
!>
!>  We approximate the smallest singular value of Zl with an upper
!>  bound. This is done by CLATDF.
!>
!>  An approximate error bound for a computed eigenvector VL(i) or
!>  VR(i) is given by
!>
!>                      EPS * norm(A, B) / DIF(i).
!>
!>  See ref. [2-3] for more details and further references.
!>

Contributors:: Bo Kagstrom and Peter Poromaa, Department of Computing Science, Umea University, S-901 87 Umea, Sweden.

References:

!>
!>  [1] B. Kagstrom; A Direct Method for Reordering Eigenvalues in the
!>      Generalized Real Schur Form of a Regular Matrix Pair (A, B), in
!>      M.S. Moonen et al (eds), Linear Algebra for Large Scale and
!>      Real-Time Applications, Kluwer Academic Publ. 1993, pp 195-218.
!>
!>  [2] B. Kagstrom and P. Poromaa; Computing Eigenspaces with Specified
!>      Eigenvalues of a Regular Matrix Pair (A, B) and Condition
!>      Estimation: Theory, Algorithms and Software, Report
!>      UMINF - 94.04, Department of Computing Science, Umea University,
!>      S-901 87 Umea, Sweden, 1994. Also as LAPACK Working Note 87.
!>      To appear in Numerical Algorithms, 1996.
!>
!>  [3] B. Kagstrom and P. Poromaa, LAPACK-Style Algorithms and Software
!>      for Solving the Generalized Sylvester Equation and Estimating the
!>      Separation between Regular Matrix Pairs, Report UMINF - 93.23,
!>      Department of Computing Science, Umea University, S-901 87 Umea,
!>      Sweden, December 1993, Revised April 1994, Also as LAPACK Working
!>      Note 75.
!>      To appear in ACM Trans. on Math. Software, Vol 22, No 1, 1996.
!>

Definition at line 308 of file ctgsna.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          HOWMNY, JOB
      INTEGER            INFO, LDA, LDB, LDVL, LDVR, LWORK, M, MM, N
*     ..
*     .. Array Arguments ..
      LOGICAL            SELECT( * )
      INTEGER            IWORK( * )
      REAL               DIF( * ), S( * )
      COMPLEX            A( LDA, * ), B( LDB, * ), VL( LDVL, * ),
     $                   VR( LDVR, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE
      INTEGER            IDIFJB
      PARAMETER          ( zero = 0.0e+0, one = 1.0e+0, idifjb = 3 )
*     ..
*     .. Local Scalars ..
      LOGICAL            DOBOTH, DODIF, DOEIG, PICKED, WSQRY
      INTEGER            IDST, IERR, ISRC, JA21, JA22, JB11, JB21,
     $                   JB22, JP, LWNEED, NOUT
      REAL               BIG, SCL, SMALL, ULP, UNORM, VNORM, WABS
      COMPLEX            CONE, CZERO, VHAU, VHBU
*     ..
*     .. Local Arrays ..
      COMPLEX            CDUM1( 1 ), CDUM2( 1 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SCNRM2, SLAMCH, SLAPY2
      COMPLEX            CDOTC
      EXTERNAL           lsame, scnrm2, slamch, slapy2, cdotc
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgemv, clacpy, ctgexc, ctgsyl, slabad, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, cmplx, count, max
*     ..
*     .. Executable Statements ..
*
*     Translate JOB and HOWMNY into flags.  DOEIG requests the
*     eigenvalue numbers (S), DODIF the eigenvector numbers (DIF).
*
      doboth = lsame( job, 'B' )
      doeig = doboth .OR. lsame( job, 'E' )
      dodif = doboth .OR. lsame( job, 'V' )
      picked = lsame( howmny, 'S' )
      wsqry = ( lwork.EQ.-1 )
*
*     Argument checks; the first offending argument determines INFO.
*
      info = 0
      IF( .NOT.( doeig .OR. dodif ) ) THEN
         info = -1
      ELSE IF( .NOT.( picked .OR. lsame( howmny, 'A' ) ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -6
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -8
      ELSE IF( doeig .AND. ldvl.LT.n ) THEN
         info = -10
      ELSE IF( doeig .AND. ldvr.LT.n ) THEN
         info = -12
      END IF
*
      IF( info.EQ.0 ) THEN
*
*        M is the number of eigenpairs to be processed: the number of
*        .TRUE. entries among SELECT(1:N), or N when all are wanted.
*
         IF( picked ) THEN
            m = count( SELECT( 1:n ) )
         ELSE
            m = n
         END IF
*
*        Workspace requirement, reported in WORK(1).
*
         IF( n.EQ.0 ) THEN
            lwneed = 1
         ELSE IF( dodif ) THEN
            lwneed = 2*n*n
         ELSE
            lwneed = n
         END IF
         work( 1 ) = lwneed
*
         IF( mm.LT.m ) THEN
            info = -15
         ELSE IF( lwork.LT.lwneed .AND. .NOT.wsqry ) THEN
            info = -18
         END IF
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTGSNA', -info )
         RETURN
      END IF
*
*     Nothing more to do for a workspace query or an empty problem.
*
      IF( wsqry .OR. n.EQ.0 )
     $   RETURN
*
*     Machine constants
*
      ulp = slamch( 'P' )
      small = slamch( 'S' ) / ulp
      big = one / small
      CALL slabad( small, big )
*
      cone = cmplx( one, zero )
      czero = cmplx( zero, zero )
*
*     Offsets into WORK used by the DIF estimate.  WORK holds a copy
*     of A in its first N*N entries and a copy of B in the next N*N,
*     both with leading dimension N.  JA21/JA22 address entries (2,1)
*     and (2,2) of the first copy; JB11/JB21/JB22 address entries
*     (1,1), (2,1) and (2,2) of the second copy.
*
      IF( dodif ) THEN
         ja21 = 2
         ja22 = n + 2
         jb11 = n*n + 1
         jb21 = jb11 + 1
         jb22 = jb11 + n + 1
      END IF
*
*     NOUT counts the eigenpairs handled so far and is the position
*     written in S and DIF (and the column read from VL and VR).
*
      nout = 0
      DO jp = 1, n
*
*        Skip eigenpairs that were not selected.  SELECT is only
*        examined when HOWMNY = 'S'.
*
         IF( picked ) THEN
            IF( .NOT.SELECT( jp ) )
     $         cycle
         END IF
         nout = nout + 1
*
         IF( doeig ) THEN
*
*           Reciprocal condition number of the eigenvalue: combine
*           the inner products of column NOUT of VL with A*u and B*u,
*           u being column NOUT of VR, and divide by the product of
*           the two vector norms.  A vanishing numerator gives -1.
*
            unorm = scnrm2( n, vr( 1, nout ), 1 )
            vnorm = scnrm2( n, vl( 1, nout ), 1 )
            CALL cgemv( 'N', n, n, cone, a, lda, vr( 1, nout ), 1,
     $                  czero, work, 1 )
            vhau = cdotc( n, work, 1, vl( 1, nout ), 1 )
            CALL cgemv( 'N', n, n, cone, b, ldb, vr( 1, nout ), 1,
     $                  czero, work, 1 )
            vhbu = cdotc( n, work, 1, vl( 1, nout ), 1 )
            wabs = slapy2( abs( vhau ), abs( vhbu ) )
            IF( wabs.EQ.zero ) THEN
               s( nout ) = -one
            ELSE
               s( nout ) = wabs / ( unorm*vnorm )
            END IF
         END IF
*
         IF( .NOT.dodif )
     $      cycle
*
         IF( n.EQ.1 ) THEN
*
*           Order one: DIF comes directly from the single pair.
*
            dif( nout ) = slapy2( abs( a( 1, 1 ) ),
     $                            abs( b( 1, 1 ) ) )
            cycle
         END IF
*
*        Copy (A, B) into WORK and ask CTGEXC to move the pair at
*        position JP to position 1.
*
         CALL clacpy( 'Full', n, n, a, lda, work, n )
         CALL clacpy( 'Full', n, n, b, ldb, work( jb11 ), n )
         isrc = jp
         idst = 1
         CALL ctgexc( .false., .false., n, work, n, work( jb11 ), n,
     $                cdum1, 1, cdum2, 1, isrc, idst, ierr )
*
         IF( ierr.GT.0 ) THEN
*
*           Ill-conditioned problem - swap rejected.
*
            dif( nout ) = zero
         ELSE
*
*           Reordering successful: solve the generalized Sylvester
*           equation for R and L,
*                      A22 * R - L * A11 = A12
*                      B22 * R - L * B11 = B12,
*           and let CTGSYL return the estimate of
*           Difl[(A11,B11), (A22, B22)] in DIF(NOUT).
*
            CALL ctgsyl( 'N', idifjb, n-1, 1, work( ja22 ), n,
     $                   work, n, work( ja21 ), n, work( jb22 ), n,
     $                   work( jb11 ), n, work( jb21 ), n, scl,
     $                   dif( nout ), cdum1, 1, iwork, ierr )
         END IF
*
      END DO
*
      work( 1 ) = lwneed
      RETURN
*
*     End of CTGSNA
*

◆ ctpcon()

subroutine ctpcon	(	character	norm,
		character	uplo,
		character	diag,
		integer	n,
		complex, dimension( * )	ap,
		real	rcond,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CTPCON

Download CTPCON + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTPCON estimates the reciprocal of the condition number of a packed
!> triangular matrix A, in either the 1-norm or the infinity-norm.
!>
!> The norm of A is computed and an estimate is obtained for
!> norm(inv(A)), then the reciprocal of the condition number is
!> computed as
!>    RCOND = 1 / ( norm(A) * norm(inv(A)) ).
!>

Parameters

[in]	NORM	!> NORM is CHARACTER*1 !> Specifies whether the 1-norm condition number or the !> infinity-norm condition number is required: !> = '1' or 'O': 1-norm; !> = 'I': Infinity-norm. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> = 'N': A is non-unit triangular; !> = 'U': A is unit triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The upper or lower triangular matrix A, packed columnwise in !> a linear array. The j-th column of A is stored in the array !> AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !> If DIAG = 'U', the diagonal elements of A are not referenced !> and are assumed to be 1. !>
[out]	RCOND	!> RCOND is REAL !> The reciprocal of the condition number of the matrix A, !> computed as RCOND = 1/(norm(A) * norm(inv(A))). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 128 of file ctpcon.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, NORM, UPLO
      INTEGER            INFO, N
      REAL               RCOND
*     ..
*     .. Array Arguments ..
      REAL               RWORK( * )
      COMPLEX            AP( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      PARAMETER          ( one = 1.0e+0, zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            NONUNI, UPTRI, USEONE
      CHARACTER          CNREDY
      INTEGER            IBIG, KDIR, KREQ
      REAL               ANRM, ESTINV, SCL, TINYN, XBIG
*     ..
*     .. Local Arrays ..
      INTEGER            ISTATE( 3 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ICAMAX
      REAL               CLANTP, SLAMCH
      EXTERNAL           lsame, icamax, clantp, slamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           clacn2, clatps, csrscl, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, real
*     ..
*     .. Executable Statements ..
*
*     Decode the option characters and validate the arguments; the
*     first offending argument determines INFO.
*
      info = 0
      uptri = lsame( uplo, 'U' )
      useone = norm.EQ.'1' .OR. lsame( norm, 'O' )
      nonuni = lsame( diag, 'N' )
*
      IF( .NOT.( useone .OR. lsame( norm, 'I' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( uptri .OR. lsame( uplo, 'L' ) ) ) THEN
         info = -2
      ELSE IF( .NOT.( nonuni .OR. lsame( diag, 'U' ) ) ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTPCON', -info )
         RETURN
      END IF
*
*     An empty matrix is reported as perfectly conditioned.
*
      IF( n.EQ.0 ) THEN
         rcond = one
         RETURN
      END IF
*
*     RCOND stays zero on every early exit below.
*
      rcond = zero
      tinyn = slamch( 'Safe minimum' )*real( max( 1, n ) )
*
*     Norm of the triangular matrix A.
*
      anrm = clantp( norm, uplo, diag, n, ap, rwork )
*
*     Continue only if the norm is strictly positive.
*
      IF( .NOT.( anrm.GT.zero ) )
     $   RETURN
*
*     Estimate the norm of inv(A).  KDIR is the CLACN2 request code
*     that is answered with a solve against A itself; any other
*     nonzero request is answered with a solve against A**H.
*
      estinv = zero
      cnredy = 'N'
      kdir = 2
      IF( useone )
     $   kdir = 1
      kreq = 0
      DO
         CALL clacn2( n, work( n+1 ), work, estinv, kreq, istate )
*
*        A zero request code ends the iteration.
*
         IF( kreq.EQ.0 )
     $      EXIT
*
         IF( kreq.EQ.kdir ) THEN
*
*           Multiply by inv(A).
*
            CALL clatps( uplo, 'No transpose', diag, cnredy, n, ap,
     $                   work, scl, rwork, info )
         ELSE
*
*           Multiply by inv(A**H).
*
            CALL clatps( uplo, 'Conjugate transpose', diag, cnredy,
     $                   n, ap, work, scl, rwork, info )
         END IF
*
*        Every CLATPS call after the first one is made with 'Y'.
*
         cnredy = 'Y'
*
*        Multiply by 1/SCL if doing so will not cause overflow;
*        otherwise give up and leave RCOND at zero.
*
         IF( scl.NE.one ) THEN
            ibig = icamax( n, work, 1 )
            xbig = abs( real( work( ibig ) ) ) +
     $             abs( aimag( work( ibig ) ) )
            IF( scl.LT.xbig*tinyn .OR. scl.EQ.zero )
     $         RETURN
            CALL csrscl( n, scl, work, 1 )
         END IF
      END DO
*
*     Compute the estimate of the reciprocal condition number.
*
      IF( estinv.NE.zero )
     $   rcond = ( one / anrm ) / estinv
*
      RETURN
*
*     End of CTPCON
*

◆ ctpmqrt()

subroutine ctpmqrt	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	k,
		integer	l,
		integer	nb,
		complex, dimension( ldv, * )	v,
		integer	ldv,
		complex, dimension( ldt, * )	t,
		integer	ldt,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( * )	work,
		integer	info )

CTPMQRT

Download CTPMQRT + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTPMQRT applies a complex unitary matrix Q obtained from a
!>  complex block reflector H to a general
!> complex matrix C, which consists of two blocks A and B.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left; !> = 'R': apply Q or Q**H from the Right. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': No transpose, apply Q; !> = 'C': Conjugate transpose, apply Q**H. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix B. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix B. N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines !> the matrix Q. !>
[in]	L	!> L is INTEGER !> The order of the trapezoidal part of V. !> K >= L >= 0. See Further Details. !>
[in]	NB	!> NB is INTEGER !> The block size used for the storage of T. K >= NB >= 1. !> This must be the same value of NB used to generate T !> in CTPQRT. !>
[in]	V	!> V is COMPLEX array, dimension (LDV,K) !> The i-th column must contain the vector which defines the !> elementary reflector H(i), for i = 1,2,...,k, as returned by !> CTPQRT in B. See Further Details. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of the array V. !> If SIDE = 'L', LDV >= max(1,M); !> if SIDE = 'R', LDV >= max(1,N). !>
[in]	T	!> T is COMPLEX array, dimension (LDT,K) !> The upper triangular factors of the block reflectors !> as returned by CTPQRT, stored as a NB-by-K matrix. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= NB. !>
[in,out]	A	!> A is COMPLEX array, dimension !> (LDA,N) if SIDE = 'L' or !> (LDA,K) if SIDE = 'R' !> On entry, the K-by-N or M-by-K matrix A. !> On exit, A is overwritten by the corresponding block of !> Q*C or Q**H*C or C*Q or C*Q**H. See Further Details. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. !> If SIDE = 'L', LDA >= max(1,K); !> If SIDE = 'R', LDA >= max(1,M). !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,N) !> On entry, the M-by-N matrix B. !> On exit, B is overwritten by the corresponding block of !> Q*C or Q**H*C or C*Q or C*Q**H. See Further Details. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. !> LDB >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array. The dimension of WORK is !> N*NB if SIDE = 'L', or M*NB if SIDE = 'R'. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The columns of the pentagonal matrix V contain the elementary reflectors
!>  H(1), H(2), ..., H(K); V is composed of a rectangular block V1 and a
!>  trapezoidal block V2:
!>
!>        V = [V1]
!>            [V2].
!>
!>  The size of the trapezoidal block V2 is determined by the parameter L,
!>  where 0 <= L <= K; V2 is upper trapezoidal, consisting of the first L
!>  rows of a K-by-K upper triangular matrix.  If L=K, V2 is upper triangular;
!>  if L=0, there is no trapezoidal block, hence V = V1 is rectangular.
!>
!>  If SIDE = 'L':  C = [A]  where A is K-by-N,  B is M-by-N and V is M-by-K.
!>                      [B]
!>
!>  If SIDE = 'R':  C = [A B]  where A is M-by-K, B is M-by-N and V is N-by-K.
!>
!>  The complex unitary matrix Q is formed from V and T.
!>
!>  If TRANS='N' and SIDE='L', C is on exit replaced with Q * C.
!>
!>  If TRANS='C' and SIDE='L', C is on exit replaced with Q**H * C.
!>
!>  If TRANS='N' and SIDE='R', C is on exit replaced with C * Q.
!>
!>  If TRANS='C' and SIDE='R', C is on exit replaced with C * Q**H.
!>

Definition at line 214 of file ctpmqrt.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            INFO, K, L, LDA, LDB, LDT, LDV, M, N, NB
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), B( LDB, * ), T( LDT, * ),
     $                   V( LDV, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     ..
*     .. Local Scalars ..
      LOGICAL            APLEFT, APRGHT, ASCEND, CONJQ, PLAINQ
      CHARACTER          OPQ
      INTEGER            JB, JFIRST, JLAST, JSTEP, KB, LDAMIN, LTRAP,
     $                   NROWV, NVB
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           ctprfb, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Decode SIDE and TRANS.
*
      info = 0
      apleft = lsame( side, 'L' )
      aprght = lsame( side, 'R' )
      conjq = lsame( trans, 'C' )
      plainq = lsame( trans, 'N' )
*
*     NROWV is the dimension whose maximum with 1 bounds LDV from
*     below (M from the left, N from the right); LDAMIN is the lower
*     bound on LDA for the chosen side.  For an invalid SIDE these
*     values are never consulted because INFO = -1 is raised first.
*
      IF( apleft ) THEN
         nrowv = m
         ldamin = max( 1, k )
      ELSE
         nrowv = n
         ldamin = max( 1, m )
      END IF
*
*     Argument checks; the first offending argument determines INFO.
*
      IF( .NOT.( apleft .OR. aprght ) ) THEN
         info = -1
      ELSE IF( .NOT.( conjq .OR. plainq ) ) THEN
         info = -2
      ELSE IF( m.LT.0 ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( k.LT.0 ) THEN
         info = -5
      ELSE IF( l.LT.0 .OR. l.GT.k ) THEN
         info = -6
      ELSE IF( nb.LT.1 .OR. ( nb.GT.k .AND. k.GT.0 ) ) THEN
         info = -7
      ELSE IF( ldv.LT.max( 1, nrowv ) ) THEN
         info = -9
      ELSE IF( ldt.LT.nb ) THEN
         info = -11
      ELSE IF( lda.LT.ldamin ) THEN
         info = -13
      ELSE IF( ldb.LT.max( 1, m ) ) THEN
         info = -15
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTPMQRT', -info )
         RETURN
      END IF
*
*     Quick return if any of M, N, K is zero (all are nonnegative
*     once the checks above have passed).
*
      IF( min( m, n, k ).EQ.0 )
     $   RETURN
*
*     The column blocks of V and T are visited in increasing order
*     for (SIDE='L', TRANS='C') and (SIDE='R', TRANS='N'), and in
*     decreasing order, starting from the last block, otherwise.
*
      ascend = ( apleft .AND. conjq ) .OR. ( aprght .AND. plainq )
      IF( ascend ) THEN
         jfirst = 1
         jlast = k
         jstep = nb
      ELSE
         jfirst = ( ( k-1 ) / nb )*nb + 1
         jlast = 1
         jstep = -nb
      END IF
*
*     Operator letter handed to CTPRFB.
*
      IF( conjq ) THEN
         opq = 'C'
      ELSE
         opq = 'N'
      END IF
*
      DO jb = jfirst, jlast, jstep
*
*        KB columns in this block; NVB and LTRAP are the size
*        arguments passed to CTPRFB for the matching part of V.
*
         kb = min( nb, k-jb+1 )
         nvb = min( nrowv-l+jb+kb-1, nrowv )
         IF( jb.LT.l ) THEN
            ltrap = nvb - nrowv + l - jb + 1
         ELSE
            ltrap = 0
         END IF
*
         IF( apleft ) THEN
            CALL ctprfb( 'L', opq, 'F', 'C', nvb, n, kb, ltrap,
     $                   v( 1, jb ), ldv, t( 1, jb ), ldt,
     $                   a( jb, 1 ), lda, b, ldb, work, kb )
         ELSE
            CALL ctprfb( 'R', opq, 'F', 'C', m, nvb, kb, ltrap,
     $                   v( 1, jb ), ldv, t( 1, jb ), ldt,
     $                   a( 1, jb ), lda, b, ldb, work, m )
         END IF
      END DO
*
      RETURN
*
*     End of CTPMQRT
*

◆ ctpqrt()

subroutine ctpqrt	(	integer	m,
		integer	n,
		integer	l,
		integer	nb,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldt, * )	t,
		integer	ldt,
		complex, dimension( * )	work,
		integer	info )

CTPQRT

Download CTPQRT + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTPQRT computes a blocked QR factorization of a complex
!>  matrix C, which is composed of a
!> triangular block A and pentagonal block B, using the compact
!> WY representation for Q.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix B. !> M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix B, and the order of the !> triangular matrix A. !> N >= 0. !>
[in]	L	!> L is INTEGER !> The number of rows of the upper trapezoidal part of B. !> MIN(M,N) >= L >= 0. See Further Details. !>
[in]	NB	!> NB is INTEGER !> The block size to be used in the blocked QR. N >= NB >= 1. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the upper triangular N-by-N matrix A. !> On exit, the elements on and above the diagonal of the array !> contain the upper triangular matrix R. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,N) !> On entry, the pentagonal M-by-N matrix B. The first M-L rows !> are rectangular, and the last L rows are upper trapezoidal. !> On exit, B contains the pentagonal matrix V. See Further Details. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,M). !>
[out]	T	!> T is COMPLEX array, dimension (LDT,N) !> The upper triangular block reflectors stored in compact form !> as a sequence of upper triangular blocks. See Further Details. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= NB. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (NB*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The input matrix C is a (N+M)-by-N matrix
!>
!>               C = [ A ]
!>                   [ B ]
!>
!>  where A is an upper triangular N-by-N matrix, and B is M-by-N pentagonal
!>  matrix consisting of a (M-L)-by-N rectangular matrix B1 on top of a L-by-N
!>  upper trapezoidal matrix B2:
!>
!>               B = [ B1 ]  <- (M-L)-by-N rectangular
!>                   [ B2 ]  <-     L-by-N upper trapezoidal.
!>
!>  The upper trapezoidal matrix B2 consists of the first L rows of a
!>  N-by-N upper triangular matrix, where 0 <= L <= MIN(M,N).  If L=0,
!>  B is rectangular M-by-N; if M=L=N, B is upper triangular.
!>
!>  The matrix W stores the elementary reflectors H(i) in the i-th column
!>  below the diagonal (of A) in the (N+M)-by-N input matrix C
!>
!>               C = [ A ]  <- upper triangular N-by-N
!>                   [ B ]  <- M-by-N pentagonal
!>
!>  so that W can be represented as
!>
!>               W = [ I ]  <- identity, N-by-N
!>                   [ V ]  <- M-by-N, same form as B.
!>
!>  Thus, all of information needed for W is contained on exit in B, which
!>  we call V above.  Note that V has the same form as B; that is,
!>
!>               V = [ V1 ] <- (M-L)-by-N rectangular
!>                   [ V2 ] <-     L-by-N upper trapezoidal.
!>
!>  The columns of V represent the vectors which define the H(i)'s.
!>
!>  The number of blocks is B = ceiling(N/NB), where each
!>  block is of order NB except for the last block, which is of order
!>  IB = N - (B-1)*NB.  For each of the B blocks, an upper triangular block
!>  reflector factor is computed: T1, T2, ..., TB.  The NB-by-NB (and IB-by-IB
!>  for the last block) T's are stored in the NB-by-N matrix T as
!>
!>               T = [T1 T2 ... TB].
!>

Definition at line 187 of file ctpqrt.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER INFO, LDA, LDB, LDT, N, M, L, NB
*     ..
*     .. Array Arguments ..
      COMPLEX A( LDA, * ), B( LDB, * ), T( LDT, * ), WORK( * )
*     ..
*
* =====================================================================
*
*     Blocked driver: the columns are processed in panels of at most
*     NB columns.  Each panel is factored by CTPQRT2, and the block
*     reflector it produces is applied to the columns on its right
*     by CTPRFB.
*
*     ..
*     .. Local Scalars ..
      INTEGER    JCOL, KB, KROWS, KTRAP, MNMIN, NTRAIL, IINFO
*     ..
*     .. External Subroutines ..
      EXTERNAL   ctpqrt2, ctprfb, xerbla
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  The tests run from the last argument
*     back to the first, each failure overwriting INFO, so that INFO
*     ends up identifying the lowest-numbered offending argument.
*
      mnmin = min( m, n )
      info = 0
      IF( ldt.LT.nb ) info = -10
      IF( ldb.LT.max( 1, m ) ) info = -8
      IF( lda.LT.max( 1, n ) ) info = -6
      IF( nb.LT.1 .OR. ( n.GT.0 .AND. nb.GT.n ) ) info = -4
      IF( l.LT.0 .OR. ( mnmin.GE.0 .AND. l.GT.mnmin ) ) info = -3
      IF( n.LT.0 ) info = -2
      IF( m.LT.0 ) info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTPQRT', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty problem
*
      IF( m.EQ.0 .OR. n.EQ.0 ) RETURN
*
      DO jcol = 1, n, nb
*
*        KB    = width of this panel (the last one may be narrower)
*        KROWS = number of rows of B passed to the panel routines
*
         kb = min( nb, n-jcol+1 )
         krows = min( m, m-l+jcol+kb-1 )
*
*        KTRAP = trapezoidal row count handed to CTPQRT2 / CTPRFB;
*        it is zero once the panel starts at or beyond column L.
*
         ktrap = 0
         IF( jcol.LT.l ) ktrap = krows-m+l-jcol+1
*
*        Factor the current panel
*
         CALL ctpqrt2( krows, kb, ktrap, a( jcol, jcol ), lda,
     $                 b( 1, jcol ), ldb, t( 1, jcol ), ldt, iinfo )
*
*        Apply H**H from the left to the columns right of the panel
*
         ntrail = n-jcol-kb+1
         IF( ntrail.GT.0 ) THEN
            CALL ctprfb( 'L', 'C', 'F', 'C', krows, ntrail, kb, ktrap,
     $                   b( 1, jcol ), ldb, t( 1, jcol ), ldt,
     $                   a( jcol, jcol+kb ), lda, b( 1, jcol+kb ),
     $                   ldb, work, kb )
         END IF
      END DO
      RETURN
*
*     End of CTPQRT
*

◆ ctpqrt2()

subroutine ctpqrt2	(	integer	m,
		integer	n,
		integer	l,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldt, * )	t,
		integer	ldt,
		integer	info )

CTPQRT2 computes a QR factorization of a real or complex "triangular-pentagonal" matrix, which is composed of a triangular block and a pentagonal block, using the compact WY representation for Q.

Download CTPQRT2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTPQRT2 computes a QR factorization of a complex 
!> matrix C, which is composed of a triangular block A and pentagonal block B,
!> using the compact WY representation for Q.
!>

Parameters

[in]	M	!> M is INTEGER !> The total number of rows of the matrix B. !> M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix B, and the order of !> the triangular matrix A. !> N >= 0. !>
[in]	L	!> L is INTEGER !> The number of rows of the upper trapezoidal part of B. !> MIN(M,N) >= L >= 0. See Further Details. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the upper triangular N-by-N matrix A. !> On exit, the elements on and above the diagonal of the array !> contain the upper triangular matrix R. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,N) !> On entry, the pentagonal M-by-N matrix B. The first M-L rows !> are rectangular, and the last L rows are upper trapezoidal. !> On exit, B contains the pentagonal matrix V. See Further Details. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,M). !>
[out]	T	!> T is COMPLEX array, dimension (LDT,N) !> The N-by-N upper triangular factor T of the block reflector. !> See Further Details. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= max(1,N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The input matrix C is a (N+M)-by-N matrix
!>
!>               C = [ A ]
!>                   [ B ]
!>
!>  where A is an upper triangular N-by-N matrix, and B is M-by-N pentagonal
!>  matrix consisting of a (M-L)-by-N rectangular matrix B1 on top of a L-by-N
!>  upper trapezoidal matrix B2:
!>
!>               B = [ B1 ]  <- (M-L)-by-N rectangular
!>                   [ B2 ]  <-     L-by-N upper trapezoidal.
!>
!>  The upper trapezoidal matrix B2 consists of the first L rows of a
!>  N-by-N upper triangular matrix, where 0 <= L <= MIN(M,N).  If L=0,
!>  B is rectangular M-by-N; if M=L=N, B is upper triangular.
!>
!>  The matrix W stores the elementary reflectors H(i) in the i-th column
!>  below the diagonal (of A) in the (N+M)-by-N input matrix C
!>
!>               C = [ A ]  <- upper triangular N-by-N
!>                   [ B ]  <- M-by-N pentagonal
!>
!>  so that W can be represented as
!>
!>               W = [ I ]  <- identity, N-by-N
!>                   [ V ]  <- M-by-N, same form as B.
!>
!>  Thus, all of the information needed for W is contained on exit in B, which
!>  we call V above.  Note that V has the same form as B; that is,
!>
!>               V = [ V1 ] <- (M-L)-by-N rectangular
!>                   [ V2 ] <-     L-by-N upper trapezoidal.
!>
!>  The columns of V represent the vectors which define the H(i)'s.
!>  The (M+N)-by-(M+N) block reflector H is then given by
!>
!>               H = I - W * T * W**H
!>
!>  where W**H is the conjugate transpose of W and T is the upper triangular
!>  factor of the block reflector.
!>

Definition at line 172 of file ctpqrt2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER   INFO, LDA, LDB, LDT, N, M, L
*     ..
*     .. Array Arguments ..
      COMPLEX   A( LDA, * ), B( LDB, * ), T( LDT, * )
*     ..
*
*  =====================================================================
*
*     Unblocked kernel.  It works in two passes over the columns:
*       pass 1 generates one elementary reflector per column and
*              applies it to the columns on its right;
*       pass 2 assembles the upper triangular factor T column by
*              column from the reflector vectors now stored in B.
*     Between the passes, tau(I) is parked in T(I,1), and during
*     pass 1 the last column T(:,N) is used as scratch space.
*
*     .. Parameters ..
      COMPLEX  ONE, ZERO
      parameter( one = (1.0,0.0), zero = (0.0,0.0) )
*     ..
*     .. Local Scalars ..
      INTEGER   I, J, P, MP, NP
      COMPLEX   ALPHA
*     ..
*     .. External Subroutines ..
      EXTERNAL  clarfg, cgemv, cgerc, ctrmv, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC max, min
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*     (INFO = -k flags the k-th argument of the calling sequence)
*
      info = 0
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( l.LT.0 .OR. l.GT.min(m,n) ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -5
      ELSE IF( ldb.LT.max( 1, m ) ) THEN
         info = -7
      ELSE IF( ldt.LT.max( 1, n ) ) THEN
         info = -9
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTPQRT2', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 .OR. m.EQ.0 ) RETURN
*
*     Pass 1: generate and apply the reflectors
*
      DO i = 1, n
*
*        Generate elementary reflector H(I) to annihilate B(:,I)
*
*        P is the number of rows of column I of B that lie inside the
*        pentagon: the M-L rectangular rows plus MIN(L,I) rows of the
*        trapezoidal part.  tau(I) is returned in T(I,1) for now.
*
         p = m-l+min( l, i )
         CALL clarfg( p+1, a( i, i ), b( 1, i ), 1, t( i, 1 ) )
         IF( i.LT.n ) THEN
*
*           W(1:N-I) := C(I:M,I+1:N)**H * C(I:M,I) [use W = T(:,N)]
*
*           The row-I part of A is loaded (conjugated) first; CGEMV
*           then accumulates the contribution of B on top of it.
*
            DO j = 1, n-i
               t( j, n ) = conjg(a( i, i+j ))
            END DO
            CALL cgemv( 'C', p, n-i, one, b( 1, i+1 ), ldb,
     $                  b( 1, i ), 1, one, t( 1, n ), 1 )
*
*           C(I:M,I+1:N) = C(I:M,I+1:N) + alpha*C(I:M,I)*W(1:N-I)**H
*
*           with alpha = -conjg(tau(I)).  Row I of A is updated by the
*           explicit loop, the rows of B by the rank-one update CGERC.
*
            alpha = -conjg(t( i, 1 ))
            DO j = 1, n-i
               a( i, i+j ) = a( i, i+j ) + alpha*conjg(t( j, n ))
            END DO
            CALL cgerc( p, n-i, alpha, b( 1, i ), 1,
     $           t( 1, n ), 1, b( 1, i+1 ), ldb )
         END IF
      END DO
*
*     Pass 2: build the triangular factor T, one column at a time
*
      DO i = 2, n
*
*        T(1:I-1,I) := C(I:M,1:I-1)**H * (alpha * C(I:M,I))
*
*        Here alpha = -tau(I); T(I,1) still holds tau(I) from pass 1.
*
         alpha = -t( i, 1 )
 
         DO j = 1, i-1
            t( j, i ) = zero
         END DO
*
*        P  = number of leading columns handled as the triangular
*             part of B2,
*        MP = first row of B2 (clamped to M, which matters for L = 0),
*        NP = first column of the rectangular part of B2 (clamped
*             to N).
*
         p = min( i-1, l )
         mp = min( m-l+1, m )
         np = min( p+1, n )
*
*        Triangular part of B2
*
         DO j = 1, p
            t( j, i ) = alpha*b( m-l+j, i )
         END DO
         CALL ctrmv( 'U', 'C', 'N', p, b( mp, 1 ), ldb,
     $               t( 1, i ), 1 )
*
*        Rectangular part of B2
*
         CALL cgemv( 'C', l, i-1-p, alpha, b( mp, np ), ldb,
     $               b( mp, i ), 1, zero, t( np, i ), 1 )
*
*        B1
*
         CALL cgemv( 'C', m-l, i-1, alpha, b, ldb, b( 1, i ), 1,
     $               one, t( 1, i ), 1 )
*
*        T(1:I-1,I) := T(1:I-1,1:I-1) * T(1:I-1,I)
*
         CALL ctrmv( 'U', 'N', 'N', i-1, t, ldt, t( 1, i ), 1 )
*
*        T(I,I) = tau(I)
*
*        Move tau(I) to the diagonal and clear its temporary slot in
*        the first column.
*
         t( i, i ) = t( i, 1 )
         t( i, 1 ) = zero
      END DO
 
*
*     End of CTPQRT2
*

◆ ctprfs()

subroutine ctprfs	(	character	uplo,
		character	trans,
		character	diag,
		integer	n,
		integer	nrhs,
		complex, dimension( * )	ap,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldx, * )	x,
		integer	ldx,
		real, dimension( * )	ferr,
		real, dimension( * )	berr,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CTPRFS

Download CTPRFS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTPRFS provides error bounds and backward error estimates for the
!> solution to a system of linear equations with a triangular packed
!> coefficient matrix.
!>
!> The solution matrix X must be computed by CTPTRS or some other
!> means before entering this routine.  CTPRFS does not do iterative
!> refinement because doing so cannot improve the backward error.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> Specifies the form of the system of equations: !> = 'N': A * X = B (No transpose) !> = 'T': A**T * X = B (Transpose) !> = 'C': A**H * X = B (Conjugate transpose) !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> = 'N': A is non-unit triangular; !> = 'U': A is unit triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrices B and X. NRHS >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The upper or lower triangular matrix A, packed columnwise in !> a linear array. The j-th column of A is stored in the array !> AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !> If DIAG = 'U', the diagonal elements of A are not referenced !> and are assumed to be 1. !>
[in]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> The right hand side matrix B. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[in]	X	!> X is COMPLEX array, dimension (LDX,NRHS) !> The solution matrix X. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the array X. LDX >= max(1,N). !>
[out]	FERR	!> FERR is REAL array, dimension (NRHS) !> The estimated forward error bound for each solution vector !> X(j) (the j-th column of the solution matrix X). !> If XTRUE is the true solution corresponding to X(j), FERR(j) !> is an estimated upper bound for the magnitude of the largest !> element in (X(j) - XTRUE) divided by the magnitude of the !> largest element in X(j). The estimate is as reliable as !> the estimate for RCOND, and is almost always a slight !> overestimate of the true error. !>
[out]	BERR	!> BERR is REAL array, dimension (NRHS) !> The componentwise relative backward error of each solution !> vector X(j) (i.e., the smallest relative change in !> any element of A or B that makes X(j) an exact solution). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 172 of file ctprfs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, TRANS, UPLO
      INTEGER            INFO, LDB, LDX, N, NRHS
*     ..
*     .. Array Arguments ..
      REAL               BERR( * ), FERR( * ), RWORK( * )
      COMPLEX            AP( * ), B( LDB, * ), WORK( * ), X( LDX, * )
*     ..
*
*  =====================================================================
*
*     For each right hand side J the routine
*       1. forms the residual in WORK(1:N),
*       2. accumulates abs(op(A))*abs(X) + abs(B) in RWORK(1:N),
*       3. sets BERR(J) from the componentwise ratio of the two,
*       4. estimates a weighted norm of inv(op(A)) with CLACN2 and
*          turns it into FERR(J).
*
*     .. Parameters ..
      REAL               ZERO
      parameter( zero = 0.0e+0 )
      COMPLEX            ONE
      parameter( one = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            NOTRAN, NOUNIT, UPPER
      CHARACTER          TRANSN, TRANST
      INTEGER            I, J, K, KASE, KC, NZ
      REAL               EPS, LSTRES, S, SAFE1, SAFE2, SAFMIN, XK
      COMPLEX            ZDUM
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           caxpy, ccopy, clacn2, ctpmv, ctpsv, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, real
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SLAMCH
      EXTERNAL           lsame, slamch
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
*     CABS1(z) = |Re z| + |Im z|, used below in place of the modulus
      cabs1( zdum ) = abs( real( zdum ) ) + abs( aimag( zdum ) )
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      upper = lsame( uplo, 'U' )
      notran = lsame( trans, 'N' )
      nounit = lsame( diag, 'N' )
*
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'T' ) .AND. .NOT.
     $         lsame( trans, 'C' ) ) THEN
         info = -2
      ELSE IF( .NOT.nounit .AND. .NOT.lsame( diag, 'U' ) ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( nrhs.LT.0 ) THEN
         info = -5
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -8
      ELSE IF( ldx.LT.max( 1, n ) ) THEN
         info = -10
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTPRFS', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
*     Both error arrays are zeroed for every right hand side (the
*     loop is empty when NRHS = 0).
*
      IF( n.EQ.0 .OR. nrhs.EQ.0 ) THEN
         DO 10 j = 1, nrhs
            ferr( j ) = zero
            berr( j ) = zero
   10    CONTINUE
         RETURN
      END IF
*
*     TRANSN / TRANST select the two triangular solves used by the
*     norm estimator further down.  Note that both TRANS = 'T' and
*     TRANS = 'C' map to TRANSN = 'C', TRANST = 'N'.
*
      IF( notran ) THEN
         transn = 'N'
         transt = 'C'
      ELSE
         transn = 'C'
         transt = 'N'
      END IF
*
*     NZ = maximum number of nonzero elements in each row of A, plus 1
*
      nz = n + 1
      eps = slamch( 'Epsilon' )
      safmin = slamch( 'Safe minimum' )
      safe1 = nz*safmin
      safe2 = safe1 / eps
*
*     Do for each right hand side
*
      DO 250 j = 1, nrhs
*
*        Compute residual R = B - op(A) * X,
*        where op(A) = A, A**T, or A**H, depending on TRANS.
*
*        With the usual BLAS meaning of CAXPY (y := alpha*x + y) the
*        three calls leave op(A)*X - B, i.e. -R, in WORK(1:N).  Only
*        magnitudes of WORK are used below, so the sign is immaterial.
*
         CALL ccopy( n, x( 1, j ), 1, work, 1 )
         CALL ctpmv( uplo, trans, diag, n, ap, work, 1 )
         CALL caxpy( n, -one, b( 1, j ), 1, work, 1 )
*
*        Compute componentwise relative backward error from formula
*
*        max(i) ( abs(R(i)) / ( abs(op(A))*abs(X) + abs(B) )(i) )
*
*        where abs(Z) is the componentwise absolute value of the matrix
*        or vector Z.  If the i-th component of the denominator is less
*        than SAFE2, then SAFE1 is added to the i-th components of the
*        numerator and denominator before dividing.
*
*        RWORK starts out as abs(B(:,J)); the branches below add
*        abs(op(A))*abs(X(:,J)) to it.
*
         DO 20 i = 1, n
            rwork( i ) = cabs1( b( i, j ) )
   20    CONTINUE
*
*        In every branch KC is the index in AP of the first stored
*        element of column K.  For unit triangular A the diagonal
*        is not read from AP; its contribution is added as abs(X(K)).
*
         IF( notran ) THEN
*
*           Compute abs(A)*abs(X) + abs(B).
*
            IF( upper ) THEN
               kc = 1
               IF( nounit ) THEN
                  DO 40 k = 1, n
                     xk = cabs1( x( k, j ) )
                     DO 30 i = 1, k
                        rwork( i ) = rwork( i ) +
     $                               cabs1( ap( kc+i-1 ) )*xk
   30                CONTINUE
                     kc = kc + k
   40             CONTINUE
               ELSE
                  DO 60 k = 1, n
                     xk = cabs1( x( k, j ) )
                     DO 50 i = 1, k - 1
                        rwork( i ) = rwork( i ) +
     $                               cabs1( ap( kc+i-1 ) )*xk
   50                CONTINUE
                     rwork( k ) = rwork( k ) + xk
                     kc = kc + k
   60             CONTINUE
               END IF
            ELSE
               kc = 1
               IF( nounit ) THEN
                  DO 80 k = 1, n
                     xk = cabs1( x( k, j ) )
                     DO 70 i = k, n
                        rwork( i ) = rwork( i ) +
     $                               cabs1( ap( kc+i-k ) )*xk
   70                CONTINUE
                     kc = kc + n - k + 1
   80             CONTINUE
               ELSE
                  DO 100 k = 1, n
                     xk = cabs1( x( k, j ) )
                     DO 90 i = k + 1, n
                        rwork( i ) = rwork( i ) +
     $                               cabs1( ap( kc+i-k ) )*xk
   90                CONTINUE
                     rwork( k ) = rwork( k ) + xk
                     kc = kc + n - k + 1
  100             CONTINUE
               END IF
            END IF
         ELSE
*
*           Compute abs(A**H)*abs(X) + abs(B).
*
*           Here column K of A acts as row K of op(A), so each
*           column is reduced to the single sum S added to RWORK(K).
*
            IF( upper ) THEN
               kc = 1
               IF( nounit ) THEN
                  DO 120 k = 1, n
                     s = zero
                     DO 110 i = 1, k
                        s = s + cabs1( ap( kc+i-1 ) )*cabs1( x( i, j ) )
  110                CONTINUE
                     rwork( k ) = rwork( k ) + s
                     kc = kc + k
  120             CONTINUE
               ELSE
                  DO 140 k = 1, n
                     s = cabs1( x( k, j ) )
                     DO 130 i = 1, k - 1
                        s = s + cabs1( ap( kc+i-1 ) )*cabs1( x( i, j ) )
  130                CONTINUE
                     rwork( k ) = rwork( k ) + s
                     kc = kc + k
  140             CONTINUE
               END IF
            ELSE
               kc = 1
               IF( nounit ) THEN
                  DO 160 k = 1, n
                     s = zero
                     DO 150 i = k, n
                        s = s + cabs1( ap( kc+i-k ) )*cabs1( x( i, j ) )
  150                CONTINUE
                     rwork( k ) = rwork( k ) + s
                     kc = kc + n - k + 1
  160             CONTINUE
               ELSE
                  DO 180 k = 1, n
                     s = cabs1( x( k, j ) )
                     DO 170 i = k + 1, n
                        s = s + cabs1( ap( kc+i-k ) )*cabs1( x( i, j ) )
  170                CONTINUE
                     rwork( k ) = rwork( k ) + s
                     kc = kc + n - k + 1
  180             CONTINUE
               END IF
            END IF
         END IF
*
*        BERR(J) = largest componentwise ratio, with the SAFE1 guard
*        applied where the denominator is not above SAFE2.
*
         s = zero
         DO 190 i = 1, n
            IF( rwork( i ).GT.safe2 ) THEN
               s = max( s, cabs1( work( i ) ) / rwork( i ) )
            ELSE
               s = max( s, ( cabs1( work( i ) )+safe1 ) /
     $             ( rwork( i )+safe1 ) )
            END IF
  190    CONTINUE
         berr( j ) = s
*
*        Bound error from formula
*
*        norm(X - XTRUE) / norm(X) .le. FERR =
*        norm( abs(inv(op(A)))*
*           ( abs(R) + NZ*EPS*( abs(op(A))*abs(X)+abs(B) ))) / norm(X)
*
*        where
*          norm(Z) is the magnitude of the largest component of Z
*          inv(op(A)) is the inverse of op(A)
*          abs(Z) is the componentwise absolute value of the matrix or
*             vector Z
*          NZ is the maximum number of nonzeros in any row of A, plus 1
*          EPS is machine epsilon
*
*        The i-th component of abs(R)+NZ*EPS*(abs(op(A))*abs(X)+abs(B))
*        is incremented by SAFE1 if the i-th component of
*        abs(op(A))*abs(X) + abs(B) is less than SAFE2.
*
*        Use CLACN2 to estimate the infinity-norm of the matrix
*           inv(op(A)) * diag(W),
*        where W = abs(R) + NZ*EPS*( abs(op(A))*abs(X)+abs(B) )
*
*        RWORK is overwritten with the weight vector W.
*
         DO 200 i = 1, n
            IF( rwork( i ).GT.safe2 ) THEN
               rwork( i ) = cabs1( work( i ) ) + nz*eps*rwork( i )
            ELSE
               rwork( i ) = cabs1( work( i ) ) + nz*eps*rwork( i ) +
     $                      safe1
            END IF
  200    CONTINUE
*
*        Reverse-communication loop: CLACN2 is called repeatedly
*        until it returns KASE = 0.  On each return with KASE.NE.0
*        the vector in WORK(1:N) is transformed as requested and
*        control goes back to label 210.  WORK(N+1:2N) is handed to
*        CLACN2 as its own work vector, and the estimate is returned
*        in FERR(J).
*
         kase = 0
  210    CONTINUE
         CALL clacn2( n, work( n+1 ), work, ferr( j ), kase, isave )
         IF( kase.NE.0 ) THEN
            IF( kase.EQ.1 ) THEN
*
*              Multiply by diag(W)*inv(op(A)**H).
*
               CALL ctpsv( uplo, transt, diag, n, ap, work, 1 )
               DO 220 i = 1, n
                  work( i ) = rwork( i )*work( i )
  220          CONTINUE
            ELSE
*
*              Multiply by inv(op(A))*diag(W).
*
               DO 230 i = 1, n
                  work( i ) = rwork( i )*work( i )
  230          CONTINUE
               CALL ctpsv( uplo, transn, diag, n, ap, work, 1 )
            END IF
            GO TO 210
         END IF
*
*        Normalize error.
*
*        FERR(J) is divided by the largest CABS1 magnitude in X(:,J);
*        it is left unscaled when that column is identically zero.
*
         lstres = zero
         DO 240 i = 1, n
            lstres = max( lstres, cabs1( x( i, j ) ) )
  240    CONTINUE
         IF( lstres.NE.zero )
     $      ferr( j ) = ferr( j ) / lstres
*
  250 CONTINUE
*
      RETURN
*
*     End of CTPRFS
*

◆ ctptri()

subroutine ctptri	(	character	uplo,
		character	diag,
		integer	n,
		complex, dimension( * )	ap,
		integer	info )

CTPTRI

Download CTPTRI + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTPTRI computes the inverse of a complex upper or lower triangular
!> matrix A stored in packed format.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> = 'N': A is non-unit triangular; !> = 'U': A is unit triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> On entry, the upper or lower triangular matrix A, stored !> columnwise in a linear array. The j-th column of A is stored !> in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !> See below for further details. !> On exit, the (triangular) inverse of the original matrix, in !> the same packed storage format. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, A(i,i) is exactly zero. The triangular !> matrix is singular and its inverse can not be computed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  A triangular matrix A can be transferred to packed storage using one
!>  of the following program segments:
!>
!>  UPLO = 'U':                      UPLO = 'L':
!>
!>        JC = 1                           JC = 1
!>        DO 2 J = 1, N                    DO 2 J = 1, N
!>           DO 1 I = 1, J                    DO 1 I = J, N
!>              AP(JC+I-1) = A(I,J)              AP(JC+I-J) = A(I,J)
!>      1    CONTINUE                    1    CONTINUE
!>           JC = JC + J                      JC = JC + N - J + 1
!>      2 CONTINUE                       2 CONTINUE
!>

Definition at line 116 of file ctptri.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, UPLO
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      COMPLEX            AP( * )
*     ..
*
*  =====================================================================
*
*     In-place inversion of a packed triangular matrix.  Throughout,
*     KD is the index in AP of the diagonal element of the column
*     currently being processed.
*
*     .. Parameters ..
      COMPLEX            ONE, ZERO
      parameter( one = ( 1.0e+0, 0.0e+0 ),
     $                   zero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            NONUNT, UPTRI
      INTEGER            JCOL, KD
      COMPLEX            SCL
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cscal, ctpmv, xerbla
*     ..
*     .. Executable Statements ..
*
*     Argument checks
*
      info = 0
      uptri = lsame( uplo, 'U' )
      nonunt = lsame( diag, 'N' )
      IF( .NOT.( uptri .OR. lsame( uplo, 'L' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( nonunt .OR. lsame( diag, 'U' ) ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTPTRI', -info )
         RETURN
      END IF
*
*     For a non-unit matrix, scan the diagonal first.  An exactly
*     zero entry means the matrix is singular: return its index in
*     INFO without touching AP.
*
      IF( nonunt ) THEN
         kd = 1
         DO 10 jcol = 1, n
            IF( ap( kd ).EQ.zero ) THEN
               info = jcol
               RETURN
            END IF
*
*           Step from diagonal entry JCOL to diagonal entry JCOL+1
*
            IF( uptri ) THEN
               kd = kd + jcol + 1
            ELSE
               kd = kd + n - jcol + 1
            END IF
   10    CONTINUE
      END IF
*
      IF( uptri ) THEN
*
*        Upper triangular: columns are processed left to right.
*        Column JCOL occupies AP(KD-JCOL+1:KD).
*
         kd = 0
         DO 30 jcol = 1, n
            kd = kd + jcol
            scl = -one
            IF( nonunt ) THEN
               ap( kd ) = one / ap( kd )
               scl = -ap( kd )
            END IF
*
*           Form elements 1:JCOL-1 of column JCOL of the inverse.
*
            CALL ctpmv( 'Upper', 'No transpose', diag, jcol-1, ap,
     $                  ap( kd-jcol+1 ), 1 )
            CALL cscal( jcol-1, scl, ap( kd-jcol+1 ), 1 )
   30    CONTINUE
*
      ELSE
*
*        Lower triangular: columns are processed right to left.
*        Column JCOL occupies AP(KD:KD+N-JCOL), so the diagonal
*        entry of column JCOL+1 sits at AP(KD+N-JCOL+1).
*
         kd = n*( n+1 ) / 2
         DO 40 jcol = n, 1, -1
            scl = -one
            IF( nonunt ) THEN
               ap( kd ) = one / ap( kd )
               scl = -ap( kd )
            END IF
            IF( jcol.LT.n ) THEN
*
*              Form elements JCOL+1:N of column JCOL of the inverse.
*
               CALL ctpmv( 'Lower', 'No transpose', diag, n-jcol,
     $                     ap( kd+n-jcol+1 ), ap( kd+1 ), 1 )
               CALL cscal( n-jcol, scl, ap( kd+1 ), 1 )
            END IF
*
*           Move to the diagonal entry of column JCOL-1
*
            kd = kd - n + jcol - 2
   40    CONTINUE
      END IF
*
      RETURN
*
*     End of CTPTRI
*

◆ ctptrs()

subroutine ctptrs	(	character	uplo,
		character	trans,
		character	diag,
		integer	n,
		integer	nrhs,
		complex, dimension( * )	ap,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		integer	info )

CTPTRS

Download CTPTRS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTPTRS solves a triangular system of the form
!>
!>    A * X = B,  A**T * X = B,  or  A**H * X = B,
!>
!> where A is a triangular matrix of order N stored in packed format,
!> and B is an N-by-NRHS matrix.  A check is made to verify that A is
!> nonsingular.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> Specifies the form of the system of equations: !> = 'N': A * X = B (No transpose) !> = 'T': A**T * X = B (Transpose) !> = 'C': A**H * X = B (Conjugate transpose) !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> = 'N': A is non-unit triangular; !> = 'U': A is unit triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrix B. NRHS >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The upper or lower triangular matrix A, packed columnwise in !> a linear array. The j-th column of A is stored in the array !> AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> On entry, the right hand side matrix B. !> On exit, if INFO = 0, the solution matrix X. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, the i-th diagonal element of A is zero, !> indicating that the matrix is singular and the !> solutions X have not been computed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 129 of file ctptrs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, TRANS, UPLO
      INTEGER            INFO, LDB, N, NRHS
*     ..
*     .. Array Arguments ..
      COMPLEX            AP( * ), B( LDB, * )
*     ..
*
*  =====================================================================
*
*     The routine validates its arguments, rejects a non-unit matrix
*     with an exactly zero diagonal entry, and otherwise solves for
*     each column of B in turn with CTPSV.
*
*     .. Parameters ..
      COMPLEX            ZERO
      parameter( zero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            NONUNT, UPTRI
      INTEGER            ICOL, IRHS, KD
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           ctpsv, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  The tests run from the last argument
*     back to the first, each failure overwriting INFO, so that INFO
*     ends up identifying the lowest-numbered offending argument.
*
      uptri = lsame( uplo, 'U' )
      nonunt = lsame( diag, 'N' )
      info = 0
      IF( ldb.LT.max( 1, n ) ) info = -8
      IF( nrhs.LT.0 ) info = -5
      IF( n.LT.0 ) info = -4
      IF( .NOT.( nonunt .OR. lsame( diag, 'U' ) ) ) info = -3
      IF( .NOT.( lsame( trans, 'N' ) .OR. lsame( trans, 'T' ) .OR.
     $    lsame( trans, 'C' ) ) ) info = -2
      IF( .NOT.( uptri .OR. lsame( uplo, 'L' ) ) ) info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTPTRS', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty matrix
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Singularity check (non-unit diagonal only).  KD walks along the
*     packed diagonal; the index of the first exactly zero entry is
*     returned in INFO and B is left untouched.
*
      IF( nonunt ) THEN
         kd = 1
         DO 10 icol = 1, n
            IF( ap( kd ).EQ.zero ) THEN
               info = icol
               RETURN
            END IF
            IF( uptri ) THEN
               kd = kd + icol + 1
            ELSE
               kd = kd + n - icol + 1
            END IF
   10    CONTINUE
      END IF
      info = 0
*
*     Solve  A * x = b,  A**T * x = b,  or  A**H * x = b,
*     one right hand side at a time; column IRHS of B is overwritten.
*
      DO irhs = 1, nrhs
         CALL ctpsv( uplo, trans, diag, n, ap, b( 1, irhs ), 1 )
      END DO
*
      RETURN
*
*     End of CTPTRS
*

◆ ctpttf()

subroutine ctpttf	(	character	transr,
		character	uplo,
		integer	n,
		complex, dimension( 0: * )	ap,
		complex, dimension( 0: * )	arf,
		integer	info )

CTPTTF copies a triangular matrix from the standard packed format (TP) to the rectangular full packed format (TF).

Download CTPTTF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTPTTF copies a triangular matrix A from standard packed format (TP)
!> to rectangular full packed format (TF).
!>

Parameters

[in]	TRANSR	!> TRANSR is CHARACTER*1 !> = 'N': ARF in Normal format is wanted; !> = 'C': ARF in Conjugate-transpose format is wanted. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension ( N(N+1)/2 ), !> On entry, the upper or lower triangular matrix A, packed !> columnwise in a linear array. The j-th column of A is stored !> in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !>
[out]	ARF	!> ARF is COMPLEX array, dimension ( N*(N+1)/2 ), !> On exit, the upper or lower triangular matrix A stored in !> RFP format. For a further discussion see Notes below. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  We first consider Standard Packed Format when N is even.
!>  We give an example where N = 6.
!>
!>      AP is Upper             AP is Lower
!>
!>   00 01 02 03 04 05       00
!>      11 12 13 14 15       10 11
!>         22 23 24 25       20 21 22
!>            33 34 35       30 31 32 33
!>               44 45       40 41 42 43 44
!>                  55       50 51 52 53 54 55
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:5,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(4:6,0:2) consists of
!>  conjugate-transpose of the first three columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(1:6,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:2,0:2) consists of
!>  conjugate-transpose of the last three columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N even and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                -- -- --
!>        03 04 05                33 43 53
!>                                   -- --
!>        13 14 15                00 44 54
!>                                      --
!>        23 24 25                10 11 55
!>
!>        33 34 35                20 21 22
!>        --
!>        00 44 45                30 31 32
!>        -- --
!>        01 11 55                40 41 42
!>        -- -- --
!>        02 12 22                50 51 52
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- -- --                -- -- -- -- -- --
!>     03 13 23 33 00 01 02    33 00 10 20 30 40 50
!>     -- -- -- -- --                -- -- -- -- --
!>     04 14 24 34 44 11 12    43 44 11 21 31 41 51
!>     -- -- -- -- -- --                -- -- -- --
!>     05 15 25 35 45 55 22    53 54 55 22 32 42 52
!>
!>
!>  We next  consider Standard Packed Format when N is odd.
!>  We give an example where N = 5.
!>
!>     AP is Upper                 AP is Lower
!>
!>   00 01 02 03 04              00
!>      11 12 13 14              10 11
!>         22 23 24              20 21 22
!>            33 34              30 31 32 33
!>               44              40 41 42 43 44
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:4,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(3:4,0:1) consists of
!>  conjugate-transpose of the first two   columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(0:4,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:1,1:2) consists of
!>  conjugate-transpose of the last two   columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N odd  and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                   -- --
!>        02 03 04                00 33 43
!>                                      --
!>        12 13 14                10 11 44
!>
!>        22 23 24                20 21 22
!>        --
!>        00 33 34                30 31 32
!>        -- --
!>        01 11 44                40 41 42
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- --                   -- -- -- -- --
!>     02 12 22 00 01             00 10 20 30 40
!>     -- -- -- --                   -- -- -- --
!>     03 13 23 33 11             33 11 21 31 41
!>     -- -- -- -- --                   -- -- --
!>     04 14 24 34 44             43 44 22 32 42
!>

Definition at line 206 of file ctpttf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Copies the triangular matrix held in AP (standard packed format)
*  into ARF (rectangular full packed format).  Both arrays are indexed
*  from zero.
*
*  TRANSR  'N' stores ARF in normal layout, 'C' in conjugate-transpose
*          layout.
*  UPLO    'L' if AP holds the lower triangle, 'U' for the upper one.
*  N       order of the matrix; N = 0 returns immediately.
*  AP      input, read sequentially from AP(0).
*  ARF     output.
*  INFO    0 on success; -i if argument i is illegal, in which case
*          XERBLA is called before returning.
*
*     .. Scalar Arguments ..
      CHARACTER          TRANSR, UPLO
      INTEGER            INFO, N
*     ..
*     .. Array Arguments ..
      COMPLEX            AP( 0: * ), ARF( 0: * )
*
*  =====================================================================
*
*     .. Parameters ..
*     ..
*     .. Local Scalars ..
      LOGICAL            LOWER, NISODD, NORMALTRANSR
      INTEGER            N1, N2, K
      INTEGER            I, J, IJ
      INTEGER            IJP, JP, LDA, JS
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, mod
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      normaltransr = lsame( transr, 'N' )
      lower = lsame( uplo, 'L' )
      IF( .NOT.normaltransr .AND. .NOT.lsame( transr, 'C' ) ) THEN
         info = -1
      ELSE IF( .NOT.lower .AND. .NOT.lsame( uplo, 'U' ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTPTTF', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     A 1-by-1 matrix is a single element; only the conjugation
*     depends on TRANSR.
*
      IF( n.EQ.1 ) THEN
         IF( normaltransr ) THEN
            arf( 0 ) = ap( 0 )
         ELSE
            arf( 0 ) = conjg( ap( 0 ) )
         END IF
         RETURN
      END IF
*
*     Set N1 and N2 depending on LOWER
*
      IF( lower ) THEN
         n2 = n / 2
         n1 = n - n2
      ELSE
         n1 = n / 2
         n2 = n - n1
      END IF
*
*     If N is odd, set NISODD = .TRUE.
*     If N is even, set K = N/2 and NISODD = .FALSE.
*     (K is only referenced in the even-N branches below.)
*
*     set lda of ARF^C; ARF^C is (0:(N+1)/2-1,0:N-noe)
*     where noe = 0 if n is even, noe = 1 if n is odd
*
      IF( mod( n, 2 ).EQ.0 ) THEN
         k = n / 2
         nisodd = .false.
         lda = n + 1
      ELSE
         nisodd = .true.
         lda = n
      END IF
*
*     ARF^C has lda rows and n+1-noe cols
*
      IF( .NOT.normaltransr )
     $   lda = ( n+1 ) / 2
*
*     start execution: there are eight cases
*
*     In every case IJP walks AP sequentially from 0, while IJ is the
*     linear (zero-based) position written in ARF.
*
      IF( nisodd ) THEN
*
*        N is odd
*
         IF( normaltransr ) THEN
*
*           N is odd and TRANSR = 'N'
*
            IF( lower ) THEN
*
*             SRPA for LOWER, NORMAL and N is odd ( a(0:n-1,0:n1-1) )
*             T1 -> a(0,0), T2 -> a(0,1), S -> a(n1,0)
*             T1 -> a(0), T2 -> a(n), S -> a(n1); lda = n
*
               ijp = 0
               jp = 0
               DO j = 0, n2
                  DO i = j, n - 1
                     ij = i + jp
                     arf( ij ) = ap( ijp )
                     ijp = ijp + 1
                  END DO
                  jp = jp + lda
               END DO
               DO i = 0, n2 - 1
                  DO j = 1 + i, n2
                     ij = i + j*lda
                     arf( ij ) = conjg( ap( ijp ) )
                     ijp = ijp + 1
                  END DO
               END DO
*
            ELSE
*
*             SRPA for UPPER, NORMAL and N is odd ( a(0:n-1,0:n2-1) )
*             T1 -> a(n1+1,0), T2 -> a(n1,0), S -> a(0,0)
*             T1 -> a(n2), T2 -> a(n1), S -> a(0)
*
               ijp = 0
               DO j = 0, n1 - 1
                  ij = n2 + j
                  DO i = 0, j
                     arf( ij ) = conjg( ap( ijp ) )
                     ijp = ijp + 1
                     ij = ij + lda
                  END DO
               END DO
               js = 0
               DO j = n1, n - 1
                  DO ij = js, js + j
                     arf( ij ) = ap( ijp )
                     ijp = ijp + 1
                  END DO
                  js = js + lda
               END DO
*
            END IF
*
         ELSE
*
*           N is odd and TRANSR = 'C'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, TRANSPOSE and N is odd
*              T1 -> A(0,0) , T2 -> A(1,0) , S -> A(0,n1)
*              T1 -> a(0+0) , T2 -> a(1+0) , S -> a(0+n1*n1); lda=n1
*
               ijp = 0
               DO i = 0, n2
                  DO ij = i*( lda+1 ), n*lda - 1, lda
                     arf( ij ) = conjg( ap( ijp ) )
                     ijp = ijp + 1
                  END DO
               END DO
               js = 1
               DO j = 0, n2 - 1
                  DO ij = js, js + n2 - j - 1
                     arf( ij ) = ap( ijp )
                     ijp = ijp + 1
                  END DO
                  js = js + lda + 1
               END DO
*
            ELSE
*
*              SRPA for UPPER, TRANSPOSE and N is odd
*              T1 -> A(0,n1+1), T2 -> A(0,n1), S -> A(0,0)
*              T1 -> a(n2*n2), T2 -> a(n1*n2), S -> a(0); lda = n2
*
               ijp = 0
               js = n2*lda
               DO j = 0, n1 - 1
                  DO ij = js, js + j
                     arf( ij ) = ap( ijp )
                     ijp = ijp + 1
                  END DO
                  js = js + lda
               END DO
               DO i = 0, n1
                  DO ij = i, i + ( n1+i )*lda, lda
                     arf( ij ) = conjg( ap( ijp ) )
                     ijp = ijp + 1
                  END DO
               END DO
*
            END IF
*
         END IF
*
      ELSE
*
*        N is even
*
         IF( normaltransr ) THEN
*
*           N is even and TRANSR = 'N'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, NORMAL, and N is even ( a(0:n,0:k-1) )
*              T1 -> a(1,0), T2 -> a(0,0), S -> a(k+1,0)
*              T1 -> a(1), T2 -> a(0), S -> a(k+1)
*
               ijp = 0
               jp = 0
               DO j = 0, k - 1
                  DO i = j, n - 1
                     ij = 1 + i + jp
                     arf( ij ) = ap( ijp )
                     ijp = ijp + 1
                  END DO
                  jp = jp + lda
               END DO
               DO i = 0, k - 1
                  DO j = i, k - 1
                     ij = i + j*lda
                     arf( ij ) = conjg( ap( ijp ) )
                     ijp = ijp + 1
                  END DO
               END DO
*
            ELSE
*
*              SRPA for UPPER, NORMAL, and N is even ( a(0:n,0:k-1) )
*              T1 -> a(k+1,0) ,  T2 -> a(k,0),   S -> a(0,0)
*              T1 -> a(k+1), T2 -> a(k), S -> a(0)
*
               ijp = 0
               DO j = 0, k - 1
                  ij = k + 1 + j
                  DO i = 0, j
                     arf( ij ) = conjg( ap( ijp ) )
                     ijp = ijp + 1
                     ij = ij + lda
                  END DO
               END DO
               js = 0
               DO j = k, n - 1
                  DO ij = js, js + j
                     arf( ij ) = ap( ijp )
                     ijp = ijp + 1
                  END DO
                  js = js + lda
               END DO
*
            END IF
*
         ELSE
*
*           N is even and TRANSR = 'C'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, TRANSPOSE and N is even (see paper)
*              T1 -> B(0,1), T2 -> B(0,0), S -> B(0,k+1)
*              T1 -> a(0+k), T2 -> a(0+0), S -> a(0+k*(k+1)); lda=k
*
               ijp = 0
               DO i = 0, k - 1
                  DO ij = i + ( i+1 )*lda, ( n+1 )*lda - 1, lda
                     arf( ij ) = conjg( ap( ijp ) )
                     ijp = ijp + 1
                  END DO
               END DO
               js = 0
               DO j = 0, k - 1
                  DO ij = js, js + k - j - 1
                     arf( ij ) = ap( ijp )
                     ijp = ijp + 1
                  END DO
                  js = js + lda + 1
               END DO
*
            ELSE
*
*              SRPA for UPPER, TRANSPOSE and N is even (see paper)
*              T1 -> B(0,k+1),     T2 -> B(0,k),   S -> B(0,0)
*              T1 -> a(0+k*(k+1)), T2 -> a(0+k*k), S -> a(0+0)); lda=k
*
               ijp = 0
               js = ( k+1 )*lda
               DO j = 0, k - 1
                  DO ij = js, js + j
                     arf( ij ) = ap( ijp )
                     ijp = ijp + 1
                  END DO
                  js = js + lda
               END DO
               DO i = 0, k - 1
                  DO ij = i, i + ( k+i )*lda, lda
                     arf( ij ) = conjg( ap( ijp ) )
                     ijp = ijp + 1
                  END DO
               END DO
*
            END IF
*
         END IF
*
      END IF
*
      RETURN
*
*     End of CTPTTF
*

◆ ctpttr()

subroutine ctpttr	(	character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		complex, dimension( lda, * )	a,
		integer	lda,
		integer	info )

CTPTTR copies a triangular matrix from the standard packed format (TP) to the standard full format (TR).

Download CTPTTR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTPTTR copies a triangular matrix A from standard packed format (TP)
!> to standard full format (TR).
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular. !> = 'L': A is lower triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension ( N(N+1)/2 ), !> On entry, the upper or lower triangular matrix A, packed !> columnwise in a linear array. The j-th column of A is stored !> in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !>
[out]	A	!> A is COMPLEX array, dimension ( LDA, N ) !> On exit, the triangular matrix A. If UPLO = 'U', the leading !> N-by-N upper triangular part of A contains the upper !> triangular part of the matrix A, and the strictly lower !> triangular part of A is not referenced. If UPLO = 'L', the !> leading N-by-N lower triangular part of A contains the lower !> triangular part of the matrix A, and the strictly upper !> triangular part of A is not referenced. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 103 of file ctpttr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Unpacks the triangular matrix stored column by column in AP into
*  the UPLO triangle of the two-dimensional array A.  Only that
*  triangle (diagonal included) is written; the opposite strict
*  triangle of A is left untouched.
*
*  UPLO    'L' for a lower triangular matrix, 'U' for upper.
*  N       order of the matrix; for N = 0 nothing is copied.
*  AP      input packed array, read sequentially from AP(1).
*  A, LDA  output array and its leading dimension (>= max(1,N)).
*  INFO    0 on success; -i if argument i is illegal, in which case
*          XERBLA is called before returning.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, N, LDA
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), AP( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     ..
*     .. Local Scalars ..
      LOGICAL            LOWER
      INTEGER            I, J, K
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      lower = lsame( uplo, 'L' )
      IF( .NOT.lower .AND. .NOT.lsame( uplo, 'U' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -5
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTPTTR', -info )
         RETURN
      END IF
*
*     K is the running position in AP.  Columns are visited left to
*     right, and within a column the rows of the stored triangle are
*     visited top to bottom, so AP is consumed strictly in order.
*
      k = 0
      IF( lower ) THEN
*
*        Column J of the lower triangle holds rows J..N.
*
         DO j = 1, n
            DO i = j, n
               k = k + 1
               a( i, j ) = ap( k )
            END DO
         END DO
      ELSE
*
*        Column J of the upper triangle holds rows 1..J.
*
         DO j = 1, n
            DO i = 1, j
               k = k + 1
               a( i, j ) = ap( k )
            END DO
         END DO
      END IF
*
*
      RETURN
*
*     End of CTPTTR
*

◆ ctrcon()

subroutine ctrcon	(	character	norm,
		character	uplo,
		character	diag,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		real	rcond,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CTRCON

Download CTRCON + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTRCON estimates the reciprocal of the condition number of a
!> triangular matrix A, in either the 1-norm or the infinity-norm.
!>
!> The norm of A is computed and an estimate is obtained for
!> norm(inv(A)), then the reciprocal of the condition number is
!> computed as
!>    RCOND = 1 / ( norm(A) * norm(inv(A)) ).
!>

Parameters

[in]	NORM	!> NORM is CHARACTER*1 !> Specifies whether the 1-norm condition number or the !> infinity-norm condition number is required: !> = '1' or 'O': 1-norm; !> = 'I': Infinity-norm. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> = 'N': A is non-unit triangular; !> = 'U': A is unit triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	A	!> A is COMPLEX array, dimension (LDA,N) !> The triangular matrix A. If UPLO = 'U', the leading N-by-N !> upper triangular part of the array A contains the upper !> triangular matrix, and the strictly lower triangular part of !> A is not referenced. If UPLO = 'L', the leading N-by-N lower !> triangular part of the array A contains the lower triangular !> matrix, and the strictly upper triangular part of A is not !> referenced. If DIAG = 'U', the diagonal elements of A are !> also not referenced and are assumed to be 1. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	RCOND	!> RCOND is REAL !> The reciprocal of the condition number of the matrix A, !> computed as RCOND = 1/(norm(A) * norm(inv(A))). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 135 of file ctrcon.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Estimates RCOND = 1 / ( norm(A) * norm(inv(A)) ) for the triangular
*  matrix A, in the 1-norm (NORM = '1' or 'O') or the infinity-norm
*  (NORM = 'I').  RCOND is 1 when N = 0 and is left at 0 when norm(A)
*  is not positive, when the inverse-norm estimate is 0, or when the
*  solve scaling cannot be undone safely.  INFO is 0 on success and
*  -i when argument i is illegal (XERBLA is called in that case).
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, NORM, UPLO
      INTEGER            INFO, LDA, N
      REAL               RCOND
*     ..
*     .. Array Arguments ..
      REAL               RWORK( * )
      COMPLEX            A( LDA, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, ZERO
      parameter( one = 1.0e+0, zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            NONUNT, USEONE, UPTRI
      CHARACTER          NRMFLG
      INTEGER            IMAX, KASE, KFWD
      REAL               AINVNM, ANORM, SCALE, SMLNUM, WMAX
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ICAMAX
      REAL               CLANTR, SLAMCH
      EXTERNAL           lsame, icamax, clantr, slamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           clacn2, clatrs, csrscl, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, real
*     ..
*     .. Executable Statements ..
*
*     Decode the option characters, then validate the arguments in
*     positional order so that INFO names the first illegal one.
*
      info = 0
      uptri = lsame( uplo, 'U' )
      useone = norm.EQ.'1' .OR. lsame( norm, 'O' )
      nonunt = lsame( diag, 'N' )
*
      IF( .NOT.useone .AND. .NOT.lsame( norm, 'I' ) ) THEN
         info = -1
      ELSE IF( .NOT.uptri .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -2
      ELSE IF( .NOT.nonunt .AND. .NOT.lsame( diag, 'U' ) ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -6
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTRCON', -info )
         RETURN
      END IF
*
*     An empty matrix is treated as perfectly conditioned.
*
      IF( n.EQ.0 ) THEN
         rcond = one
         RETURN
      END IF
*
      rcond = zero
      smlnum = slamch( 'Safe minimum' )*real( max( 1, n ) )
*
*     Norm of the triangular matrix A; nothing more to do unless it
*     is strictly positive (RCOND stays 0 otherwise).
*
      anorm = clantr( norm, uplo, diag, n, n, a, lda, rwork )
      IF( .NOT.( anorm.GT.zero ) ) RETURN
*
*     Estimate norm(inv(A)).  KFWD is the KASE value for which the
*     solve with A itself is performed; any other nonzero KASE uses
*     the conjugate transpose.
*
      ainvnm = zero
      nrmflg = 'N'
      kfwd = 2
      IF( useone ) kfwd = 1
      kase = 0
*
*     CLACN2 is called repeatedly until it reports KASE = 0; between
*     calls WORK(1:N) is overwritten by the requested solve.
*
      DO
         CALL clacn2( n, work( n+1 ), work, ainvnm, kase, isave )
         IF( kase.EQ.0 ) EXIT
*
         IF( kase.EQ.kfwd ) THEN
*
*           Multiply by inv(A).
*
            CALL clatrs( uplo, 'No transpose', diag, nrmflg, n, a,
     $                   lda, work, scale, rwork, info )
         ELSE
*
*           Multiply by inv(A**H).
*
            CALL clatrs( uplo, 'Conjugate transpose', diag, nrmflg,
     $                   n, a, lda, work, scale, rwork, info )
         END IF
*
*        After the first solve the flag passed to CLATRS is 'Y'.
*
         nrmflg = 'Y'
*
*        Multiply by 1/SCALE if doing so will not cause overflow;
*        otherwise give up and return with RCOND = 0.
*
         IF( scale.NE.one ) THEN
            imax = icamax( n, work, 1 )
            wmax = abs( real( work( imax ) ) ) +
     $             abs( aimag( work( imax ) ) )
            IF( scale.LT.wmax*smlnum .OR. scale.EQ.zero ) RETURN
            CALL csrscl( n, scale, work, 1 )
         END IF
      END DO
*
*     Compute the estimate of the reciprocal condition number.
*
      IF( ainvnm.NE.zero ) rcond = ( one / anorm ) / ainvnm
*
      RETURN
*
*     End of CTRCON
*

◆ ctrevc()

subroutine ctrevc	(	character	side,
		character	howmny,
		logical, dimension( * )	select,
		integer	n,
		complex, dimension( ldt, * )	t,
		integer	ldt,
		complex, dimension( ldvl, * )	vl,
		integer	ldvl,
		complex, dimension( ldvr, * )	vr,
		integer	ldvr,
		integer	mm,
		integer	m,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CTREVC

Download CTREVC + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTREVC computes some or all of the right and/or left eigenvectors of
!> a complex upper triangular matrix T.
!> Matrices of this type are produced by the Schur factorization of
!> a complex general matrix:  A = Q*T*Q**H, as computed by CHSEQR.
!>
!> The right eigenvector x and the left eigenvector y of T corresponding
!> to an eigenvalue w are defined by:
!>
!>              T*x = w*x,     (y**H)*T = w*(y**H)
!>
!> where y**H denotes the conjugate transpose of the vector y.
!> The eigenvalues are not input to this routine, but are read directly
!> from the diagonal of T.
!>
!> This routine returns the matrices X and/or Y of right and left
!> eigenvectors of T, or the products Q*X and/or Q*Y, where Q is an
!> input matrix.  If Q is the unitary factor that reduces a matrix A to
!> Schur form T, then Q*X and Q*Y are the matrices of right and left
!> eigenvectors of A.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'R': compute right eigenvectors only; !> = 'L': compute left eigenvectors only; !> = 'B': compute both right and left eigenvectors. !>
[in]	HOWMNY	!> HOWMNY is CHARACTER*1 !> = 'A': compute all right and/or left eigenvectors; !> = 'B': compute all right and/or left eigenvectors, !> backtransformed using the matrices supplied in !> VR and/or VL; !> = 'S': compute selected right and/or left eigenvectors, !> as indicated by the logical array SELECT. !>
[in]	SELECT	!> SELECT is LOGICAL array, dimension (N) !> If HOWMNY = 'S', SELECT specifies the eigenvectors to be !> computed. !> The eigenvector corresponding to the j-th eigenvalue is !> computed if SELECT(j) = .TRUE.. !> Not referenced if HOWMNY = 'A' or 'B'. !>
[in]	N	!> N is INTEGER !> The order of the matrix T. N >= 0. !>
[in,out]	T	!> T is COMPLEX array, dimension (LDT,N) !> The upper triangular matrix T. T is modified, but restored !> on exit. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= max(1,N). !>
[in,out]	VL	!> VL is COMPLEX array, dimension (LDVL,MM) !> On entry, if SIDE = 'L' or 'B' and HOWMNY = 'B', VL must !> contain an N-by-N matrix Q (usually the unitary matrix Q of !> Schur vectors returned by CHSEQR). !> On exit, if SIDE = 'L' or 'B', VL contains: !> if HOWMNY = 'A', the matrix Y of left eigenvectors of T; !> if HOWMNY = 'B', the matrix Q*Y; !> if HOWMNY = 'S', the left eigenvectors of T specified by !> SELECT, stored consecutively in the columns !> of VL, in the same order as their !> eigenvalues. !> Not referenced if SIDE = 'R'. !>
[in]	LDVL	!> LDVL is INTEGER !> The leading dimension of the array VL. LDVL >= 1, and if !> SIDE = 'L' or 'B', LDVL >= N. !>
[in,out]	VR	!> VR is COMPLEX array, dimension (LDVR,MM) !> On entry, if SIDE = 'R' or 'B' and HOWMNY = 'B', VR must !> contain an N-by-N matrix Q (usually the unitary matrix Q of !> Schur vectors returned by CHSEQR). !> On exit, if SIDE = 'R' or 'B', VR contains: !> if HOWMNY = 'A', the matrix X of right eigenvectors of T; !> if HOWMNY = 'B', the matrix Q*X; !> if HOWMNY = 'S', the right eigenvectors of T specified by !> SELECT, stored consecutively in the columns !> of VR, in the same order as their !> eigenvalues. !> Not referenced if SIDE = 'L'. !>
[in]	LDVR	!> LDVR is INTEGER !> The leading dimension of the array VR. LDVR >= 1, and if !> SIDE = 'R' or 'B', LDVR >= N. !>
[in]	MM	!> MM is INTEGER !> The number of columns in the arrays VL and/or VR. MM >= M. !>
[out]	M	!> M is INTEGER !> The number of columns in the arrays VL and/or VR actually !> used to store the eigenvectors. If HOWMNY = 'A' or 'B', M !> is set to N. Each selected eigenvector occupies one !> column. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The algorithm used in this program is basically backward (forward)
!>  substitution, with scaling to make the code robust against
!>  possible overflow.
!>
!>  Each eigenvector is normalized so that the element of largest
!>  magnitude has magnitude 1; here the magnitude of a complex number
!>  (x,y) is taken to be |x| + |y|.
!>

Definition at line 216 of file ctrevc.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          HOWMNY, SIDE
      INTEGER            INFO, LDT, LDVL, LDVR, M, MM, N
*     ..
*     .. Array Arguments ..
      LOGICAL            SELECT( * )
      REAL               RWORK( * )
      COMPLEX            T( LDT, * ), VL( LDVL, * ), VR( LDVR, * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE
      parameter( zero = 0.0e+0, one = 1.0e+0 )
      COMPLEX            CMZERO, CMONE
      parameter( cmzero = ( 0.0e+0, 0.0e+0 ),
     $                   cmone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            ALLV, BOTHV, LEFTV, OVER, RIGHTV, SOMEV
      INTEGER            I, II, IS, J, K, KI
      REAL               OVFL, REMAX, SCALE, SMIN, SMLNUM, ULP, UNFL
      COMPLEX            CDUM
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ICAMAX
      REAL               SCASUM, SLAMCH
      EXTERNAL           lsame, icamax, scasum, slamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           ccopy, cgemv, clatrs, csscal, slabad, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, cmplx, conjg, max, real
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
      cabs1( cdum ) = abs( real( cdum ) ) + abs( aimag( cdum ) )
*     ..
*     .. Executable Statements ..
*
*     Decode and test the input parameters
*
      bothv = lsame( side, 'B' )
      rightv = lsame( side, 'R' ) .OR. bothv
      leftv = lsame( side, 'L' ) .OR. bothv
*
      allv = lsame( howmny, 'A' )
      over = lsame( howmny, 'B' )
      somev = lsame( howmny, 'S' )
*
*     Set M to the number of columns required to store the selected
*     eigenvectors.
*
      IF( somev ) THEN
         m = 0
         DO 10 j = 1, n
            IF( SELECT( j ) )
     $         m = m + 1
   10    CONTINUE
      ELSE
         m = n
      END IF
*
      info = 0
      IF( .NOT.rightv .AND. .NOT.leftv ) THEN
         info = -1
      ELSE IF( .NOT.allv .AND. .NOT.over .AND. .NOT.somev ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( ldt.LT.max( 1, n ) ) THEN
         info = -6
      ELSE IF( ldvl.LT.1 .OR. ( leftv .AND. ldvl.LT.n ) ) THEN
         info = -8
      ELSE IF( ldvr.LT.1 .OR. ( rightv .AND. ldvr.LT.n ) ) THEN
         info = -10
      ELSE IF( mm.LT.m ) THEN
         info = -11
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTREVC', -info )
         RETURN
      END IF
*
*     Quick return if possible.
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Set the constants to control overflow.
*
      unfl = slamch( 'Safe minimum' )
      ovfl = one / unfl
      CALL slabad( unfl, ovfl )
      ulp = slamch( 'Precision' )
      smlnum = unfl*( n / ulp )
*
*     Store the diagonal elements of T in working array WORK.
*
      DO 20 i = 1, n
         work( i+n ) = t( i, i )
   20 CONTINUE
*
*     Compute 1-norm of each column of strictly upper triangular
*     part of T to control overflow in triangular solver.
*
      rwork( 1 ) = zero
      DO 30 j = 2, n
         rwork( j ) = scasum( j-1, t( 1, j ), 1 )
   30 CONTINUE
*
      IF( rightv ) THEN
*
*        Compute right eigenvectors.
*
         is = m
         DO 80 ki = n, 1, -1
*
            IF( somev ) THEN
               IF( .NOT.SELECT( ki ) )
     $            GO TO 80
            END IF
            smin = max( ulp*( cabs1( t( ki, ki ) ) ), smlnum )
*
            work( 1 ) = cmone
*
*           Form right-hand side.
*
            DO 40 k = 1, ki - 1
               work( k ) = -t( k, ki )
   40       CONTINUE
*
*           Solve the triangular system:
*              (T(1:KI-1,1:KI-1) - T(KI,KI))*X = SCALE*WORK.
*
            DO 50 k = 1, ki - 1
               t( k, k ) = t( k, k ) - t( ki, ki )
               IF( cabs1( t( k, k ) ).LT.smin )
     $            t( k, k ) = smin
   50       CONTINUE
*
            IF( ki.GT.1 ) THEN
               CALL clatrs( 'Upper', 'No transpose', 'Non-unit', 'Y',
     $                      ki-1, t, ldt, work( 1 ), scale, rwork,
     $                      info )
               work( ki ) = scale
            END IF
*
*           Copy the vector x or Q*x to VR and normalize.
*
            IF( .NOT.over ) THEN
               CALL ccopy( ki, work( 1 ), 1, vr( 1, is ), 1 )
*
               ii = icamax( ki, vr( 1, is ), 1 )
               remax = one / cabs1( vr( ii, is ) )
               CALL csscal( ki, remax, vr( 1, is ), 1 )
*
               DO 60 k = ki + 1, n
                  vr( k, is ) = cmzero
   60          CONTINUE
            ELSE
               IF( ki.GT.1 )
     $            CALL cgemv( 'N', n, ki-1, cmone, vr, ldvr, work( 1 ),
     $                        1, cmplx( scale ), vr( 1, ki ), 1 )
*
               ii = icamax( n, vr( 1, ki ), 1 )
               remax = one / cabs1( vr( ii, ki ) )
               CALL csscal( n, remax, vr( 1, ki ), 1 )
            END IF
*
*           Set back the original diagonal elements of T.
*
            DO 70 k = 1, ki - 1
               t( k, k ) = work( k+n )
   70       CONTINUE
*
            is = is - 1
   80    CONTINUE
      END IF
*
      IF( leftv ) THEN
*
*        Compute left eigenvectors.
*
         is = 1
         DO 130 ki = 1, n
*
            IF( somev ) THEN
               IF( .NOT.SELECT( ki ) )
     $            GO TO 130
            END IF
            smin = max( ulp*( cabs1( t( ki, ki ) ) ), smlnum )
*
            work( n ) = cmone
*
*           Form right-hand side.
*
            DO 90 k = ki + 1, n
               work( k ) = -conjg( t( ki, k ) )
   90       CONTINUE
*
*           Solve the triangular system:
*              (T(KI+1:N,KI+1:N) - T(KI,KI))**H*X = SCALE*WORK.
*
            DO 100 k = ki + 1, n
               t( k, k ) = t( k, k ) - t( ki, ki )
               IF( cabs1( t( k, k ) ).LT.smin )
     $            t( k, k ) = smin
  100       CONTINUE
*
            IF( ki.LT.n ) THEN
               CALL clatrs( 'Upper', 'Conjugate transpose', 'Non-unit',
     $                      'Y', n-ki, t( ki+1, ki+1 ), ldt,
     $                      work( ki+1 ), scale, rwork, info )
               work( ki ) = scale
            END IF
*
*           Copy the vector x or Q*x to VL and normalize.
*
            IF( .NOT.over ) THEN
               CALL ccopy( n-ki+1, work( ki ), 1, vl( ki, is ), 1 )
*
               ii = icamax( n-ki+1, vl( ki, is ), 1 ) + ki - 1
               remax = one / cabs1( vl( ii, is ) )
               CALL csscal( n-ki+1, remax, vl( ki, is ), 1 )
*
               DO 110 k = 1, ki - 1
                  vl( k, is ) = cmzero
  110          CONTINUE
            ELSE
               IF( ki.LT.n )
     $            CALL cgemv( 'N', n, n-ki, cmone, vl( 1, ki+1 ), ldvl,
     $                        work( ki+1 ), 1, cmplx( scale ),
     $                        vl( 1, ki ), 1 )
*
               ii = icamax( n, vl( 1, ki ), 1 )
               remax = one / cabs1( vl( ii, ki ) )
               CALL csscal( n, remax, vl( 1, ki ), 1 )
            END IF
*
*           Set back the original diagonal elements of T.
*
            DO 120 k = ki + 1, n
               t( k, k ) = work( k+n )
  120       CONTINUE
*
            is = is + 1
  130    CONTINUE
      END IF
*
      RETURN
*
*     End of CTREVC
*

◆ ctrevc3()

subroutine ctrevc3	(	character	side,
		character	howmny,
		logical, dimension( * )	select,
		integer	n,
		complex, dimension( ldt, * )	t,
		integer	ldt,
		complex, dimension( ldvl, * )	vl,
		integer	ldvl,
		complex, dimension( ldvr, * )	vr,
		integer	ldvr,
		integer	mm,
		integer	m,
		complex, dimension( * )	work,
		integer	lwork,
		real, dimension( * )	rwork,
		integer	lrwork,
		integer	info )

CTREVC3

Download CTREVC3 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTREVC3 computes some or all of the right and/or left eigenvectors of
!> a complex upper triangular matrix T.
!> Matrices of this type are produced by the Schur factorization of
!> a complex general matrix:  A = Q*T*Q**H, as computed by CHSEQR.
!>
!> The right eigenvector x and the left eigenvector y of T corresponding
!> to an eigenvalue w are defined by:
!>
!>              T*x = w*x,     (y**H)*T = w*(y**H)
!>
!> where y**H denotes the conjugate transpose of the vector y.
!> The eigenvalues are not input to this routine, but are read directly
!> from the diagonal of T.
!>
!> This routine returns the matrices X and/or Y of right and left
!> eigenvectors of T, or the products Q*X and/or Q*Y, where Q is an
!> input matrix. If Q is the unitary factor that reduces a matrix A to
!> Schur form T, then Q*X and Q*Y are the matrices of right and left
!> eigenvectors of A.
!>
!> This uses a Level 3 BLAS version of the back transformation.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'R': compute right eigenvectors only; !> = 'L': compute left eigenvectors only; !> = 'B': compute both right and left eigenvectors. !>
[in]	HOWMNY	!> HOWMNY is CHARACTER*1 !> = 'A': compute all right and/or left eigenvectors; !> = 'B': compute all right and/or left eigenvectors, !> backtransformed using the matrices supplied in !> VR and/or VL; !> = 'S': compute selected right and/or left eigenvectors, !> as indicated by the logical array SELECT. !>
[in]	SELECT	!> SELECT is LOGICAL array, dimension (N) !> If HOWMNY = 'S', SELECT specifies the eigenvectors to be !> computed. !> The eigenvector corresponding to the j-th eigenvalue is !> computed if SELECT(j) = .TRUE.. !> Not referenced if HOWMNY = 'A' or 'B'. !>
[in]	N	!> N is INTEGER !> The order of the matrix T. N >= 0. !>
[in,out]	T	!> T is COMPLEX array, dimension (LDT,N) !> The upper triangular matrix T. T is modified, but restored !> on exit. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= max(1,N). !>
[in,out]	VL	!> VL is COMPLEX array, dimension (LDVL,MM) !> On entry, if SIDE = 'L' or 'B' and HOWMNY = 'B', VL must !> contain an N-by-N matrix Q (usually the unitary matrix Q of !> Schur vectors returned by CHSEQR). !> On exit, if SIDE = 'L' or 'B', VL contains: !> if HOWMNY = 'A', the matrix Y of left eigenvectors of T; !> if HOWMNY = 'B', the matrix Q*Y; !> if HOWMNY = 'S', the left eigenvectors of T specified by !> SELECT, stored consecutively in the columns !> of VL, in the same order as their !> eigenvalues. !> Not referenced if SIDE = 'R'. !>
[in]	LDVL	!> LDVL is INTEGER !> The leading dimension of the array VL. !> LDVL >= 1, and if SIDE = 'L' or 'B', LDVL >= N. !>
[in,out]	VR	!> VR is COMPLEX array, dimension (LDVR,MM) !> On entry, if SIDE = 'R' or 'B' and HOWMNY = 'B', VR must !> contain an N-by-N matrix Q (usually the unitary matrix Q of !> Schur vectors returned by CHSEQR). !> On exit, if SIDE = 'R' or 'B', VR contains: !> if HOWMNY = 'A', the matrix X of right eigenvectors of T; !> if HOWMNY = 'B', the matrix Q*X; !> if HOWMNY = 'S', the right eigenvectors of T specified by !> SELECT, stored consecutively in the columns !> of VR, in the same order as their !> eigenvalues. !> Not referenced if SIDE = 'L'. !>
[in]	LDVR	!> LDVR is INTEGER !> The leading dimension of the array VR. !> LDVR >= 1, and if SIDE = 'R' or 'B', LDVR >= N. !>
[in]	MM	!> MM is INTEGER !> The number of columns in the arrays VL and/or VR. MM >= M. !>
[out]	M	!> M is INTEGER !> The number of columns in the arrays VL and/or VR actually !> used to store the eigenvectors. !> If HOWMNY = 'A' or 'B', M is set to N. !> Each selected eigenvector occupies one column. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of array WORK. LWORK >= max(1,2*N). !> For optimum performance, LWORK >= N + 2*N*NB, where NB is !> the optimal blocksize. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	RWORK	!> RWORK is REAL array, dimension (LRWORK) !>
[in]	LRWORK	!> LRWORK is INTEGER !> The dimension of array RWORK. LRWORK >= max(1,N). !> !> If LRWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the RWORK array, returns !> this value as the first entry of the RWORK array, and no error !> message related to LRWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The algorithm used in this program is basically backward (forward)
!>  substitution, with scaling to make the code robust against
!>  possible overflow.
!>
!>  Each eigenvector is normalized so that the element of largest
!>  magnitude has magnitude 1; here the magnitude of a complex number
!>  (x,y) is taken to be |x| + |y|.
!>

Definition at line 242 of file ctrevc3.f.

      IMPLICIT NONE
*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of CTREVC3: computes right and/or left eigenvectors of the
*  complex upper triangular matrix T, one eigenvalue T(KI,KI) at a
*  time, by solving a shifted triangular system with CLATRS.  When
*  HOWMNY = 'B' the vectors are back-transformed by the matrix
*  supplied in VR/VL, either one at a time (CGEMV) or in blocks of
*  up to NB vectors (CGEMM) if LWORK is large enough.
*
*  Layout of WORK, viewed as an N-by-(1+2*NB) array:
*     column 0          : saved original diagonal of T
*     columns 1:NB      : eigenvectors of T for the current block
*     columns NB+1:2*NB : CGEMM output (back-transformed vectors)
*
*     .. Scalar Arguments ..
      CHARACTER          HOWMNY, SIDE
      INTEGER            INFO, LDT, LDVL, LDVR, LWORK, LRWORK, M, MM, N
*     ..
*     .. Array Arguments ..
      LOGICAL            SELECT( * )
      REAL               RWORK( * )
      COMPLEX            T( LDT, * ), VL( LDVL, * ), VR( LDVR, * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE
      parameter( zero = 0.0e+0, one = 1.0e+0 )
      COMPLEX            CZERO, CONE
      parameter( czero = ( 0.0e+0, 0.0e+0 ),
     $                     cone  = ( 1.0e+0, 0.0e+0 ) )
*     NBMIN is the smallest block size for which the blocked
*     back-transformation is used; NBMAX caps the block size.
      INTEGER            NBMIN, NBMAX
      parameter( nbmin = 8, nbmax = 128 )
*     ..
*     .. Local Scalars ..
      LOGICAL            ALLV, BOTHV, LEFTV, LQUERY, OVER, RIGHTV, SOMEV
      INTEGER            I, II, IS, J, K, KI, IV, MAXWRK, NB
      REAL               OVFL, REMAX, SCALE, SMIN, SMLNUM, ULP, UNFL
      COMPLEX            CDUM
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV, ICAMAX
      REAL               SLAMCH, SCASUM
      EXTERNAL           lsame, ilaenv, icamax, slamch, scasum
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla, ccopy, claset, csscal, cgemm, cgemv,
     $                   clatrs, clacpy, slabad
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, real, cmplx, conjg, aimag, max, min
*     ..
*     .. Statement Functions ..
      REAL   CABS1
*     ..
*     .. Statement Function definitions ..
*     CABS1 is the |re| + |im| magnitude used for all normalizations.
      cabs1( cdum ) = abs( real( cdum ) ) + abs( aimag( cdum ) )
*     ..
*     .. Executable Statements ..
*
*     Decode and test the input parameters
*
      bothv  = lsame( side, 'B' )
      rightv = lsame( side, 'R' ) .OR. bothv
      leftv  = lsame( side, 'L' ) .OR. bothv
*
      allv  = lsame( howmny, 'A' )
      over  = lsame( howmny, 'B' )
      somev = lsame( howmny, 'S' )
*
*     Set M to the number of columns required to store the selected
*     eigenvectors.
*
      IF( somev ) THEN
         m = 0
         DO 10 j = 1, n
            IF( SELECT( j ) )
     $         m = m + 1
   10    CONTINUE
      ELSE
         m = n
      END IF
*
*     Report the workspace sizes in WORK(1) and RWORK(1).  Both are
*     clamped to at least 1 so that the sizes returned by a workspace
*     query with N = 0 satisfy the LWORK >= max(1,2*N) and
*     LRWORK >= max(1,N) checks below when passed back in.
*
      info = 0
      nb = ilaenv( 1, 'CTREVC', side // howmny, n, -1, -1, -1 )
      maxwrk = max( 1, n + 2*n*nb )
      work(1) = maxwrk
      rwork(1) = max( 1, n )
      lquery = ( lwork.EQ.-1 .OR. lrwork.EQ.-1 )
      IF( .NOT.rightv .AND. .NOT.leftv ) THEN
         info = -1
      ELSE IF( .NOT.allv .AND. .NOT.over .AND. .NOT.somev ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( ldt.LT.max( 1, n ) ) THEN
         info = -6
      ELSE IF( ldvl.LT.1 .OR. ( leftv .AND. ldvl.LT.n ) ) THEN
         info = -8
      ELSE IF( ldvr.LT.1 .OR. ( rightv .AND. ldvr.LT.n ) ) THEN
         info = -10
      ELSE IF( mm.LT.m ) THEN
         info = -11
      ELSE IF( lwork.LT.max( 1, 2*n ) .AND. .NOT.lquery ) THEN
         info = -14
      ELSE IF ( lrwork.LT.max( 1, n ) .AND. .NOT.lquery ) THEN
         info = -16
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTREVC3', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible.
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Use blocked version of back-transformation if sufficient workspace.
*     Zero-out the workspace to avoid potential NaN propagation.
*     NB is recomputed from the workspace actually supplied and capped
*     at NBMAX; otherwise NB = 1 selects the unblocked code paths.
*
      IF( over .AND. lwork .GE. n + 2*n*nbmin ) THEN
         nb = (lwork - n) / (2*n)
         nb = min( nb, nbmax )
         CALL claset( 'F', n, 1+2*nb, czero, czero, work, n )
      ELSE
         nb = 1
      END IF
*
*     Set the constants to control overflow.
*
      unfl = slamch( 'Safe minimum' )
      ovfl = one / unfl
      CALL slabad( unfl, ovfl )
      ulp = slamch( 'Precision' )
      smlnum = unfl*( n / ulp )
*
*     Store the diagonal elements of T in working array WORK.
*     (T's diagonal is overwritten by the shifted diagonal inside the
*     loops below and restored from this copy after each vector.)
*
      DO 20 i = 1, n
         work( i ) = t( i, i )
   20 CONTINUE
*
*     Compute 1-norm of each column of strictly upper triangular
*     part of T to control overflow in triangular solver.
*
      rwork( 1 ) = zero
      DO 30 j = 2, n
         rwork( j ) = scasum( j-1, t( 1, j ), 1 )
   30 CONTINUE
*
      IF( rightv ) THEN
*
*        ============================================================
*        Compute right eigenvectors.
*
*        IV is index of column in current block.
*        Non-blocked version always uses IV=NB=1;
*        blocked     version starts with IV=NB, goes down to 1.
*        (Note the "0-th" column is used to store the original diagonal.)
*        IS is the column of VR that receives the next vector when
*        no back-transformation is done; it counts down from M.
         iv = nb
         is = m
         DO 80 ki = n, 1, -1
            IF( somev ) THEN
               IF( .NOT.SELECT( ki ) )
     $            GO TO 80
            END IF
*           SMIN is the floor applied to the shifted diagonal entries.
            smin = max( ulp*( cabs1( t( ki, ki ) ) ), smlnum )
*
*           --------------------------------------------------------
*           Complex right eigenvector
*
            work( ki + iv*n ) = cone
*
*           Form right-hand side.
*
            DO 40 k = 1, ki - 1
               work( k + iv*n ) = -t( k, ki )
   40       CONTINUE
*
*           Solve upper triangular system:
*           [ T(1:KI-1,1:KI-1) - T(KI,KI) ]*X = SCALE*WORK.
*           The shift is applied in place on the diagonal of T.
*
            DO 50 k = 1, ki - 1
               t( k, k ) = t( k, k ) - t( ki, ki )
               IF( cabs1( t( k, k ) ).LT.smin )
     $            t( k, k ) = smin
   50       CONTINUE
*
            IF( ki.GT.1 ) THEN
               CALL clatrs( 'Upper', 'No transpose', 'Non-unit', 'Y',
     $                      ki-1, t, ldt, work( 1 + iv*n ), scale,
     $                      rwork, info )
               work( ki + iv*n ) = scale
            END IF
*
*           Copy the vector x or Q*x to VR and normalize.
*
            IF( .NOT.over ) THEN
*              ------------------------------
*              no back-transform: copy x to VR and normalize.
               CALL ccopy( ki, work( 1 + iv*n ), 1, vr( 1, is ), 1 )
*
               ii = icamax( ki, vr( 1, is ), 1 )
               remax = one / cabs1( vr( ii, is ) )
               CALL csscal( ki, remax, vr( 1, is ), 1 )
*
               DO 60 k = ki + 1, n
                  vr( k, is ) = czero
   60          CONTINUE
*
            ELSE IF( nb.EQ.1 ) THEN
*              ------------------------------
*              version 1: back-transform each vector with GEMV, Q*x.
               IF( ki.GT.1 )
     $            CALL cgemv( 'N', n, ki-1, cone, vr, ldvr,
     $                        work( 1 + iv*n ), 1, cmplx( scale ),
     $                        vr( 1, ki ), 1 )
*
               ii = icamax( n, vr( 1, ki ), 1 )
               remax = one / cabs1( vr( ii, ki ) )
               CALL csscal( n, remax, vr( 1, ki ), 1 )
*
            ELSE
*              ------------------------------
*              version 2: back-transform block of vectors with GEMM
*              zero out below vector
               DO k = ki + 1, n
                  work( k + iv*n ) = czero
               END DO
*
*              Columns IV:NB of work are valid vectors.
*              When the number of vectors stored reaches NB,
*              or if this was last vector, do the GEMM
               IF( (iv.EQ.1) .OR. (ki.EQ.1) ) THEN
                  CALL cgemm( 'N', 'N', n, nb-iv+1, ki+nb-iv, cone,
     $                        vr, ldvr,
     $                        work( 1 + (iv)*n    ), n,
     $                        czero,
     $                        work( 1 + (nb+iv)*n ), n )
*                 normalize vectors
                  DO k = iv, nb
                     ii = icamax( n, work( 1 + (nb+k)*n ), 1 )
                     remax = one / cabs1( work( ii + (nb+k)*n ) )
                     CALL csscal( n, remax, work( 1 + (nb+k)*n ), 1 )
                  END DO
                  CALL clacpy( 'F', n, nb-iv+1,
     $                         work( 1 + (nb+iv)*n ), n,
     $                         vr( 1, ki ), ldvr )
*                 start filling a new block from its last column
                  iv = nb
               ELSE
                  iv = iv - 1
               END IF
            END IF
*
*           Restore the original diagonal elements of T.
*
            DO 70 k = 1, ki - 1
               t( k, k ) = work( k )
   70       CONTINUE
*
            is = is - 1
   80    CONTINUE
      END IF
*
      IF( leftv ) THEN
*
*        ============================================================
*        Compute left eigenvectors.
*
*        IV is index of column in current block.
*        Non-blocked version always uses IV=1;
*        blocked     version starts with IV=1, goes up to NB.
*        (Note the "0-th" column is used to store the original diagonal.)
*        IS is the column of VL that receives the next vector when
*        no back-transformation is done; it counts up from 1.
         iv = 1
         is = 1
         DO 130 ki = 1, n
*
            IF( somev ) THEN
               IF( .NOT.SELECT( ki ) )
     $            GO TO 130
            END IF
*           SMIN is the floor applied to the shifted diagonal entries.
            smin = max( ulp*( cabs1( t( ki, ki ) ) ), smlnum )
*
*           --------------------------------------------------------
*           Complex left eigenvector
*
            work( ki + iv*n ) = cone
*
*           Form right-hand side.
*
            DO 90 k = ki + 1, n
               work( k + iv*n ) = -conjg( t( ki, k ) )
   90       CONTINUE
*
*           Solve conjugate-transposed triangular system:
*           [ T(KI+1:N,KI+1:N) - T(KI,KI) ]**H * X = SCALE*WORK.
*           The shift is applied in place on the diagonal of T.
*
            DO 100 k = ki + 1, n
               t( k, k ) = t( k, k ) - t( ki, ki )
               IF( cabs1( t( k, k ) ).LT.smin )
     $            t( k, k ) = smin
  100       CONTINUE
*
            IF( ki.LT.n ) THEN
               CALL clatrs( 'Upper', 'Conjugate transpose', 'Non-unit',
     $                      'Y', n-ki, t( ki+1, ki+1 ), ldt,
     $                      work( ki+1 + iv*n ), scale, rwork, info )
               work( ki + iv*n ) = scale
            END IF
*
*           Copy the vector x or Q*x to VL and normalize.
*
            IF( .NOT.over ) THEN
*              ------------------------------
*              no back-transform: copy x to VL and normalize.
               CALL ccopy( n-ki+1, work( ki + iv*n ), 1, vl(ki,is), 1 )
*
               ii = icamax( n-ki+1, vl( ki, is ), 1 ) + ki - 1
               remax = one / cabs1( vl( ii, is ) )
               CALL csscal( n-ki+1, remax, vl( ki, is ), 1 )
*
               DO 110 k = 1, ki - 1
                  vl( k, is ) = czero
  110          CONTINUE
*
            ELSE IF( nb.EQ.1 ) THEN
*              ------------------------------
*              version 1: back-transform each vector with GEMV, Q*x.
               IF( ki.LT.n )
     $            CALL cgemv( 'N', n, n-ki, cone, vl( 1, ki+1 ), ldvl,
     $                        work( ki+1 + iv*n ), 1, cmplx( scale ),
     $                        vl( 1, ki ), 1 )
*
               ii = icamax( n, vl( 1, ki ), 1 )
               remax = one / cabs1( vl( ii, ki ) )
               CALL csscal( n, remax, vl( 1, ki ), 1 )
*
            ELSE
*              ------------------------------
*              version 2: back-transform block of vectors with GEMM
*              zero out above vector
*              could go from KI-NV+1 to KI-1
*              NOTE(review): NV is not a variable of this routine;
*              presumably IV is meant -- confirm.
               DO k = 1, ki - 1
                  work( k + iv*n ) = czero
               END DO
*
*              Columns 1:IV of work are valid vectors.
*              When the number of vectors stored reaches NB,
*              or if this was last vector, do the GEMM
               IF( (iv.EQ.nb) .OR. (ki.EQ.n) ) THEN
                  CALL cgemm( 'N', 'N', n, iv, n-ki+iv, cone,
     $                        vl( 1, ki-iv+1 ), ldvl,
     $                        work( ki-iv+1 + (1)*n ), n,
     $                        czero,
     $                        work( 1 + (nb+1)*n ), n )
*                 normalize vectors
                  DO k = 1, iv
                     ii = icamax( n, work( 1 + (nb+k)*n ), 1 )
                     remax = one / cabs1( work( ii + (nb+k)*n ) )
                     CALL csscal( n, remax, work( 1 + (nb+k)*n ), 1 )
                  END DO
                  CALL clacpy( 'F', n, iv,
     $                         work( 1 + (nb+1)*n ), n,
     $                         vl( 1, ki-iv+1 ), ldvl )
*                 start filling a new block from its first column
                  iv = 1
               ELSE
                  iv = iv + 1
               END IF
            END IF
*
*           Restore the original diagonal elements of T.
*
            DO 120 k = ki + 1, n
               t( k, k ) = work( k )
  120       CONTINUE
*
            is = is + 1
  130    CONTINUE
      END IF
*
      RETURN
*
*     End of CTREVC3
*

◆ ctrexc()

subroutine ctrexc	(	character	compq,
		integer	n,
		complex, dimension( ldt, * )	t,
		integer	ldt,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		integer	ifst,
		integer	ilst,
		integer	info )

CTREXC

Download CTREXC + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTREXC reorders the Schur factorization of a complex matrix
!> A = Q*T*Q**H, so that the diagonal element of T with row index IFST
!> is moved to row ILST.
!>
!> The Schur form T is reordered by a unitary similarity transformation
!> Z**H*T*Z, and optionally the matrix Q of Schur vectors is updated by
!> postmultiplying it with Z.
!>

Parameters

[in]	COMPQ	!> COMPQ is CHARACTER*1 !> = 'V': update the matrix Q of Schur vectors; !> = 'N': do not update Q. !>
[in]	N	!> N is INTEGER !> The order of the matrix T. N >= 0. !> If N == 0 arguments ILST and IFST may be any value. !>
[in,out]	T	!> T is COMPLEX array, dimension (LDT,N) !> On entry, the upper triangular matrix T. !> On exit, the reordered upper triangular matrix. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= max(1,N). !>
[in,out]	Q	!> Q is COMPLEX array, dimension (LDQ,N) !> On entry, if COMPQ = 'V', the matrix Q of Schur vectors. !> On exit, if COMPQ = 'V', Q has been postmultiplied by the !> unitary transformation matrix Z which reorders T. !> If COMPQ = 'N', Q is not referenced. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= 1, and if !> COMPQ = 'V', LDQ >= max(1,N). !>
[in]	IFST	!> IFST is INTEGER !>
[in]	ILST	!> ILST is INTEGER !> !> Specify the reordering of the diagonal elements of T: !> The element with row index IFST is moved to row ILST by a !> sequence of transpositions between adjacent elements. !> 1 <= IFST <= N; 1 <= ILST <= N. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 125 of file ctrexc.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of CTREXC: moves the diagonal element of T at row IFST to
*  row ILST by swapping adjacent diagonal elements one pair at a
*  time with plane rotations, optionally accumulating the rotations
*  into Q.
*
*     .. Scalar Arguments ..
      CHARACTER          COMPQ
      INTEGER            IFST, ILST, INFO, LDQ, LDT, N
*     ..
*     .. Array Arguments ..
      COMPLEX            Q( LDQ, * ), T( LDT, * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      LOGICAL            UPDQ
      INTEGER            K, KFIRST, KLAST, KSTEP
      REAL               C
      COMPLEX            S, SCONJ, DUPPER, DLOWER, RDUMMY
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           clartg, crot, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; INFO = -i flags the i-th argument.
*     IFST and ILST are only range-checked when N > 0.
*
      info = 0
      updq = lsame( compq, 'V' )
      IF( .NOT.( updq .OR. lsame( compq, 'N' ) ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ldt.LT.max( 1, n ) ) THEN
         info = -4
      ELSE IF( ldq.LT.1 .OR. ( updq .AND. ldq.LT.max( 1, n ) ) ) THEN
         info = -6
      ELSE IF( n.GT.0 .AND. ( ifst.LT.1 .OR. ifst.GT.n ) ) THEN
         info = -7
      ELSE IF( n.GT.0 .AND. ( ilst.LT.1 .OR. ilst.GT.n ) ) THEN
         info = -8
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTREXC', -info )
         RETURN
      END IF
*
*     Nothing to do for matrices of order <= 1 or a no-op move.
*
      IF( n.LE.1 .OR. ifst.EQ.ilst )
     $   RETURN
*
*     Choose the sequence of adjacent pairs (K,K+1) to swap.
*
      IF( ifst.LT.ilst ) THEN
*
*        Forward move (down the diagonal): K = IFST, ..., ILST-1.
*
         kfirst = ifst
         klast = ilst - 1
         kstep = 1
      ELSE
*
*        Backward move (up the diagonal): K = IFST-1, ..., ILST.
*
         kfirst = ifst - 1
         klast = ilst
         kstep = -1
      END IF
*
      DO k = kfirst, klast, kstep
*
*        Swap diagonal entries K and K+1 of T.
*
         dupper = t( k, k )
         dlower = t( k+1, k+1 )
*
*        Generate the rotation (C,S) that performs the interchange.
*
         CALL clartg( t( k, k+1 ), dlower-dupper, c, s, rdummy )
         sconj = conjg( s )
*
*        Rotate rows K and K+1 of T to the right of the 2-by-2
*        block, then columns K and K+1 above it.
*
         IF( n-k-1.GT.0 ) THEN
            CALL crot( n-k-1, t( k, k+2 ), ldt, t( k+1, k+2 ), ldt,
     $                 c, s )
         END IF
         CALL crot( k-1, t( 1, k ), 1, t( 1, k+1 ), 1, c, sconj )
*
*        The two diagonal entries simply trade places.
*
         t( k, k ) = dlower
         t( k+1, k+1 ) = dupper
*
*        Apply the same column rotation to Q when requested.
*
         IF( updq ) THEN
            CALL crot( n, q( 1, k ), 1, q( 1, k+1 ), 1, c, sconj )
         END IF
*
      END DO
*
      RETURN
*
*     End of CTREXC
*

◆ ctrrfs()

subroutine ctrrfs	(	character	uplo,
		character	trans,
		character	diag,
		integer	n,
		integer	nrhs,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		complex, dimension( ldx, * )	x,
		integer	ldx,
		real, dimension( * )	ferr,
		real, dimension( * )	berr,
		complex, dimension( * )	work,
		real, dimension( * )	rwork,
		integer	info )

CTRRFS

Download CTRRFS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTRRFS provides error bounds and backward error estimates for the
!> solution to a system of linear equations with a triangular
!> coefficient matrix.
!>
!> The solution matrix X must be computed by CTRTRS or some other
!> means before entering this routine.  CTRRFS does not do iterative
!> refinement because doing so cannot improve the backward error.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> Specifies the form of the system of equations: !> = 'N': A * X = B (No transpose) !> = 'T': A**T * X = B (Transpose) !> = 'C': A**H * X = B (Conjugate transpose) !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> = 'N': A is non-unit triangular; !> = 'U': A is unit triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrices B and X. NRHS >= 0. !>
[in]	A	!> A is COMPLEX array, dimension (LDA,N) !> The triangular matrix A. If UPLO = 'U', the leading N-by-N !> upper triangular part of the array A contains the upper !> triangular matrix, and the strictly lower triangular part of !> A is not referenced. If UPLO = 'L', the leading N-by-N lower !> triangular part of the array A contains the lower triangular !> matrix, and the strictly upper triangular part of A is not !> referenced. If DIAG = 'U', the diagonal elements of A are !> also not referenced and are assumed to be 1. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[in]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> The right hand side matrix B. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[in]	X	!> X is COMPLEX array, dimension (LDX,NRHS) !> The solution matrix X. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the array X. LDX >= max(1,N). !>
[out]	FERR	!> FERR is REAL array, dimension (NRHS) !> The estimated forward error bound for each solution vector !> X(j) (the j-th column of the solution matrix X). !> If XTRUE is the true solution corresponding to X(j), FERR(j) !> is an estimated upper bound for the magnitude of the largest !> element in (X(j) - XTRUE) divided by the magnitude of the !> largest element in X(j). The estimate is as reliable as !> the estimate for RCOND, and is almost always a slight !> overestimate of the true error. !>
[out]	BERR	!> BERR is REAL array, dimension (NRHS) !> The componentwise relative backward error of each solution !> vector X(j) (i.e., the smallest relative change in !> any element of A or B that makes X(j) an exact solution). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (2*N) !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 180 of file ctrrfs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Overview of this listing (body of CTRRFS):
*    1. Validate the arguments; on failure set INFO to minus the
*       position of the offending argument, call XERBLA and return.
*    2. For each column j = 1..NRHS of X:
*       a. form the residual in WORK(1:N);
*       b. accumulate abs(op(A))*abs(X(:,j)) + abs(B(:,j)) in RWORK
*          and derive BERR(j) from it;
*       c. turn RWORK into the weight vector W and let CLACN2 drive
*          triangular solves with CTRSV to obtain FERR(j);
*       d. divide FERR(j) by the largest CABS1 entry of X(:,j).
*  A, B and X are never assigned in this listing; WORK(1:N) and
*  WORK(N+1:2*N) are the two vectors handed to CLACN2.
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, TRANS, UPLO
      INTEGER            INFO, LDA, LDB, LDX, N, NRHS
*     ..
*     .. Array Arguments ..
      REAL               BERR( * ), FERR( * ), RWORK( * )
      COMPLEX            A( LDA, * ), B( LDB, * ), WORK( * ),
     $                   X( LDX, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO
      parameter( zero = 0.0e+0 )
      COMPLEX            ONE
      parameter( one = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            NOTRAN, NOUNIT, UPPER
      CHARACTER          TRANSN, TRANST
      INTEGER            I, J, K, KASE, NZ
      REAL               EPS, LSTRES, S, SAFE1, SAFE2, SAFMIN, XK
      COMPLEX            ZDUM
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           caxpy, ccopy, clacn2, ctrmv, ctrsv, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, real
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SLAMCH
      EXTERNAL           lsame, slamch
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
*     CABS1 is the cheap magnitude abs(Re z) + abs(Im z); it is used
*     everywhere below in place of the true complex modulus.
      cabs1( zdum ) = abs( real( zdum ) ) + abs( aimag( zdum ) )
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      upper = lsame( uplo, 'U' )
      notran = lsame( trans, 'N' )
      nounit = lsame( diag, 'N' )
*
*     The first failing test wins; the INFO values skip 6, 8 and 10
*     because the array arguments A, B and X are not checked here.
*
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'T' ) .AND. .NOT.
     $         lsame( trans, 'C' ) ) THEN
         info = -2
      ELSE IF( .NOT.nounit .AND. .NOT.lsame( diag, 'U' ) ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( nrhs.LT.0 ) THEN
         info = -5
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -7
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -9
      ELSE IF( ldx.LT.max( 1, n ) ) THEN
         info = -11
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTRRFS', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
*     With N = 0 every FERR(j) and BERR(j) is set to zero; with
*     NRHS = 0 the loop body is never executed.
*
      IF( n.EQ.0 .OR. nrhs.EQ.0 ) THEN
         DO 10 j = 1, nrhs
            ferr( j ) = zero
            berr( j ) = zero
   10    CONTINUE
         RETURN
      END IF
*
*     TRANSN / TRANST are the TRANS values passed to CTRSV in the
*     CLACN2 loop (labels 210-230).  Any TRANS other than 'N' maps to
*     the pair ('C','N'), so TRANS = 'T' is treated like 'C' there.
*     NOTE(review): presumably harmless because the estimated norm
*     depends only on entry magnitudes - confirm.
*
      IF( notran ) THEN
         transn = 'N'
         transt = 'C'
      ELSE
         transn = 'C'
         transt = 'N'
      END IF
*
*     NZ = maximum number of nonzero elements in each row of A, plus 1
*
      nz = n + 1
      eps = slamch( 'Epsilon' )
      safmin = slamch( 'Safe minimum' )
      safe1 = nz*safmin
      safe2 = safe1 / eps
*
*     Do for each right hand side
*
      DO 250 j = 1, nrhs
*
*        Compute residual R = B - op(A) * X,
*        where op(A) = A, A**T, or A**H, depending on TRANS.
*
*        The three calls below copy X(:,j) into WORK, apply CTRMV to
*        it and then add -ONE*B(:,j), so WORK(1:N) actually holds
*        op(A)*X - B, i.e. -R.  Only CABS1( WORK(i) ) is read before
*        CLACN2 reuses WORK, so the sign does not matter.
*
         CALL ccopy( n, x( 1, j ), 1, work, 1 )
         CALL ctrmv( uplo, trans, diag, n, a, lda, work, 1 )
         CALL caxpy( n, -one, b( 1, j ), 1, work, 1 )
*
*        Compute componentwise relative backward error from formula
*
*        max(i) ( abs(R(i)) / ( abs(op(A))*abs(X) + abs(B) )(i) )
*
*        where abs(Z) is the componentwise absolute value of the matrix
*        or vector Z.  If the i-th component of the denominator is less
*        than SAFE2, then SAFE1 is added to the i-th components of the
*        numerator and denominator before dividing.
*
         DO 20 i = 1, n
            rwork( i ) = cabs1( b( i, j ) )
   20    CONTINUE
*
*        In the unit-diagonal branches below the diagonal of A is not
*        read; its contribution is added as abs(X(k,j)) directly.
*
         IF( notran ) THEN
*
*           Compute abs(A)*abs(X) + abs(B).
*
            IF( upper ) THEN
               IF( nounit ) THEN
                  DO 40 k = 1, n
                     xk = cabs1( x( k, j ) )
                     DO 30 i = 1, k
                        rwork( i ) = rwork( i ) + cabs1( a( i, k ) )*xk
   30                CONTINUE
   40             CONTINUE
               ELSE
                  DO 60 k = 1, n
                     xk = cabs1( x( k, j ) )
                     DO 50 i = 1, k - 1
                        rwork( i ) = rwork( i ) + cabs1( a( i, k ) )*xk
   50                CONTINUE
                     rwork( k ) = rwork( k ) + xk
   60             CONTINUE
               END IF
            ELSE
               IF( nounit ) THEN
                  DO 80 k = 1, n
                     xk = cabs1( x( k, j ) )
                     DO 70 i = k, n
                        rwork( i ) = rwork( i ) + cabs1( a( i, k ) )*xk
   70                CONTINUE
   80             CONTINUE
               ELSE
                  DO 100 k = 1, n
                     xk = cabs1( x( k, j ) )
                     DO 90 i = k + 1, n
                        rwork( i ) = rwork( i ) + cabs1( a( i, k ) )*xk
   90                CONTINUE
                     rwork( k ) = rwork( k ) + xk
  100             CONTINUE
               END IF
            END IF
         ELSE
*
*           Compute abs(A**H)*abs(X) + abs(B).
*
*           Column k of A is row k of the transposed matrix, so each
*           k yields a single dot-product style sum S for RWORK(k).
*
            IF( upper ) THEN
               IF( nounit ) THEN
                  DO 120 k = 1, n
                     s = zero
                     DO 110 i = 1, k
                        s = s + cabs1( a( i, k ) )*cabs1( x( i, j ) )
  110                CONTINUE
                     rwork( k ) = rwork( k ) + s
  120             CONTINUE
               ELSE
                  DO 140 k = 1, n
                     s = cabs1( x( k, j ) )
                     DO 130 i = 1, k - 1
                        s = s + cabs1( a( i, k ) )*cabs1( x( i, j ) )
  130                CONTINUE
                     rwork( k ) = rwork( k ) + s
  140             CONTINUE
               END IF
            ELSE
               IF( nounit ) THEN
                  DO 160 k = 1, n
                     s = zero
                     DO 150 i = k, n
                        s = s + cabs1( a( i, k ) )*cabs1( x( i, j ) )
  150                CONTINUE
                     rwork( k ) = rwork( k ) + s
  160             CONTINUE
               ELSE
                  DO 180 k = 1, n
                     s = cabs1( x( k, j ) )
                     DO 170 i = k + 1, n
                        s = s + cabs1( a( i, k ) )*cabs1( x( i, j ) )
  170                CONTINUE
                     rwork( k ) = rwork( k ) + s
  180             CONTINUE
               END IF
            END IF
         END IF
*
*        BERR(j) is the largest ratio residual / denominator over all
*        rows, using the SAFE1-shifted ratio for tiny denominators.
*
         s = zero
         DO 190 i = 1, n
            IF( rwork( i ).GT.safe2 ) THEN
               s = max( s, cabs1( work( i ) ) / rwork( i ) )
            ELSE
               s = max( s, ( cabs1( work( i ) )+safe1 ) /
     $             ( rwork( i )+safe1 ) )
            END IF
  190    CONTINUE
         berr( j ) = s
*
*        Bound error from formula
*
*        norm(X - XTRUE) / norm(X) .le. FERR =
*        norm( abs(inv(op(A)))*
*           ( abs(R) + NZ*EPS*( abs(op(A))*abs(X)+abs(B) ))) / norm(X)
*
*        where
*          norm(Z) is the magnitude of the largest component of Z
*          inv(op(A)) is the inverse of op(A)
*          abs(Z) is the componentwise absolute value of the matrix or
*             vector Z
*          NZ is the maximum number of nonzeros in any row of A, plus 1
*          EPS is machine epsilon
*
*        The i-th component of abs(R)+NZ*EPS*(abs(op(A))*abs(X)+abs(B))
*        is incremented by SAFE1 if the i-th component of
*        abs(op(A))*abs(X) + abs(B) is less than SAFE2.
*
*        Use CLACN2 to estimate the infinity-norm of the matrix
*           inv(op(A)) * diag(W),
*        where W = abs(R) + NZ*EPS*( abs(op(A))*abs(X)+abs(B) )))
*
*        From here on RWORK holds W (it is overwritten in place).
*
         DO 200 i = 1, n
            IF( rwork( i ).GT.safe2 ) THEN
               rwork( i ) = cabs1( work( i ) ) + nz*eps*rwork( i )
            ELSE
               rwork( i ) = cabs1( work( i ) ) + nz*eps*rwork( i ) +
     $                      safe1
            END IF
  200    CONTINUE
*
*        Reverse-communication loop: KASE = 0 starts the estimator;
*        each time CLACN2 returns with KASE nonzero the requested
*        product is applied to WORK(1:N) and CLACN2 is called again.
*        The loop ends when CLACN2 returns KASE = 0, with the
*        estimate left in FERR(j).
*
         kase = 0
  210    CONTINUE
         CALL clacn2( n, work( n+1 ), work, ferr( j ), kase, isave )
         IF( kase.NE.0 ) THEN
            IF( kase.EQ.1 ) THEN
*
*              Multiply by diag(W)*inv(op(A)**H).
*
               CALL ctrsv( uplo, transt, diag, n, a, lda, work, 1 )
               DO 220 i = 1, n
                  work( i ) = rwork( i )*work( i )
  220          CONTINUE
            ELSE
*
*              Multiply by inv(op(A))*diag(W).
*
               DO 230 i = 1, n
                  work( i ) = rwork( i )*work( i )
  230          CONTINUE
               CALL ctrsv( uplo, transn, diag, n, a, lda, work, 1 )
            END IF
            GO TO 210
         END IF
*
*        Normalize error.
*
*        LSTRES is the largest CABS1 entry of X(:,j).  When that
*        column is entirely zero the division is skipped and FERR(j)
*        keeps the unnormalized estimate.
*
         lstres = zero
         DO 240 i = 1, n
            lstres = max( lstres, cabs1( x( i, j ) ) )
  240    CONTINUE
         IF( lstres.NE.zero )
     $      ferr( j ) = ferr( j ) / lstres
*
  250 CONTINUE
*
      RETURN
*
*     End of CTRRFS
*

◆ ctrsen()

subroutine ctrsen	(	character	job,
		character	compq,
		logical, dimension( * )	select,
		integer	n,
		complex, dimension( ldt, * )	t,
		integer	ldt,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		complex, dimension( * )	w,
		integer	m,
		real	s,
		real	sep,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CTRSEN

Download CTRSEN + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTRSEN reorders the Schur factorization of a complex matrix
!> A = Q*T*Q**H, so that a selected cluster of eigenvalues appears in
!> the leading positions on the diagonal of the upper triangular matrix
!> T, and the leading columns of Q form an orthonormal basis of the
!> corresponding right invariant subspace.
!>
!> Optionally the routine computes the reciprocal condition numbers of
!> the cluster of eigenvalues and/or the invariant subspace.
!>

Parameters

[in]	JOB	!> JOB is CHARACTER*1 !> Specifies whether condition numbers are required for the !> cluster of eigenvalues (S) or the invariant subspace (SEP): !> = 'N': none; !> = 'E': for eigenvalues only (S); !> = 'V': for invariant subspace only (SEP); !> = 'B': for both eigenvalues and invariant subspace (S and !> SEP). !>
[in]	COMPQ	!> COMPQ is CHARACTER*1 !> = 'V': update the matrix Q of Schur vectors; !> = 'N': do not update Q. !>
[in]	SELECT	!> SELECT is LOGICAL array, dimension (N) !> SELECT specifies the eigenvalues in the selected cluster. To !> select the j-th eigenvalue, SELECT(j) must be set to .TRUE.. !>
[in]	N	!> N is INTEGER !> The order of the matrix T. N >= 0. !>
[in,out]	T	!> T is COMPLEX array, dimension (LDT,N) !> On entry, the upper triangular matrix T. !> On exit, T is overwritten by the reordered matrix T, with the !> selected eigenvalues as the leading diagonal elements. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= max(1,N). !>
[in,out]	Q	!> Q is COMPLEX array, dimension (LDQ,N) !> On entry, if COMPQ = 'V', the matrix Q of Schur vectors. !> On exit, if COMPQ = 'V', Q has been postmultiplied by the !> unitary transformation matrix which reorders T; the leading M !> columns of Q form an orthonormal basis for the specified !> invariant subspace. !> If COMPQ = 'N', Q is not referenced. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. !> LDQ >= 1; and if COMPQ = 'V', LDQ >= N. !>
[out]	W	!> W is COMPLEX array, dimension (N) !> The reordered eigenvalues of T, in the same order as they !> appear on the diagonal of T. !>
[out]	M	!> M is INTEGER !> The dimension of the specified invariant subspace. !> 0 <= M <= N. !>
[out]	S	!> S is REAL !> If JOB = 'E' or 'B', S is a lower bound on the reciprocal !> condition number for the selected cluster of eigenvalues. !> S cannot underestimate the true reciprocal condition number !> by more than a factor of sqrt(N). If M = 0 or N, S = 1. !> If JOB = 'N' or 'V', S is not referenced. !>
[out]	SEP	!> SEP is REAL !> If JOB = 'V' or 'B', SEP is the estimated reciprocal !> condition number of the specified invariant subspace. If !> M = 0 or N, SEP = norm(T). !> If JOB = 'N' or 'E', SEP is not referenced. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If JOB = 'N', LWORK >= 1; !> if JOB = 'E', LWORK >= max(1,M*(N-M)); !> if JOB = 'V' or 'B', LWORK >= max(1,2*M*(N-M)). !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  CTRSEN first collects the selected eigenvalues by computing a unitary
!>  transformation Z to move them to the top left corner of T. In other
!>  words, the selected eigenvalues are the eigenvalues of T11 in:
!>
!>          Z**H * T * Z = ( T11 T12 ) n1
!>                         (  0  T22 ) n2
!>                            n1  n2
!>
!>  where N = n1+n2. The first
!>  n1 columns of Z span the specified invariant subspace of T.
!>
!>  If T has been obtained from the Schur factorization of a matrix
!>  A = Q*T*Q**H, then the reordered Schur factorization of A is given by
!>  A = (Q*Z)*(Z**H*T*Z)*(Q*Z)**H, and the first n1 columns of Q*Z span the
!>  corresponding invariant subspace of A.
!>
!>  The reciprocal condition number of the average of the eigenvalues of
!>  T11 may be returned in S. S lies between 0 (very badly conditioned)
!>  and 1 (very well conditioned). It is computed as follows. First we
!>  compute R so that
!>
!>                         P = ( I  R ) n1
!>                             ( 0  0 ) n2
!>                               n1 n2
!>
!>  is the projector on the invariant subspace associated with T11.
!>  R is the solution of the Sylvester equation:
!>
!>                        T11*R - R*T22 = T12.
!>
!>  Let F-norm(M) denote the Frobenius-norm of M and 2-norm(M) denote
!>  the two-norm of M. Then S is computed as the lower bound
!>
!>                      (1 + F-norm(R)**2)**(-1/2)
!>
!>  on the reciprocal of 2-norm(P), the true reciprocal condition number.
!>  S cannot underestimate 1 / 2-norm(P) by more than a factor of
!>  sqrt(N).
!>
!>  An approximate error bound for the computed average of the
!>  eigenvalues of T11 is
!>
!>                         EPS * norm(T) / S
!>
!>  where EPS is the machine precision.
!>
!>  The reciprocal condition number of the right invariant subspace
!>  spanned by the first n1 columns of Z (or of Q*Z) is returned in SEP.
!>  SEP is defined as the separation of T11 and T22:
!>
!>                     sep( T11, T22 ) = sigma-min( C )
!>
!>  where sigma-min(C) is the smallest singular value of the
!>  n1*n2-by-n1*n2 matrix
!>
!>     C  = kprod( I(n2), T11 ) - kprod( transpose(T22), I(n1) )
!>
!>  I(m) is an m by m identity matrix, and kprod denotes the Kronecker
!>  product. We estimate sigma-min(C) by the reciprocal of an estimate of
!>  the 1-norm of inverse(C). The true reciprocal 1-norm of inverse(C)
!>  cannot differ from sigma-min(C) by more than a factor of sqrt(n1*n2).
!>
!>  When SEP is small, small changes in T can cause large changes in
!>  the invariant subspace. An approximate bound on the maximum angular
!>  error in the computed right invariant subspace is
!>
!>                      EPS * norm(T) / SEP
!>

Definition at line 262 of file ctrsen.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Overview of this listing (body of CTRSEN):
*    1. Decode JOB / COMPQ and count the selected eigenvalues (M).
*    2. Derive the minimum workspace LWMIN from M and validate the
*       arguments; a workspace query (LWORK = -1) returns after
*       storing LWMIN in WORK(1).
*    3. Move every selected diagonal entry of T to the leading
*       positions with CTREXC.
*    4. Optionally compute S (via CTRSYL and CLANGE) and SEP (via
*       the CLACN2 / CTRSYL loop).
*    5. Copy the diagonal of T to W and store LWMIN in WORK(1).
*
*     .. Scalar Arguments ..
      CHARACTER          COMPQ, JOB
      INTEGER            INFO, LDQ, LDT, LWORK, M, N
      REAL               S, SEP
*     ..
*     .. Array Arguments ..
      LOGICAL            SELECT( * )
      COMPLEX            Q( LDQ, * ), T( LDT, * ), W( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE
      parameter( zero = 0.0e+0, one = 1.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            LQUERY, WANTBH, WANTQ, WANTS, WANTSP
      INTEGER            IERR, K, KASE, KS, LWMIN, N1, N2, NN
      REAL               EST, RNORM, SCALE
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
      REAL               RWORK( 1 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               CLANGE
      EXTERNAL           lsame, clange
*     ..
*     .. External Subroutines ..
      EXTERNAL           clacn2, clacpy, ctrexc, ctrsyl, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, sqrt
*     ..
*     .. Executable Statements ..
*
*     Decode and test the input parameters.
*
      wantbh = lsame( job, 'B' )
      wants = lsame( job, 'E' ) .OR. wantbh
      wantsp = lsame( job, 'V' ) .OR. wantbh
      wantq = lsame( compq, 'V' )
*
*     Set M to the number of selected eigenvalues.
*
*     This runs before any argument check, so SELECT(1:N) is read
*     even when another argument later turns out to be invalid; the
*     loop is empty when N <= 0.
*
      m = 0
      DO 10 k = 1, n
         IF( SELECT( k ) )
     $      m = m + 1
   10 CONTINUE
*
*     N1 / N2 are the orders of the leading and trailing diagonal
*     blocks after reordering; NN = N1*N2 is the number of entries
*     of the N1-by-N2 matrix kept in WORK.
*
      n1 = m
      n2 = n - m
      nn = n1*n2
*
      info = 0
      lquery = ( lwork.EQ.-1 )
*
*     LWMIN depends on M and therefore on SELECT.  It stays unset
*     for an invalid JOB, but then INFO = -1 is chosen below and
*     LWMIN is never read.
*
      IF( wantsp ) THEN
         lwmin = max( 1, 2*nn )
      ELSE IF( lsame( job, 'N' ) ) THEN
         lwmin = 1
      ELSE IF( lsame( job, 'E' ) ) THEN
         lwmin = max( 1, nn )
      END IF
*
      IF( .NOT.lsame( job, 'N' ) .AND. .NOT.wants .AND. .NOT.wantsp )
     $     THEN
         info = -1
      ELSE IF( .NOT.lsame( compq, 'N' ) .AND. .NOT.wantq ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( ldt.LT.max( 1, n ) ) THEN
         info = -6
      ELSE IF( ldq.LT.1 .OR. ( wantq .AND. ldq.LT.n ) ) THEN
         info = -8
      ELSE IF( lwork.LT.lwmin .AND. .NOT.lquery ) THEN
         info = -14
      END IF
*
*     WORK(1) receives the required size for both a real call and a
*     workspace query.
*
      IF( info.EQ.0 ) THEN
         work( 1 ) = lwmin
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTRSEN', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
*     All or none selected: nothing to reorder.  S is set to one,
*     SEP to the 1-norm of T, and control jumps to label 40 so that
*     W is still filled from the diagonal of T.
*
      IF( m.EQ.n .OR. m.EQ.0 ) THEN
         IF( wants )
     $      s = one
         IF( wantsp )
     $      sep = clange( '1', n, n, t, ldt, rwork )
         GO TO 40
      END IF
*
*     Collect the selected eigenvalues at the top left corner of T.
*
*     KS counts the selected entries seen so far and is the target
*     position of the next one.  IERR returned by CTREXC is not
*     examined.
*
      ks = 0
      DO 20 k = 1, n
         IF( SELECT( k ) ) THEN
            ks = ks + 1
*
*           Swap the K-th eigenvalue to position KS.
*
            IF( k.NE.ks )
     $         CALL ctrexc( compq, n, t, ldt, q, ldq, k, ks, ierr )
         END IF
   20 CONTINUE
*
      IF( wants ) THEN
*
*        Solve the Sylvester equation for R:
*
*           T11*R - R*T22 = scale*T12
*
*        T12 is copied into WORK as an N1-by-N2 matrix with leading
*        dimension N1 and overwritten by the solution.  IERR from
*        CTRSYL is not examined.
*
         CALL clacpy( 'F', n1, n2, t( 1, n1+1 ), ldt, work, n1 )
         CALL ctrsyl( 'N', 'N', -1, n1, n2, t, ldt, t( n1+1, n1+1 ),
     $                ldt, work, n1, scale, ierr )
*
*        Estimate the reciprocal of the condition number of the cluster
*        of eigenvalues.
*
         rnorm = clange( 'F', n1, n2, work, n1, rwork )
         IF( rnorm.EQ.zero ) THEN
            s = one
         ELSE
*
*           Algebraically this is SCALE / SQRT( SCALE**2 + RNORM**2 ),
*           arranged so that RNORM itself is never squared.
*
            s = scale / ( sqrt( scale*scale / rnorm+rnorm )*
     $          sqrt( rnorm ) )
         END IF
      END IF
*
      IF( wantsp ) THEN
*
*        Estimate sep(T11,T22).
*
*        Reverse-communication loop: WORK(1:NN) is the vector CLACN2
*        asks to have transformed, WORK(NN+1:2*NN) is its second
*        work vector.  The loop ends when CLACN2 returns KASE = 0.
*
         est = zero
         kase = 0
   30    CONTINUE
         CALL clacn2( nn, work( nn+1 ), work, est, kase, isave )
         IF( kase.NE.0 ) THEN
            IF( kase.EQ.1 ) THEN
*
*              Solve T11*R - R*T22 = scale*X.
*
               CALL ctrsyl( 'N', 'N', -1, n1, n2, t, ldt,
     $                      t( n1+1, n1+1 ), ldt, work, n1, scale,
     $                      ierr )
            ELSE
*
*              Solve T11**H*R - R*T22**H = scale*X.
*
               CALL ctrsyl( 'C', 'C', -1, n1, n2, t, ldt,
     $                      t( n1+1, n1+1 ), ldt, work, n1, scale,
     $                      ierr )
            END IF
            GO TO 30
         END IF
*
*        SCALE here is the value left by the last CTRSYL call above;
*        there is no guard against EST being zero.
*
         sep = scale / est
      END IF
*
   40 CONTINUE
*
*     Copy reordered eigenvalues to W.
*
      DO 50 k = 1, n
         w( k ) = t( k, k )
   50 CONTINUE
*
*     WORK(1:NN) was used as scratch above, so the workspace size is
*     stored in WORK(1) again before returning.
*
      work( 1 ) = lwmin
*
      RETURN
*
*     End of CTRSEN
*

◆ ctrsna()

subroutine ctrsna	(	character	job,
		character	howmny,
		logical, dimension( * )	select,
		integer	n,
		complex, dimension( ldt, * )	t,
		integer	ldt,
		complex, dimension( ldvl, * )	vl,
		integer	ldvl,
		complex, dimension( ldvr, * )	vr,
		integer	ldvr,
		real, dimension( * )	s,
		real, dimension( * )	sep,
		integer	mm,
		integer	m,
		complex, dimension( ldwork, * )	work,
		integer	ldwork,
		real, dimension( * )	rwork,
		integer	info )

CTRSNA

Download CTRSNA + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTRSNA estimates reciprocal condition numbers for specified
!> eigenvalues and/or right eigenvectors of a complex upper triangular
!> matrix T (or of any matrix Q*T*Q**H with Q unitary).
!>

Parameters

[in]	JOB	!> JOB is CHARACTER*1 !> Specifies whether condition numbers are required for !> eigenvalues (S) or eigenvectors (SEP): !> = 'E': for eigenvalues only (S); !> = 'V': for eigenvectors only (SEP); !> = 'B': for both eigenvalues and eigenvectors (S and SEP). !>
[in]	HOWMNY	!> HOWMNY is CHARACTER*1 !> = 'A': compute condition numbers for all eigenpairs; !> = 'S': compute condition numbers for selected eigenpairs !> specified by the array SELECT. !>
[in]	SELECT	!> SELECT is LOGICAL array, dimension (N) !> If HOWMNY = 'S', SELECT specifies the eigenpairs for which !> condition numbers are required. To select condition numbers !> for the j-th eigenpair, SELECT(j) must be set to .TRUE.. !> If HOWMNY = 'A', SELECT is not referenced. !>
[in]	N	!> N is INTEGER !> The order of the matrix T. N >= 0. !>
[in]	T	!> T is COMPLEX array, dimension (LDT,N) !> The upper triangular matrix T. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= max(1,N). !>
[in]	VL	!> VL is COMPLEX array, dimension (LDVL,M) !> If JOB = 'E' or 'B', VL must contain left eigenvectors of T !> (or of any QTQ**H with Q unitary), corresponding to the !> eigenpairs specified by HOWMNY and SELECT. The eigenvectors !> must be stored in consecutive columns of VL, as returned by !> CHSEIN or CTREVC. !> If JOB = 'V', VL is not referenced. !>
[in]	LDVL	!> LDVL is INTEGER !> The leading dimension of the array VL. !> LDVL >= 1; and if JOB = 'E' or 'B', LDVL >= N. !>
[in]	VR	!> VR is COMPLEX array, dimension (LDVR,M) !> If JOB = 'E' or 'B', VR must contain right eigenvectors of T !> (or of any QTQ**H with Q unitary), corresponding to the !> eigenpairs specified by HOWMNY and SELECT. The eigenvectors !> must be stored in consecutive columns of VR, as returned by !> CHSEIN or CTREVC. !> If JOB = 'V', VR is not referenced. !>
[in]	LDVR	!> LDVR is INTEGER !> The leading dimension of the array VR. !> LDVR >= 1; and if JOB = 'E' or 'B', LDVR >= N. !>
[out]	S	!> S is REAL array, dimension (MM) !> If JOB = 'E' or 'B', the reciprocal condition numbers of the !> selected eigenvalues, stored in consecutive elements of the !> array. Thus S(j), SEP(j), and the j-th columns of VL and VR !> all correspond to the same eigenpair (but not in general the !> j-th eigenpair, unless all eigenpairs are selected). !> If JOB = 'V', S is not referenced. !>
[out]	SEP	!> SEP is REAL array, dimension (MM) !> If JOB = 'V' or 'B', the estimated reciprocal condition !> numbers of the selected eigenvectors, stored in consecutive !> elements of the array. !> If JOB = 'E', SEP is not referenced. !>
[in]	MM	!> MM is INTEGER !> The number of elements in the arrays S (if JOB = 'E' or 'B') !> and/or SEP (if JOB = 'V' or 'B'). MM >= M. !>
[out]	M	!> M is INTEGER !> The number of elements of the arrays S and/or SEP actually !> used to store the estimated condition numbers. !> If HOWMNY = 'A', M is set to N. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (LDWORK,N+6) !> If JOB = 'E', WORK is not referenced. !>
[in]	LDWORK	!> LDWORK is INTEGER !> The leading dimension of the array WORK. !> LDWORK >= 1; and if JOB = 'V' or 'B', LDWORK >= N. !>
[out]	RWORK	!> RWORK is REAL array, dimension (N) !> If JOB = 'E', RWORK is not referenced. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The reciprocal of the condition number of an eigenvalue lambda is
!>  defined as
!>
!>          S(lambda) = |v**H*u| / (norm(u)*norm(v))
!>
!>  where u and v are the right and left eigenvectors of T corresponding
!>  to lambda; v**H denotes the conjugate transpose of v, and norm(u)
!>  denotes the Euclidean norm. These reciprocal condition numbers always
!>  lie between zero (very badly conditioned) and one (very well
!>  conditioned). If n = 1, S(lambda) is defined to be 1.
!>
!>  An approximate error bound for a computed eigenvalue W(i) is given by
!>
!>                      EPS * norm(T) / S(i)
!>
!>  where EPS is the machine precision.
!>
!>  The reciprocal of the condition number of the right eigenvector u
!>  corresponding to lambda is defined as follows. Suppose
!>
!>              T = ( lambda  c  )
!>                  (   0    T22 )
!>
!>  Then the reciprocal condition number is
!>
!>          SEP( lambda, T22 ) = sigma-min( T22 - lambda*I )
!>
!>  where sigma-min denotes the smallest singular value. We approximate
!>  the smallest singular value by the reciprocal of an estimate of the
!>  one-norm of the inverse of T22 - lambda*I. If n = 1, SEP(1) is
!>  defined to be abs(T(1,1)).
!>
!>  An approximate error bound for a computed right eigenvector VR(i)
!>  is given by
!>
!>                      EPS * norm(T) / SEP(i)
!>

Definition at line 246 of file ctrsna.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Overview of this listing (body of CTRSNA):
*    1. Decode JOB / HOWMNY and set M to the number of eigenpairs
*       to process (N, or the number of .TRUE. entries in SELECT).
*    2. Validate the arguments; on failure set INFO to minus the
*       position of the offending argument, call XERBLA and return.
*    3. Handle N = 0 and N = 1 directly.
*    4. For each processed index k, with KS the next output slot:
*       - S(KS)   from the inner product and 2-norms of column KS
*                 of VR and VL;
*       - SEP(KS) from a CLACN2 / CLATRS norm estimate on a copy of
*                 T in which entry k was moved to position (1,1).
*
*     .. Scalar Arguments ..
      CHARACTER          HOWMNY, JOB
      INTEGER            INFO, LDT, LDVL, LDVR, LDWORK, M, MM, N
*     ..
*     .. Array Arguments ..
      LOGICAL            SELECT( * )
      REAL               RWORK( * ), S( * ), SEP( * )
      COMPLEX            T( LDT, * ), VL( LDVL, * ), VR( LDVR, * ),
     $                   WORK( LDWORK, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE
      parameter( zero = 0.0e+0, one = 1.0e+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            SOMCON, WANTBH, WANTS, WANTSP
      CHARACTER          NORMIN
      INTEGER            I, IERR, IX, J, K, KASE, KS
      REAL               BIGNUM, EPS, EST, LNRM, RNRM, SCALE, SMLNUM,
     $                   XNORM
      COMPLEX            CDUM, PROD
*     ..
*     .. Local Arrays ..
      INTEGER            ISAVE( 3 )
      COMPLEX            DUMMY( 1 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ICAMAX
      REAL               SCNRM2, SLAMCH
      COMPLEX            CDOTC
      EXTERNAL           lsame, icamax, scnrm2, slamch, cdotc
*     ..
*     .. External Subroutines ..
      EXTERNAL           clacn2, clacpy, clatrs, csrscl, ctrexc, slabad,
     $                   xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, aimag, max, real
*     ..
*     .. Statement Functions ..
      REAL               CABS1
*     ..
*     .. Statement Function definitions ..
*     CABS1 is the cheap magnitude abs(Re z) + abs(Im z).
      cabs1( cdum ) = abs( real( cdum ) ) + abs( aimag( cdum ) )
*     ..
*     .. Executable Statements ..
*
*     Decode and test the input parameters
*
      wantbh = lsame( job, 'B' )
      wants = lsame( job, 'E' ) .OR. wantbh
      wantsp = lsame( job, 'V' ) .OR. wantbh
*
      somcon = lsame( howmny, 'S' )
*
*     Set M to the number of eigenpairs for which condition numbers are
*     to be computed.
*
*     This runs before any argument check, so with HOWMNY = 'S' the
*     entries SELECT(1:N) are read even if another argument is later
*     rejected; the loop is empty when N <= 0.
*
      IF( somcon ) THEN
         m = 0
         DO 10 j = 1, n
            IF( SELECT( j ) )
     $         m = m + 1
   10    CONTINUE
      ELSE
         m = n
      END IF
*
*     The first failing test wins.  LDVL and LDVR must reach N only
*     when S is requested, LDWORK only when SEP is requested.
*
      info = 0
      IF( .NOT.wants .AND. .NOT.wantsp ) THEN
         info = -1
      ELSE IF( .NOT.lsame( howmny, 'A' ) .AND. .NOT.somcon ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( ldt.LT.max( 1, n ) ) THEN
         info = -6
      ELSE IF( ldvl.LT.1 .OR. ( wants .AND. ldvl.LT.n ) ) THEN
         info = -8
      ELSE IF( ldvr.LT.1 .OR. ( wants .AND. ldvr.LT.n ) ) THEN
         info = -10
      ELSE IF( mm.LT.m ) THEN
         info = -13
      ELSE IF( ldwork.LT.1 .OR. ( wantsp .AND. ldwork.LT.n ) ) THEN
         info = -16
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTRSNA', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     N = 1: unless the single eigenpair is deselected, S(1) is one
*     and SEP(1) is the modulus of T(1,1).
*
      IF( n.EQ.1 ) THEN
         IF( somcon ) THEN
            IF( .NOT.SELECT( 1 ) )
     $         RETURN
         END IF
         IF( wants )
     $      s( 1 ) = one
         IF( wantsp )
     $      sep( 1 ) = abs( t( 1, 1 ) )
         RETURN
      END IF
*
*     Get machine constants
*
*     SMLNUM is the threshold used below both for the rescaling test
*     and as a floor for EST; BIGNUM is only passed to SLABAD.
*
      eps = slamch( 'P' )
      smlnum = slamch( 'S' ) / eps
      bignum = one / smlnum
      CALL slabad( smlnum, bignum )
*
*     KS is the output slot (element of S / SEP, column of VL / VR)
*     of the eigenpair currently processed.  It advances at label 40
*     only, so deselected indices (GO TO 50) do not consume a slot.
*
      ks = 1
      DO 50 k = 1, n
*
         IF( somcon ) THEN
            IF( .NOT.SELECT( k ) )
     $         GO TO 50
         END IF
*
         IF( wants ) THEN
*
*           Compute the reciprocal condition number of the k-th
*           eigenvalue.
*
*           The quotient is formed without checking that the two
*           norms are nonzero.
*
            prod = cdotc( n, vr( 1, ks ), 1, vl( 1, ks ), 1 )
            rnrm = scnrm2( n, vr( 1, ks ), 1 )
            lnrm = scnrm2( n, vl( 1, ks ), 1 )
            s( ks ) = abs( prod ) / ( rnrm*lnrm )
*
         END IF
*
         IF( wantsp ) THEN
*
*           Estimate the reciprocal condition number of the k-th
*           eigenvector.
*
*           Copy the matrix T to the array WORK and swap the k-th
*           diagonal element to the (1,1) position.
*
*           T itself is left untouched; DUMMY stands in for the Q
*           argument of CTREXC, and IERR is not examined.
*
            CALL clacpy( 'Full', n, n, t, ldt, work, ldwork )
            CALL ctrexc( 'No Q', n, work, ldwork, dummy, 1, k, 1, ierr )
*
*           Form  C = T22 - lambda*I in WORK(2:N,2:N).
*
            DO 20 i = 2, n
               work( i, i ) = work( i, i ) - work( 1, 1 )
   20       CONTINUE
*
*           Estimate a lower bound for the 1-norm of inv(C**H). The 1st
*           and (N+1)th columns of WORK are used to store work vectors.
*
*           SEP(KS) is preset to zero so that an early exit through
*           label 40 reports zero.  NORMIN = 'N' on the first CLATRS
*           call and 'Y' afterwards, with RWORK carried between calls.
*
            sep( ks ) = zero
            est = zero
            kase = 0
            normin = 'N'
   30       CONTINUE
            CALL clacn2( n-1, work( 1, n+1 ), work, est, kase, isave )
*
            IF( kase.NE.0 ) THEN
               IF( kase.EQ.1 ) THEN
*
*                 Solve C**H*x = scale*b
*
                  CALL clatrs( 'Upper', 'Conjugate transpose',
     $                         'Nonunit', normin, n-1, work( 2, 2 ),
     $                         ldwork, work, scale, rwork, ierr )
               ELSE
*
*                 Solve C*x = scale*b
*
                  CALL clatrs( 'Upper', 'No transpose', 'Nonunit',
     $                         normin, n-1, work( 2, 2 ), ldwork, work,
     $                         scale, rwork, ierr )
               END IF
               normin = 'Y'
               IF( scale.NE.one ) THEN
*
*                 Multiply by 1/SCALE if doing so will not cause
*                 overflow.
*
*                 If the rescaling is judged unsafe (or SCALE is
*                 zero) the estimate is abandoned and SEP(KS) keeps
*                 its preset value of zero.
*                 NOTE(review): CSRSCL is given N entries although
*                 CLACN2, CLATRS and ICAMAX all use N-1 here; the
*                 extra entry WORK(N,1) does not appear to be used
*                 afterwards - confirm this is intentional.
*
                  ix = icamax( n-1, work, 1 )
                  xnorm = cabs1( work( ix, 1 ) )
                  IF( scale.LT.xnorm*smlnum .OR. scale.EQ.zero )
     $               GO TO 40
                  CALL csrscl( n, scale, work, 1 )
               END IF
               GO TO 30
            END IF
*
*           EST is floored at SMLNUM so the reciprocal stays finite.
*
            sep( ks ) = one / max( est, smlnum )
         END IF
*
   40    CONTINUE
         ks = ks + 1
   50 CONTINUE
      RETURN
*
*     End of CTRSNA
*

◆ ctrti2()

subroutine ctrti2	(	character	uplo,
		character	diag,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		integer	info )

CTRTI2 computes the inverse of a triangular matrix (unblocked algorithm).

Download CTRTI2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTRTI2 computes the inverse of a complex upper or lower triangular
!> matrix.
!>
!> This is the Level 2 BLAS version of the algorithm.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the matrix A is upper or lower triangular. !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> Specifies whether or not the matrix A is unit triangular. !> = 'N': Non-unit triangular !> = 'U': Unit triangular !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the triangular matrix A. If UPLO = 'U', the !> leading n by n upper triangular part of the array A contains !> the upper triangular matrix, and the strictly lower !> triangular part of A is not referenced. If UPLO = 'L', the !> leading n by n lower triangular part of the array A contains !> the lower triangular matrix, and the strictly upper !> triangular part of A is not referenced. If DIAG = 'U', the !> diagonal elements of A are also not referenced and are !> assumed to be 1. !> !> On exit, the (triangular) inverse of the original matrix, in !> the same storage format. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -k, the k-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 109 of file ctrti2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Unblocked (Level 2 BLAS) in-place inversion of a complex upper
*     or lower triangular matrix, processed one column at a time.
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, UPLO
      INTEGER            INFO, LDA, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE
      parameter( one = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            NONUNT, UPTRI
      INTEGER            JC, NBELOW
      COMPLEX            CSCL
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cscal, ctrmv, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; INFO = -k flags the k-th argument.
*
      uptri = lsame( uplo, 'U' )
      nonunt = lsame( diag, 'N' )
      info = 0
      IF( .NOT.( uptri .OR. lsame( uplo, 'L' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( nonunt .OR. lsame( diag, 'U' ) ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -5
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTRTI2', -info )
         RETURN
      END IF
*
      IF( uptri ) THEN
*
*        Upper triangular case: sweep the columns left to right.
*
         DO jc = 1, n
*
*           The column scale factor is minus the inverted diagonal
*           entry; for a unit diagonal it is simply -1.
*
            cscl = -one
            IF( nonunt ) THEN
               a( jc, jc ) = one / a( jc, jc )
               cscl = -a( jc, jc )
            END IF
*
*           Form elements 1:jc-1 of column jc.
*
            CALL ctrmv( 'Upper', 'No transpose', diag, jc-1, a, lda,
     $                  a( 1, jc ), 1 )
            CALL cscal( jc-1, cscl, a( 1, jc ), 1 )
         END DO
      ELSE
*
*        Lower triangular case: sweep the columns right to left.
*
         DO jc = n, 1, -1
            cscl = -one
            IF( nonunt ) THEN
               a( jc, jc ) = one / a( jc, jc )
               cscl = -a( jc, jc )
            END IF
*
*           Form elements jc+1:n of column jc (nothing to do for
*           the last column).
*
            nbelow = n - jc
            IF( nbelow.GT.0 ) THEN
               CALL ctrmv( 'Lower', 'No transpose', diag, nbelow,
     $                     a( jc+1, jc+1 ), lda, a( jc+1, jc ), 1 )
               CALL cscal( nbelow, cscl, a( jc+1, jc ), 1 )
            END IF
         END DO
      END IF
*
      RETURN
*
*     End of CTRTI2
*

◆ ctrtri()

subroutine ctrtri	(	character	uplo,
		character	diag,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		integer	info )

CTRTRI

Download CTRTRI + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTRTRI computes the inverse of a complex upper or lower triangular
!> matrix A.
!>
!> This is the Level 3 BLAS version of the algorithm.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> = 'N': A is non-unit triangular; !> = 'U': A is unit triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the triangular matrix A. If UPLO = 'U', the !> leading N-by-N upper triangular part of the array A contains !> the upper triangular matrix, and the strictly lower !> triangular part of A is not referenced. If UPLO = 'L', the !> leading N-by-N lower triangular part of the array A contains !> the lower triangular matrix, and the strictly upper !> triangular part of A is not referenced. If DIAG = 'U', the !> diagonal elements of A are also not referenced and are !> assumed to be 1. !> On exit, the (triangular) inverse of the original matrix, in !> the same storage format. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, A(i,i) is exactly zero. The triangular !> matrix is singular and its inverse can not be computed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 108 of file ctrtri.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Blocked (Level 3 BLAS) in-place inversion of a complex upper or
*     lower triangular matrix.  Diagonal blocks are inverted by
*     CTRTI2; INFO = i > 0 reports an exactly zero A(i,i).
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, UPLO
      INTEGER            INFO, LDA, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE, ZERO
      parameter( one = ( 1.0e+0, 0.0e+0 ),
     $                   zero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            NONUNT, UPTRI
      INTEGER            BLK, JD, JLAST, JS, NBSZ, NREM
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      EXTERNAL           lsame, ilaenv
*     ..
*     .. External Subroutines ..
      EXTERNAL           ctrmm, ctrsm, ctrti2, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; INFO = -k flags the k-th argument.
*
      uptri = lsame( uplo, 'U' )
      nonunt = lsame( diag, 'N' )
      info = 0
      IF( .NOT.( uptri .OR. lsame( uplo, 'L' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( nonunt .OR. lsame( diag, 'U' ) ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -5
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTRTRI', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty matrix.
*
      IF( n.EQ.0 )
     $   RETURN
*
*     For a non-unit diagonal, report the first exactly zero
*     diagonal entry through INFO and leave A untouched.
*
      IF( nonunt ) THEN
         DO jd = 1, n
            IF( a( jd, jd ).EQ.zero ) THEN
               info = jd
               RETURN
            END IF
         END DO
      END IF
*
*     Ask the environment for the block size.
*
      nbsz = ilaenv( 1, 'CTRTRI', uplo // diag, n, -1, -1, -1 )
      IF( nbsz.GT.1 .AND. nbsz.LT.n ) THEN
*
*        Blocked algorithm
*
         IF( uptri ) THEN
*
*           Upper triangular: block columns from left to right.
*
            DO js = 1, n, nbsz
               blk = min( nbsz, n-js+1 )
*
*              Rows 1:js-1 of the current block column
*
               CALL ctrmm( 'Left', 'Upper', 'No transpose', diag,
     $                     js-1, blk, one, a, lda, a( 1, js ), lda )
               CALL ctrsm( 'Right', 'Upper', 'No transpose', diag,
     $                     js-1, blk, -one, a( js, js ), lda,
     $                     a( 1, js ), lda )
*
*              Invert the diagonal block itself
*
               CALL ctrti2( 'Upper', diag, blk, a( js, js ), lda,
     $                      info )
            END DO
         ELSE
*
*           Lower triangular: block columns from right to left,
*           starting at the first column of the last block.
*
            jlast = ( ( n-1 ) / nbsz )*nbsz + 1
            DO js = jlast, 1, -nbsz
               blk = min( nbsz, n-js+1 )
*
*              Rows js+blk:n of the current block column (absent
*              for the last block column)
*
               nrem = n - js - blk + 1
               IF( nrem.GE.1 ) THEN
                  CALL ctrmm( 'Left', 'Lower', 'No transpose', diag,
     $                        nrem, blk, one, a( js+blk, js+blk ),
     $                        lda, a( js+blk, js ), lda )
                  CALL ctrsm( 'Right', 'Lower', 'No transpose', diag,
     $                        nrem, blk, -one, a( js, js ), lda,
     $                        a( js+blk, js ), lda )
               END IF
*
*              Invert the diagonal block itself
*
               CALL ctrti2( 'Lower', diag, blk, a( js, js ), lda,
     $                      info )
            END DO
         END IF
      ELSE
*
*        Block size is degenerate or covers the whole matrix:
*        use the unblocked routine.
*
         CALL ctrti2( uplo, diag, n, a, lda, info )
      END IF
*
      RETURN
*
*     End of CTRTRI
*

◆ ctrtrs()

subroutine ctrtrs	(	character	uplo,
		character	trans,
		character	diag,
		integer	n,
		integer	nrhs,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldb, * )	b,
		integer	ldb,
		integer	info )

CTRTRS

Download CTRTRS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTRTRS solves a triangular system of the form
!>
!>    A * X = B,  A**T * X = B,  or  A**H * X = B,
!>
!> where A is a triangular matrix of order N, and B is an N-by-NRHS
!> matrix.  A check is made to verify that A is nonsingular.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> Specifies the form of the system of equations: !> = 'N': A * X = B (No transpose) !> = 'T': A**T * X = B (Transpose) !> = 'C': A**H * X = B (Conjugate transpose) !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> = 'N': A is non-unit triangular; !> = 'U': A is unit triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrix B. NRHS >= 0. !>
[in]	A	!> A is COMPLEX array, dimension (LDA,N) !> The triangular matrix A. If UPLO = 'U', the leading N-by-N !> upper triangular part of the array A contains the upper !> triangular matrix, and the strictly lower triangular part of !> A is not referenced. If UPLO = 'L', the leading N-by-N lower !> triangular part of the array A contains the lower triangular !> matrix, and the strictly upper triangular part of A is not !> referenced. If DIAG = 'U', the diagonal elements of A are !> also not referenced and are assumed to be 1. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[in,out]	B	!> B is COMPLEX array, dimension (LDB,NRHS) !> On entry, the right hand side matrix B. !> On exit, if INFO = 0, the solution matrix X. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, the i-th diagonal element of A is zero, !> indicating that the matrix is singular and the solutions !> X have not been computed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 138 of file ctrtrs.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Triangular solve with NRHS right hand sides, preceded by a
*     check that no diagonal entry of a non-unit A is exactly zero.
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, TRANS, UPLO
      INTEGER            INFO, LDA, LDB, N, NRHS
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), B( LDB, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ZERO, ONE
      parameter( zero = ( 0.0e+0, 0.0e+0 ),
     $                   one = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            NONUNT
      INTEGER            JD
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           ctrsm, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; INFO = -k flags the k-th argument.
*
      nonunt = lsame( diag, 'N' )
      info = 0
      IF( .NOT.( lsame( uplo, 'U' ) .OR. lsame( uplo, 'L' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( lsame( trans, 'N' ) .OR. lsame( trans, 'T' )
     $         .OR. lsame( trans, 'C' ) ) ) THEN
         info = -2
      ELSE IF( .NOT.( nonunt .OR. lsame( diag, 'U' ) ) ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( nrhs.LT.0 ) THEN
         info = -5
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -7
      ELSE IF( ldb.LT.max( 1, n ) ) THEN
         info = -9
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTRTRS', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty system.
*
      IF( n.EQ.0 )
     $   RETURN
*
*     For a non-unit diagonal, report the first exactly zero
*     diagonal entry through INFO and leave B untouched.
*
      IF( nonunt ) THEN
         DO jd = 1, n
            IF( a( jd, jd ).EQ.zero ) THEN
               info = jd
               RETURN
            END IF
         END DO
      END IF
*
*     Solve A * x = b,  A**T * x = b,  or  A**H * x = b, overwriting
*     B with the solution.
*
      CALL ctrsm( 'Left', uplo, trans, diag, n, nrhs, one, a, lda, b,
     $            ldb )
*
      RETURN
*
*     End of CTRTRS
*

◆ ctrttf()

subroutine ctrttf	(	character	transr,
		character	uplo,
		integer	n,
		complex, dimension( 0: lda-1, 0: * )	a,
		integer	lda,
		complex, dimension( 0: * )	arf,
		integer	info )

CTRTTF copies a triangular matrix from the standard full format (TR) to the rectangular full packed format (TF).

Download CTRTTF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTRTTF copies a triangular matrix A from standard full format (TR)
!> to rectangular full packed format (TF) .
!>

Parameters

[in]	TRANSR	!> TRANSR is CHARACTER*1 !> = 'N': ARF in Normal mode is wanted; !> = 'C': ARF in Conjugate Transpose mode is wanted; !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	A	!> A is COMPLEX array, dimension ( LDA, N ) !> On entry, the triangular matrix A. If UPLO = 'U', the !> leading N-by-N upper triangular part of the array A contains !> the upper triangular matrix, and the strictly lower !> triangular part of A is not referenced. If UPLO = 'L', the !> leading N-by-N lower triangular part of the array A contains !> the lower triangular matrix, and the strictly upper !> triangular part of A is not referenced. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the matrix A. LDA >= max(1,N). !>
[out]	ARF	!> ARF is COMPLEX array, dimension ( N*(N+1)/2 ), !> On exit, the upper or lower triangular matrix A stored in !> RFP format. For a further discussion see Notes below. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  We first consider Standard Packed Format when N is even.
!>  We give an example where N = 6.
!>
!>      AP is Upper             AP is Lower
!>
!>   00 01 02 03 04 05       00
!>      11 12 13 14 15       10 11
!>         22 23 24 25       20 21 22
!>            33 34 35       30 31 32 33
!>               44 45       40 41 42 43 44
!>                  55       50 51 52 53 54 55
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:5,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(4:6,0:2) consists of
!>  conjugate-transpose of the first three columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(1:6,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:2,0:2) consists of
!>  conjugate-transpose of the last three columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N even and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                -- -- --
!>        03 04 05                33 43 53
!>                                   -- --
!>        13 14 15                00 44 54
!>                                      --
!>        23 24 25                10 11 55
!>
!>        33 34 35                20 21 22
!>        --
!>        00 44 45                30 31 32
!>        -- --
!>        01 11 55                40 41 42
!>        -- -- --
!>        02 12 22                50 51 52
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- -- --                -- -- -- -- -- --
!>     03 13 23 33 00 01 02    33 00 10 20 30 40 50
!>     -- -- -- -- --                -- -- -- -- --
!>     04 14 24 34 44 11 12    43 44 11 21 31 41 51
!>     -- -- -- -- -- --                -- -- -- --
!>     05 15 25 35 45 55 22    53 54 55 22 32 42 52
!>
!>
!>  We next  consider Standard Packed Format when N is odd.
!>  We give an example where N = 5.
!>
!>     AP is Upper                 AP is Lower
!>
!>   00 01 02 03 04              00
!>      11 12 13 14              10 11
!>         22 23 24              20 21 22
!>            33 34              30 31 32 33
!>               44              40 41 42 43 44
!>
!>
!>  Let TRANSR = 'N'. RFP holds AP as follows:
!>  For UPLO = 'U' the upper trapezoid A(0:4,0:2) consists of the last
!>  three columns of AP upper. The lower triangle A(3:4,0:1) consists of
!>  conjugate-transpose of the first two   columns of AP upper.
!>  For UPLO = 'L' the lower trapezoid A(0:4,0:2) consists of the first
!>  three columns of AP lower. The upper triangle A(0:1,1:2) consists of
!>  conjugate-transpose of the last two   columns of AP lower.
!>  To denote conjugate we place -- above the element. This covers the
!>  case N odd  and TRANSR = 'N'.
!>
!>         RFP A                   RFP A
!>
!>                                   -- --
!>        02 03 04                00 33 43
!>                                      --
!>        12 13 14                10 11 44
!>
!>        22 23 24                20 21 22
!>        --
!>        00 33 34                30 31 32
!>        -- --
!>        01 11 44                40 41 42
!>
!>  Now let TRANSR = 'C'. RFP A in both UPLO cases is just the conjugate-
!>  transpose of RFP A above. One therefore gets:
!>
!>
!>           RFP A                   RFP A
!>
!>     -- -- --                   -- -- -- -- --
!>     02 12 22 00 01             00 10 20 30 40
!>     -- -- -- --                   -- -- -- --
!>     03 13 23 33 11             33 11 21 31 41
!>     -- -- -- -- --                   -- -- --
!>     04 14 24 34 44             43 44 22 32 42
!>

Definition at line 215 of file ctrttf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Copies the upper or lower triangle of the full-format matrix A
*     into the linear array ARF in rectangular full packed (RFP)
*     layout.  A and ARF are indexed from zero.  ARF is filled through
*     the running index IJ; one of eight copy patterns is selected by
*     the parity of N, TRANSR ('N' or 'C') and UPLO ('L' or 'U').
*
*     .. Scalar Arguments ..
      CHARACTER          TRANSR, UPLO
      INTEGER            INFO, N, LDA
*     ..
*     .. Array Arguments ..
      COMPLEX            A( 0: LDA-1, 0: * ), ARF( 0: * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     ..
*     .. Local Scalars ..
      LOGICAL            LOWER, NISODD, NORMALTRANSR
      INTEGER            I, IJ, J, K, L, N1, N2, NT, NX2, NP1X2
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max, mod
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.  INFO = -k flags the k-th argument.
*
      info = 0
      normaltransr = lsame( transr, 'N' )
      lower = lsame( uplo, 'L' )
      IF( .NOT.normaltransr .AND. .NOT.lsame( transr, 'C' ) ) THEN
         info = -1
      ELSE IF( .NOT.lower .AND. .NOT.lsame( uplo, 'U' ) ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -5
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTRTTF', -info )
         RETURN
      END IF
*
*     Quick return if possible.  For N = 1 the single element is
*     copied as is in normal mode and conjugated in 'C' mode.
*
      IF( n.LE.1 ) THEN
         IF( n.EQ.1 ) THEN
            IF( normaltransr ) THEN
               arf( 0 ) = a( 0, 0 )
            ELSE
               arf( 0 ) = conjg( a( 0, 0 ) )
            END IF
         END IF
         RETURN
      END IF
*
*     Number of complex elements stored in ARF ( ARF(0:nt-1) )
*
      nt = n*( n+1 ) / 2
*
*     set N1 and N2 depending on LOWER: for N even N1=N2=K
*
      IF( lower ) THEN
         n2 = n / 2
         n1 = n - n2
      ELSE
         n1 = n / 2
         n2 = n - n1
      END IF
*
*     If N is odd, set NISODD = .TRUE.; in normal mode ARF then has
*     leading dimension N (see "lda=n" in the odd branches below).
*     If N is even, set K = N/2 and NISODD = .FALSE.; in normal mode
*     ARF then has leading dimension N+1 and K columns.
*     NX2 = 2*N and NP1X2 = 2*(N+1) are only needed by the UPPER,
*     normal-mode branches, which walk the ARF columns backwards.
*
      IF( mod( n, 2 ).EQ.0 ) THEN
         k = n / 2
         nisodd = .false.
         IF( .NOT.lower )
     $      np1x2 = n + n + 2
      ELSE
         nisodd = .true.
         IF( .NOT.lower )
     $      nx2 = n + n
      END IF
*
      IF( nisodd ) THEN
*
*        N is odd
*
         IF( normaltransr ) THEN
*
*           N is odd and TRANSR = 'N'
*
            IF( lower ) THEN
*
*             SRPA for LOWER, NORMAL and N is odd ( a(0:n-1,0:n1-1) )
*             T1 -> a(0,0), T2 -> a(0,1), S -> a(n1,0)
*             T1 -> a(0), T2 -> a(n), S -> a(n1); lda=n
*
*             Each pass over J writes one ARF column: first the
*             conjugated entries of row N2+J of A, then column J of A
*             from the diagonal down.
*
               ij = 0
               DO j = 0, n2
                  DO i = n1, n2 + j
                     arf( ij ) = conjg( a( n2+j, i ) )
                     ij = ij + 1
                  END DO
                  DO i = j, n - 1
                     arf( ij ) = a( i, j )
                     ij = ij + 1
                  END DO
               END DO
*
            ELSE
*
*             SRPA for UPPER, NORMAL and N is odd ( a(0:n-1,0:n2-1)
*             T1 -> a(n1+1,0), T2 -> a(n1,0), S -> a(0,0)
*             T1 -> a(n2), T2 -> a(n1), S -> a(0); lda=n
*
*             IJ starts at the last ARF column (offset NT-N).  Each
*             pass writes N elements and then steps IJ back by 2*N,
*             i.e. to the start of the preceding ARF column.
*
               ij = nt - n
               DO j = n - 1, n1, -1
                  DO i = 0, j
                     arf( ij ) = a( i, j )
                     ij = ij + 1
                  END DO
                  DO l = j - n1, n1 - 1
                     arf( ij ) = conjg( a( j-n1, l ) )
                     ij = ij + 1
                  END DO
                  ij = ij - nx2
               END DO
*
            END IF
*
         ELSE
*
*           N is odd and TRANSR = 'C'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, TRANSPOSE and N is odd
*              T1 -> A(0,0) , T2 -> A(1,0) , S -> A(0,n1)
*              T1 -> A(0+0) , T2 -> A(1+0) , S -> A(0+n1*n1); lda=n1
*
               ij = 0
               DO j = 0, n2 - 1
                  DO i = 0, j
                     arf( ij ) = conjg( a( j, i ) )
                     ij = ij + 1
                  END DO
                  DO i = n1 + j, n - 1
                     arf( ij ) = a( i, n1+j )
                     ij = ij + 1
                  END DO
               END DO
               DO j = n2, n - 1
                  DO i = 0, n1 - 1
                     arf( ij ) = conjg( a( j, i ) )
                     ij = ij + 1
                  END DO
               END DO
*
            ELSE
*
*              SRPA for UPPER, TRANSPOSE and N is odd
*              T1 -> A(0,n1+1), T2 -> A(0,n1), S -> A(0,0)
*              T1 -> A(n2*n2), T2 -> A(n1*n2), S -> A(0); lda=n2
*
               ij = 0
               DO j = 0, n1
                  DO i = n1, n - 1
                     arf( ij ) = conjg( a( j, i ) )
                     ij = ij + 1
                  END DO
               END DO
               DO j = 0, n1 - 1
                  DO i = 0, j
                     arf( ij ) = a( i, j )
                     ij = ij + 1
                  END DO
                  DO l = n2 + j, n - 1
                     arf( ij ) = conjg( a( n2+j, l ) )
                     ij = ij + 1
                  END DO
               END DO
*
            END IF
*
         END IF
*
      ELSE
*
*        N is even
*
         IF( normaltransr ) THEN
*
*           N is even and TRANSR = 'N'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, NORMAL, and N is even ( a(0:n,0:k-1) )
*              T1 -> a(1,0), T2 -> a(0,0), S -> a(k+1,0)
*              T1 -> a(1), T2 -> a(0), S -> a(k+1); lda=n+1
*
               ij = 0
               DO j = 0, k - 1
                  DO i = k, k + j
                     arf( ij ) = conjg( a( k+j, i ) )
                     ij = ij + 1
                  END DO
                  DO i = j, n - 1
                     arf( ij ) = a( i, j )
                     ij = ij + 1
                  END DO
               END DO
*
            ELSE
*
*              SRPA for UPPER, NORMAL, and N is even ( a(0:n,0:k-1) )
*              T1 -> a(k+1,0) ,  T2 -> a(k,0),   S -> a(0,0)
*              T1 -> a(k+1), T2 -> a(k), S -> a(0); lda=n+1
*
*              IJ starts at the last ARF column (offset NT-N-1).
*              Each pass writes N+1 elements and then steps IJ back
*              by 2*(N+1), i.e. to the start of the preceding ARF
*              column.
*
               ij = nt - n - 1
               DO j = n - 1, k, -1
                  DO i = 0, j
                     arf( ij ) = a( i, j )
                     ij = ij + 1
                  END DO
                  DO l = j - k, k - 1
                     arf( ij ) = conjg( a( j-k, l ) )
                     ij = ij + 1
                  END DO
                  ij = ij - np1x2
               END DO
*
            END IF
*
         ELSE
*
*           N is even and TRANSR = 'C'
*
            IF( lower ) THEN
*
*              SRPA for LOWER, TRANSPOSE and N is even (see paper, A=B)
*              T1 -> A(0,1) , T2 -> A(0,0) , S -> A(0,k+1) :
*              T1 -> A(0+k) , T2 -> A(0+0) , S -> A(0+k*(k+1)); lda=k
*
*              Column K of A, from the diagonal down, is copied first.
*
               ij = 0
               j = k
               DO i = k, n - 1
                  arf( ij ) = a( i, j )
                  ij = ij + 1
               END DO
               DO j = 0, k - 2
                  DO i = 0, j
                     arf( ij ) = conjg( a( j, i ) )
                     ij = ij + 1
                  END DO
                  DO i = k + 1 + j, n - 1
                     arf( ij ) = a( i, k+1+j )
                     ij = ij + 1
                  END DO
               END DO
               DO j = k - 1, n - 1
                  DO i = 0, k - 1
                     arf( ij ) = conjg( a( j, i ) )
                     ij = ij + 1
                  END DO
               END DO
*
            ELSE
*
*              SRPA for UPPER, TRANSPOSE and N is even (see paper, A=B)
*              T1 -> A(0,k+1) , T2 -> A(0,k) , S -> A(0,0)
*              T1 -> A(0+k*(k+1)) , T2 -> A(0+k*k) , S -> A(0+0)); lda=k
*
               ij = 0
               DO j = 0, k
                  DO i = k, n - 1
                     arf( ij ) = conjg( a( j, i ) )
                     ij = ij + 1
                  END DO
               END DO
               DO j = 0, k - 2
                  DO i = 0, j
                     arf( ij ) = a( i, j )
                     ij = ij + 1
                  END DO
                  DO l = k + 1 + j, n - 1
                     arf( ij ) = conjg( a( k+1+j, l ) )
                     ij = ij + 1
                  END DO
               END DO
*
*              Note that here J = K-1: the DO variable keeps the value
*              it had when the loop above terminated (this also holds
*              when K = 1 and that loop ran zero times).  The final
*              loop therefore copies column K-1 of A down to its
*              diagonal entry.
*
               DO i = 0, j
                  arf( ij ) = a( i, j )
                  ij = ij + 1
               END DO
*
            END IF
*
         END IF
*
      END IF
*
      RETURN
*
*     End of CTRTTF
*

◆ ctrttp()

subroutine ctrttp	(	character	uplo,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	ap,
		integer	info )

CTRTTP copies a triangular matrix from the standard full format (TR) to the standard packed format (TP).

Download CTRTTP + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTRTTP copies a triangular matrix A from full format (TR) to standard
!> packed format (TP).
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	N	!> N is INTEGER !> The order of the matrices AP and A. N >= 0. !>
[in]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the triangular matrix A. If UPLO = 'U', the leading !> N-by-N upper triangular part of A contains the upper !> triangular part of the matrix A, and the strictly lower !> triangular part of A is not referenced. If UPLO = 'L', the !> leading N-by-N lower triangular part of A contains the lower !> triangular part of the matrix A, and the strictly upper !> triangular part of A is not referenced. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	AP	!> AP is COMPLEX array, dimension ( N*(N+1)/2 ), !> On exit, the upper or lower triangular matrix A, packed !> columnwise in a linear array. The j-th column of A is stored !> in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 103 of file ctrttp.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Copies the upper or lower triangle of the full-format matrix A,
*     column by column, into consecutive elements of the packed
*     array AP.  The other triangle of A is never read.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, N, LDA
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), AP( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     ..
*     .. Local Scalars ..
      LOGICAL            LOWER
      INTEGER            I, J, K
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla
*     ..
*     .. Intrinsic Functions ..
*     MAX is used in the LDA check below; it is declared here like
*     in the other routines so that it always names the intrinsic.
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.  INFO = -k flags the k-th argument.
*
      info = 0
      lower = lsame( uplo, 'L' )
      IF( .NOT.lower .AND. .NOT.lsame( uplo, 'U' ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -4
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTRTTP', -info )
         RETURN
      END IF
*
*     K counts the elements written to AP so far.
*
      k = 0
      IF( lower ) THEN
*
*        Lower triangle: rows j..n of each column j.
*
         DO j = 1, n
            DO i = j, n
               k = k + 1
               ap( k ) = a( i, j )
            END DO
         END DO
      ELSE
*
*        Upper triangle: rows 1..j of each column j.
*
         DO j = 1, n
            DO i = 1, j
               k = k + 1
               ap( k ) = a( i, j )
            END DO
         END DO
      END IF
*
*
      RETURN
*
*     End of CTRTTP
*

◆ ctzrqf()

subroutine ctzrqf	(	integer	m,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		integer	info )

CTZRQF

Download CTZRQF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> This routine is deprecated and has been replaced by routine CTZRZF.
!>
!> CTZRQF reduces the M-by-N ( M<=N ) complex upper trapezoidal matrix A
!> to upper triangular form by means of unitary transformations.
!>
!> The upper trapezoidal matrix A is factored as
!>
!>    A = ( R  0 ) * Z,
!>
!> where Z is an N-by-N unitary matrix and R is an M-by-M upper
!> triangular matrix.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= M. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the leading M-by-N upper trapezoidal part of the !> array A must contain the matrix to be factorized. !> On exit, the leading M-by-M upper triangular part of A !> contains the upper triangular matrix R, and elements M+1 to !> N of the first M rows of A, with the array TAU, represent the !> unitary matrix Z as a product of M elementary reflectors. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	TAU	!> TAU is COMPLEX array, dimension (M) !> The scalar factors of the elementary reflectors. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The  factorization is obtained by Householder's method.  The kth
!>  transformation matrix, Z( k ), whose conjugate transpose is used to
!>  introduce zeros into the (m - k + 1)th row of A, is given in the form
!>
!>     Z( k ) = ( I     0   ),
!>              ( 0  T( k ) )
!>
!>  where
!>
!>     T( k ) = I - tau*u( k )*u( k )**H,   u( k ) = (   1    ),
!>                                                   (   0    )
!>                                                   ( z( k ) )
!>
!>  tau is a scalar and z( k ) is an ( n - m ) element vector.
!>  tau and z( k ) are chosen to annihilate the elements of the kth row
!>  of X.
!>
!>  The scalar tau is returned in the kth element of TAU and the vector
!>  u( k ) in the kth row of A, such that the elements of z( k ) are
!>  in  a( k, m + 1 ), ..., a( k, n ). The elements of R are returned in
!>  the upper triangular part of A.
!>
!>  Z is given by
!>
!>     Z =  Z( 1 ) * Z( 2 ) * ... * Z( m ).
!>

Definition at line 137 of file ctzrqf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CTZRQF.  The M-by-N (M<=N) upper trapezoidal matrix A
*     is reduced to ( R 0 )*Z with one Householder reflector per
*     row, generated from row M up to row 1.  TAU doubles as scratch
*     space: while row k is processed its first k-1 entries hold the
*     temporary vector w.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * )
*     ..
*
* =====================================================================
*
*     .. Parameters ..
      COMPLEX            CUNITY, CNULL
      parameter( cunity = ( 1.0e+0, 0.0e+0 ),
     $                   cnull = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      INTEGER            IDX, JTAIL, NTAIL, ROW
      COMPLEX            PIVOT, SCL
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max, min
*     ..
*     .. External Subroutines ..
      EXTERNAL           caxpy, ccopy, cgemv, cgerc, clacgv, clarfg,
     $                   xerbla
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  The checks are written from the last
*     argument to the first so that, when several are illegal, the
*     lowest-numbered one is the one reported.
*
      info = 0
      IF( lda.LT.max( 1, m ) )
     $   info = -4
      IF( n.LT.m )
     $   info = -2
      IF( m.LT.0 )
     $   info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTZRQF', -info )
         RETURN
      END IF
*
*     An empty matrix needs no work.
*
      IF( m.EQ.0 )
     $   RETURN
*
*     A square matrix is left untouched; only TAU is cleared.
*
      IF( m.EQ.n ) THEN
         DO idx = 1, n
            tau( idx ) = cnull
         END DO
         RETURN
      END IF
*
*     General case, M < N.  NTAIL is the number of trailing columns
*     and JTAIL the index of the first of them.
*
      ntail = n - m
      jtail = min( m+1, n )
      DO row = m, 1, -1
*
*        Set up the Householder reflection that zeroes the trailing
*        part of this row of A.
*
         a( row, row ) = conjg( a( row, row ) )
         CALL clacgv( ntail, a( row, jtail ), lda )
         pivot = a( row, row )
         CALL clarfg( ntail+1, pivot, a( row, jtail ), lda,
     $                tau( row ) )
         a( row, row ) = pivot
         tau( row ) = conjg( tau( row ) )
*
*        Rows above the current one only need updating when the
*        reflector is not the identity and such rows exist.
*
         IF( .NOT.( tau( row ).EQ.cnull .OR. row.LE.1 ) ) THEN
            scl = -conjg( tau( row ) )
*
*           Let a(row) be the first row-1 entries of column "row" of
*           A and B the first row-1 rows of the trailing columns.
*           Copy a(row) into TAU, then accumulate
*           w = a(row) + B*z(row) there.
*
            CALL ccopy( row-1, a( 1, row ), 1, tau, 1 )
            CALL cgemv( 'No transpose', row-1, ntail, cunity,
     $                  a( 1, jtail ), lda, a( row, jtail ), lda,
     $                  cunity, tau, 1 )
*
*           a(row) := a(row) - conjg(tau)*w
*           B      := B      - conjg(tau)*w*z(row)**H
*
            CALL caxpy( row-1, scl, tau, 1, a( 1, row ), 1 )
            CALL cgerc( row-1, ntail, scl, tau, 1, a( row, jtail ),
     $                  lda, a( 1, jtail ), lda )
         END IF
      END DO
*
      RETURN
*
*     End of CTZRQF
*

◆ ctzrzf()

subroutine ctzrzf	(	integer	m,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CTZRZF

Download CTZRZF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CTZRZF reduces the M-by-N ( M<=N ) complex upper trapezoidal matrix A
!> to upper triangular form by means of unitary transformations.
!>
!> The upper trapezoidal matrix A is factored as
!>
!>    A = ( R  0 ) * Z,
!>
!> where Z is an N-by-N unitary matrix and R is an M-by-M upper
!> triangular matrix.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= M. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the leading M-by-N upper trapezoidal part of the !> array A must contain the matrix to be factorized. !> On exit, the leading M-by-M upper triangular part of A !> contains the upper triangular matrix R, and elements M+1 to !> N of the first M rows of A, with the array TAU, represent the !> unitary matrix Z as a product of M elementary reflectors. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	TAU	!> TAU is COMPLEX array, dimension (M) !> The scalar factors of the elementary reflectors. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,M). !> For optimum performance LWORK >= M*NB, where NB is !> the optimal blocksize. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: A. Petitet, Computer Science Dept., Univ. of Tenn., Knoxville, USA

Further Details:

!>
!>  The N-by-N matrix Z can be computed by
!>
!>     Z =  Z(1)*Z(2)* ... *Z(M)
!>
!>  where each N-by-N Z(k) is given by
!>
!>     Z(k) = I - tau(k)*v(k)*v(k)**H
!>
!>  where v(k) is the kth row vector of the M-by-N matrix
!>
!>     V = ( I   A(:,M+1:N) )
!>
!>  I is the M-by-M identity matrix, A(:,M+1:N)
!>  is the output stored in A on exit from CTZRZF,
!>  and tau(k) is the kth element of the array TAU.
!>
!>

Definition at line 150 of file ctzrzf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CTZRZF.  Reduces the M-by-N (M<=N) upper trapezoidal
*     matrix A to ( R 0 )*Z.  Trailing row blocks are factored with
*     CLATRZ and applied to the rows above them with CLARZT/CLARZB;
*     whatever rows remain are factored by one final CLATRZ call.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CNULL
      parameter( cnull = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            WSQRY
      INTEGER            BLK, BLKMIN, IROW, JTAIL, KBASE, KBLK, LDT,
     $                   NLEFT, NROWS, NTAIL, WSMIN, WSNEED, WSOPT,
     $                   XOVER
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla, clarzb, clarzt, clatrz
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  The checks are written from the last
*     argument to the first so that the lowest-numbered illegal
*     argument is the one reported.
*
      info = 0
      wsqry = ( lwork.EQ.-1 )
      IF( lda.LT.max( 1, m ) )
     $   info = -4
      IF( n.LT.m )
     $   info = -2
      IF( m.LT.0 )
     $   info = -1
*
*     Workspace sizes.  The block size is only queried when there is
*     real work to do (M nonzero and M different from N).
*
      IF( info.EQ.0 ) THEN
         IF( m.NE.0 .AND. m.NE.n ) THEN
            blk = ilaenv( 1, 'CGERQF', ' ', m, n, -1, -1 )
            wsopt = m*blk
            wsmin = max( 1, m )
         ELSE
            wsopt = 1
            wsmin = 1
         END IF
         work( 1 ) = wsopt
*
         IF( .NOT.wsqry .AND. lwork.LT.wsmin )
     $      info = -7
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CTZRZF', -info )
         RETURN
      END IF
*
*     A workspace query stops here; WORK(1) already holds the answer.
*
      IF( wsqry )
     $   RETURN
*
*     Quick returns: empty matrix, or square matrix (TAU cleared).
*
      IF( m.EQ.0 )
     $   RETURN
      IF( m.EQ.n ) THEN
         DO irow = 1, n
            tau( irow ) = cnull
         END DO
         RETURN
      END IF
*
      ntail = n - m
      blkmin = 2
      xover = 1
      wsneed = m
      IF( blk.GT.1 .AND. blk.LT.m ) THEN
*
*        Crossover point between blocked and unblocked code.
*
         xover = max( 0, ilaenv( 3, 'CGERQF', ' ', m, n, -1, -1 ) )
         IF( xover.LT.m ) THEN
*
*           Check whether WORK can hold the optimal block size.
*
            ldt = m
            wsneed = ldt*blk
            IF( lwork.LT.wsneed ) THEN
*
*              It cannot: shrink the block size to what fits and
*              fetch the smallest block size worth using.
*
               blk = lwork / ldt
               blkmin = max( 2, ilaenv( 2, 'CGERQF', ' ', m, n, -1,
     $                  -1 ) )
            END IF
         END IF
      END IF
*
      IF( blk.GE.blkmin .AND. blk.LT.m .AND. xover.LT.m ) THEN
*
*        Blocked phase: the last KBLK rows are processed block by
*        block, starting with the bottom block.
*
         jtail = min( m+1, n )
         kbase = ( ( m-xover-1 ) / blk )*blk
         kblk = min( m, kbase+blk )
*
         DO irow = m - kblk + kbase + 1, m - kblk + 1, -blk
            nrows = min( m-irow+1, blk )
*
*           TZ factorization of the current block
*           A(irow:irow+nrows-1,irow:n)
*
            CALL clatrz( nrows, n-irow+1, ntail, a( irow, irow ),
     $                   lda, tau( irow ), work )
            IF( irow.GT.1 ) THEN
*
*              Triangular factor of the block reflector
*              H = H(irow+nrows-1) . . . H(irow+1) H(irow)
*
               CALL clarzt( 'Backward', 'Rowwise', ntail, nrows,
     $                      a( irow, jtail ), lda, tau( irow ), work,
     $                      ldt )
*
*              Apply H to A(1:irow-1,irow:n) from the right
*
               CALL clarzb( 'Right', 'No transpose', 'Backward',
     $                      'Rowwise', irow-1, n-irow+1, nrows,
     $                      ntail, a( irow, jtail ), lda, work, ldt,
     $                      a( 1, irow ), lda, work( nrows+1 ), ldt )
            END IF
         END DO
*
*        The loop index has stepped one block past the last block
*        processed; the rows above that block are still to be done.
*
         nleft = irow + blk - 1
      ELSE
         nleft = m
      END IF
*
*     Unblocked code for the remaining (or only) block of rows.
*
      IF( nleft.GT.0 )
     $   CALL clatrz( nleft, n, ntail, a, lda, tau, work )
*
      work( 1 ) = wsopt
*
      RETURN
*
*     End of CTZRZF
*

◆ cunbdb()

subroutine cunbdb	(	character	trans,
		character	signs,
		integer	m,
		integer	p,
		integer	q,
		complex, dimension( ldx11, * )	x11,
		integer	ldx11,
		complex, dimension( ldx12, * )	x12,
		integer	ldx12,
		complex, dimension( ldx21, * )	x21,
		integer	ldx21,
		complex, dimension( ldx22, * )	x22,
		integer	ldx22,
		real, dimension( * )	theta,
		real, dimension( * )	phi,
		complex, dimension( * )	taup1,
		complex, dimension( * )	taup2,
		complex, dimension( * )	tauq1,
		complex, dimension( * )	tauq2,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNBDB

Download CUNBDB + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNBDB simultaneously bidiagonalizes the blocks of an M-by-M
!> partitioned unitary matrix X:
!>
!>                                 [ B11 | B12 0  0 ]
!>     [ X11 | X12 ]   [ P1 |    ] [  0  |  0 -I  0 ] [ Q1 |    ]**H
!> X = [-----------] = [---------] [----------------] [---------]   .
!>     [ X21 | X22 ]   [    | P2 ] [ B21 | B22 0  0 ] [    | Q2 ]
!>                                 [  0  |  0  0  I ]
!>
!> X11 is P-by-Q. Q must be no larger than P, M-P, or M-Q. (If this is
!> not the case, then X must be transposed and/or permuted. This can be
!> done in constant time using the TRANS and SIGNS options. See CUNCSD
!> for details.)
!>
!> The unitary matrices P1, P2, Q1, and Q2 are P-by-P, (M-P)-by-
!> (M-P), Q-by-Q, and (M-Q)-by-(M-Q), respectively. They are
!> represented implicitly by Householder vectors.
!>
!> B11, B12, B21, and B22 are Q-by-Q bidiagonal matrices represented
!> implicitly by angles THETA, PHI.
!>

Parameters

[in]	TRANS	!> TRANS is CHARACTER !> = 'T': X, U1, U2, V1T, and V2T are stored in row-major !> order; !> otherwise: X, U1, U2, V1T, and V2T are stored in column- !> major order. !>
[in]	SIGNS	!> SIGNS is CHARACTER !> = 'O': The lower-left block is made nonpositive (the !> "other" convention); !> otherwise: The upper-right block is made nonpositive (the !> "default" convention). !>
[in]	M	!> M is INTEGER !> The number of rows and columns in X. !>
[in]	P	!> P is INTEGER !> The number of rows in X11 and X12. 0 <= P <= M. !>
[in]	Q	!> Q is INTEGER !> The number of columns in X11 and X21. 0 <= Q <= !> MIN(P,M-P,M-Q). !>
[in,out]	X11	!> X11 is COMPLEX array, dimension (LDX11,Q) !> On entry, the top-left block of the unitary matrix to be !> reduced. On exit, the form depends on TRANS: !> If TRANS = 'N', then !> the columns of tril(X11) specify reflectors for P1, !> the rows of triu(X11,1) specify reflectors for Q1; !> else TRANS = 'T', and !> the rows of triu(X11) specify reflectors for P1, !> the columns of tril(X11,-1) specify reflectors for Q1. !>
[in]	LDX11	!> LDX11 is INTEGER !> The leading dimension of X11. If TRANS = 'N', then LDX11 >= !> P; else LDX11 >= Q. !>
[in,out]	X12	!> X12 is COMPLEX array, dimension (LDX12,M-Q) !> On entry, the top-right block of the unitary matrix to !> be reduced. On exit, the form depends on TRANS: !> If TRANS = 'N', then !> the rows of triu(X12) specify the first P reflectors for !> Q2; !> else TRANS = 'T', and !> the columns of tril(X12) specify the first P reflectors !> for Q2. !>
[in]	LDX12	!> LDX12 is INTEGER !> The leading dimension of X12. If TRANS = 'N', then LDX12 >= !> P; else LDX12 >= M-Q. !>
[in,out]	X21	!> X21 is COMPLEX array, dimension (LDX21,Q) !> On entry, the bottom-left block of the unitary matrix to !> be reduced. On exit, the form depends on TRANS: !> If TRANS = 'N', then !> the columns of tril(X21) specify reflectors for P2; !> else TRANS = 'T', and !> the rows of triu(X21) specify reflectors for P2. !>
[in]	LDX21	!> LDX21 is INTEGER !> The leading dimension of X21. If TRANS = 'N', then LDX21 >= !> M-P; else LDX21 >= Q. !>
[in,out]	X22	!> X22 is COMPLEX array, dimension (LDX22,M-Q) !> On entry, the bottom-right block of the unitary matrix to !> be reduced. On exit, the form depends on TRANS: !> If TRANS = 'N', then !> the rows of triu(X22(Q+1:M-P,P+1:M-Q)) specify the last !> M-P-Q reflectors for Q2, !> else TRANS = 'T', and !> the columns of tril(X22(P+1:M-Q,Q+1:M-P)) specify the last !> M-P-Q reflectors for P2. !>
[in]	LDX22	!> LDX22 is INTEGER !> The leading dimension of X22. If TRANS = 'N', then LDX22 >= !> M-P; else LDX22 >= M-Q. !>
[out]	THETA	!> THETA is REAL array, dimension (Q) !> The entries of the bidiagonal blocks B11, B12, B21, B22 can !> be computed from the angles THETA and PHI. See Further !> Details. !>
[out]	PHI	!> PHI is REAL array, dimension (Q-1) !> The entries of the bidiagonal blocks B11, B12, B21, B22 can !> be computed from the angles THETA and PHI. See Further !> Details. !>
[out]	TAUP1	!> TAUP1 is COMPLEX array, dimension (P) !> The scalar factors of the elementary reflectors that define !> P1. !>
[out]	TAUP2	!> TAUP2 is COMPLEX array, dimension (M-P) !> The scalar factors of the elementary reflectors that define !> P2. !>
[out]	TAUQ1	!> TAUQ1 is COMPLEX array, dimension (Q) !> The scalar factors of the elementary reflectors that define !> Q1. !>
[out]	TAUQ2	!> TAUQ2 is COMPLEX array, dimension (M-Q) !> The scalar factors of the elementary reflectors that define !> Q2. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (LWORK) !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= M-Q. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The bidiagonal blocks B11, B12, B21, and B22 are represented
!>  implicitly by angles THETA(1), ..., THETA(Q) and PHI(1), ...,
!>  PHI(Q-1). B11 and B21 are upper bidiagonal, while B12 and B22 are
!>  lower bidiagonal. Every entry in each bidiagonal band is a product
!>  of a sine or cosine of a THETA with a sine or cosine of a PHI. See
!>  [1] or CUNCSD for details.
!>
!>  P1, P2, Q1, and Q2 are represented as products of elementary
!>  reflectors. See CUNCSD for details on generating P1, P2, Q1, and Q2
!>  using CUNGQR and CUNGLQ.
!>

References:: [1] Brian D. Sutton. Computing the complete CS decomposition. Numer. Algorithms, 50(1):33-65, 2009.

Definition at line 284 of file cunbdb.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CUNBDB.  Simultaneously bidiagonalizes the four blocks
*     X11, X12, X21, X22 of a partitioned M-by-M unitary matrix.
*     The angles are returned in THETA and PHI; the Householder
*     vectors overwrite the blocks and their scalar factors go to
*     TAUP1, TAUP2, TAUQ1 and TAUQ2.
*
*     INFO = -3, -4, -5   : M, P or Q out of range
*     INFO = -7,-9,-11,-13: LDX11, LDX12, LDX21 or LDX22 too small
*     INFO = -21          : LWORK < M-Q and not a workspace query
*
*     .. Scalar Arguments ..
      CHARACTER          SIGNS, TRANS
      INTEGER            INFO, LDX11, LDX12, LDX21, LDX22, LWORK, M, P,
     $                   Q
*     ..
*     .. Array Arguments ..
      REAL               PHI( * ), THETA( * )
      COMPLEX            TAUP1( * ), TAUP2( * ), TAUQ1( * ), TAUQ2( * ),
     $                   WORK( * ), X11( LDX11, * ), X12( LDX12, * ),
     $                   X21( LDX21, * ), X22( LDX22, * )
*     ..
*
*  ====================================================================
*
*     .. Parameters ..
      REAL               REALONE
      parameter( realone = 1.0e0 )
      COMPLEX            ONE
      parameter( one = (1.0e0,0.0e0) )
*     ..
*     .. Local Scalars ..
      LOGICAL            COLMAJOR, LQUERY
      INTEGER            I, LWORKMIN, LWORKOPT
      REAL               Z1, Z2, Z3, Z4
*     ..
*     .. External Subroutines ..
      EXTERNAL           caxpy, clarf, clarfgp, cscal, xerbla
      EXTERNAL           clacgv
*
*     ..
*     .. External Functions ..
      REAL               SCNRM2
      LOGICAL            LSAME
      EXTERNAL           scnrm2, lsame
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          atan2, cos, max, min, sin
      INTRINSIC          cmplx, conjg
*     ..
*     .. Executable Statements ..
*
*     Test input arguments
*
*     Any TRANS other than 'T' selects column-major storage.  The
*     sign factors Z1..Z4 are all +1 unless SIGNS = 'O', in which
*     case Z2 and Z4 become -1.
*
      info = 0
      colmajor = .NOT. lsame( trans, 'T' )
      IF( .NOT. lsame( signs, 'O' ) ) THEN
         z1 = realone
         z2 = realone
         z3 = realone
         z4 = realone
      ELSE
         z1 = realone
         z2 = -realone
         z3 = realone
         z4 = -realone
      END IF
      lquery = lwork .EQ. -1
*
      IF( m .LT. 0 ) THEN
         info = -3
      ELSE IF( p .LT. 0 .OR. p .GT. m ) THEN
         info = -4
      ELSE IF( q .LT. 0 .OR. q .GT. p .OR. q .GT. m-p .OR.
     $         q .GT. m-q ) THEN
         info = -5
      ELSE IF( colmajor .AND. ldx11 .LT. max( 1, p ) ) THEN
         info = -7
      ELSE IF( .NOT.colmajor .AND. ldx11 .LT. max( 1, q ) ) THEN
         info = -7
      ELSE IF( colmajor .AND. ldx12 .LT. max( 1, p ) ) THEN
         info = -9
      ELSE IF( .NOT.colmajor .AND. ldx12 .LT. max( 1, m-q ) ) THEN
         info = -9
      ELSE IF( colmajor .AND. ldx21 .LT. max( 1, m-p ) ) THEN
         info = -11
      ELSE IF( .NOT.colmajor .AND. ldx21 .LT. max( 1, q ) ) THEN
         info = -11
      ELSE IF( colmajor .AND. ldx22 .LT. max( 1, m-p ) ) THEN
         info = -13
      ELSE IF( .NOT.colmajor .AND. ldx22 .LT. max( 1, m-q ) ) THEN
         info = -13
      END IF
*
*     Compute workspace
*
*     Minimal and optimal workspace are both M-Q; the value is
*     reported in WORK(1) whenever the other arguments are legal.
*
      IF( info .EQ. 0 ) THEN
         lworkopt = m - q
         lworkmin = m - q
         work(1) = lworkopt
         IF( lwork .LT. lworkmin .AND. .NOT. lquery ) THEN
            info = -21
         END IF
      END IF
*
*     Report errors under this routine's own name so that the XERBLA
*     message identifies CUNBDB as the caller.
*
      IF( info .NE. 0 ) THEN
         CALL xerbla( 'CUNBDB', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Handle column-major and row-major separately
*
      IF( colmajor ) THEN
*
*        Reduce columns 1, ..., Q of X11, X12, X21, and X22
*
         DO i = 1, q
*
*           Scale column i of X11 and X21; for i > 1 also mix in
*           column i-1 of X12 / X22, weighted by cos and sin of
*           PHI(i-1).
*
            IF( i .EQ. 1 ) THEN
               CALL cscal( p-i+1, cmplx( z1, 0.0e0 ), x11(i,i), 1 )
            ELSE
               CALL cscal( p-i+1, cmplx( z1*cos(phi(i-1)), 0.0e0 ),
     $                     x11(i,i), 1 )
               CALL caxpy( p-i+1, cmplx( -z1*z3*z4*sin(phi(i-1)),
     $                     0.0e0 ), x12(i,i-1), 1, x11(i,i), 1 )
            END IF
            IF( i .EQ. 1 ) THEN
               CALL cscal( m-p-i+1, cmplx( z2, 0.0e0 ), x21(i,i), 1 )
            ELSE
               CALL cscal( m-p-i+1, cmplx( z2*cos(phi(i-1)), 0.0e0 ),
     $                     x21(i,i), 1 )
               CALL caxpy( m-p-i+1, cmplx( -z2*z3*z4*sin(phi(i-1)),
     $                     0.0e0 ), x22(i,i-1), 1, x21(i,i), 1 )
            END IF
*
*           THETA(i) from the norms of the two updated columns.
*
            theta(i) = atan2( scnrm2( m-p-i+1, x21(i,i), 1 ),
     $                 scnrm2( p-i+1, x11(i,i), 1 ) )
*
*           Generate the reflectors for P1 and P2.  When only one
*           element is left, the vector argument aliases the pivot
*           so that no element past the column end is referenced.
*
            IF( p .GT. i ) THEN
               CALL clarfgp( p-i+1, x11(i,i), x11(i+1,i), 1, taup1(i) )
            ELSE IF ( p .EQ. i ) THEN
               CALL clarfgp( p-i+1, x11(i,i), x11(i,i), 1, taup1(i) )
            END IF
            x11(i,i) = one
            IF ( m-p .GT. i ) THEN
               CALL clarfgp( m-p-i+1, x21(i,i), x21(i+1,i), 1,
     $                       taup2(i) )
            ELSE IF ( m-p .EQ. i ) THEN
               CALL clarfgp( m-p-i+1, x21(i,i), x21(i,i), 1,
     $                       taup2(i) )
            END IF
            x21(i,i) = one
*
*           Apply the two reflectors from the left to the remaining
*           columns of all four blocks.
*
            IF ( q .GT. i ) THEN
               CALL clarf( 'L', p-i+1, q-i, x11(i,i), 1,
     $                     conjg(taup1(i)), x11(i,i+1), ldx11, work )
               CALL clarf( 'L', m-p-i+1, q-i, x21(i,i), 1,
     $                     conjg(taup2(i)), x21(i,i+1), ldx21, work )
            END IF
            IF ( m-q+1 .GT. i ) THEN
               CALL clarf( 'L', p-i+1, m-q-i+1, x11(i,i), 1,
     $                     conjg(taup1(i)), x12(i,i), ldx12, work )
               CALL clarf( 'L', m-p-i+1, m-q-i+1, x21(i,i), 1,
     $                     conjg(taup2(i)), x22(i,i), ldx22, work )
            END IF
*
*           Combine row i of X11 with row i of X21, and row i of X12
*           with row i of X22, weighted by sin and cos of THETA(i).
*
            IF( i .LT. q ) THEN
               CALL cscal( q-i, cmplx( -z1*z3*sin(theta(i)), 0.0e0 ),
     $                     x11(i,i+1), ldx11 )
               CALL caxpy( q-i, cmplx( z2*z3*cos(theta(i)), 0.0e0 ),
     $                     x21(i,i+1), ldx21, x11(i,i+1), ldx11 )
            END IF
            CALL cscal( m-q-i+1, cmplx( -z1*z4*sin(theta(i)), 0.0e0 ),
     $                  x12(i,i), ldx12 )
            CALL caxpy( m-q-i+1, cmplx( z2*z4*cos(theta(i)), 0.0e0 ),
     $                  x22(i,i), ldx22, x12(i,i), ldx12 )
*
*           PHI(i) from the norms of the two updated rows.
*
            IF( i .LT. q )
     $         phi(i) = atan2( scnrm2( q-i, x11(i,i+1), ldx11 ),
     $                  scnrm2( m-q-i+1, x12(i,i), ldx12 ) )
*
*           Generate the reflectors for Q1 and Q2 from the conjugated
*           rows; the conjugation is undone at the end of the
*           iteration.
*
            IF( i .LT. q ) THEN
               CALL clacgv( q-i, x11(i,i+1), ldx11 )
               IF ( i .EQ. q-1 ) THEN
                  CALL clarfgp( q-i, x11(i,i+1), x11(i,i+1), ldx11,
     $                          tauq1(i) )
               ELSE
                  CALL clarfgp( q-i, x11(i,i+1), x11(i,i+2), ldx11,
     $                          tauq1(i) )
               END IF
               x11(i,i+1) = one
            END IF
            IF ( m-q+1 .GT. i ) THEN
               CALL clacgv( m-q-i+1, x12(i,i), ldx12 )
               IF ( m-q .EQ. i ) THEN
                  CALL clarfgp( m-q-i+1, x12(i,i), x12(i,i), ldx12,
     $                          tauq2(i) )
               ELSE
                  CALL clarfgp( m-q-i+1, x12(i,i), x12(i,i+1), ldx12,
     $                          tauq2(i) )
               END IF
            END IF
            x12(i,i) = one
*
*           Apply the Q1 and Q2 reflectors from the right to the
*           rows below row i.
*
            IF( i .LT. q ) THEN
               CALL clarf( 'R', p-i, q-i, x11(i,i+1), ldx11, tauq1(i),
     $                     x11(i+1,i+1), ldx11, work )
               CALL clarf( 'R', m-p-i, q-i, x11(i,i+1), ldx11, tauq1(i),
     $                     x21(i+1,i+1), ldx21, work )
            END IF
            IF ( p .GT. i ) THEN
               CALL clarf( 'R', p-i, m-q-i+1, x12(i,i), ldx12, tauq2(i),
     $                     x12(i+1,i), ldx12, work )
            END IF
            IF ( m-p .GT. i ) THEN
               CALL clarf( 'R', m-p-i, m-q-i+1, x12(i,i), ldx12,
     $                     tauq2(i), x22(i+1,i), ldx22, work )
            END IF
*
            IF( i .LT. q )
     $         CALL clacgv( q-i, x11(i,i+1), ldx11 )
            CALL clacgv( m-q-i+1, x12(i,i), ldx12 )
*
         END DO
*
*        Reduce columns Q + 1, ..., P of X12, X22
*
         DO i = q + 1, p
*
            CALL cscal( m-q-i+1, cmplx( -z1*z4, 0.0e0 ), x12(i,i),
     $                  ldx12 )
            CALL clacgv( m-q-i+1, x12(i,i), ldx12 )
            IF ( i .GE. m-q ) THEN
               CALL clarfgp( m-q-i+1, x12(i,i), x12(i,i), ldx12,
     $                       tauq2(i) )
            ELSE
               CALL clarfgp( m-q-i+1, x12(i,i), x12(i,i+1), ldx12,
     $                       tauq2(i) )
            END IF
            x12(i,i) = one
*
            IF ( p .GT. i ) THEN
               CALL clarf( 'R', p-i, m-q-i+1, x12(i,i), ldx12, tauq2(i),
     $                     x12(i+1,i), ldx12, work )
            END IF
            IF( m-p-q .GE. 1 )
     $         CALL clarf( 'R', m-p-q, m-q-i+1, x12(i,i), ldx12,
     $                     tauq2(i), x22(q+1,i), ldx22, work )
*
            CALL clacgv( m-q-i+1, x12(i,i), ldx12 )
*
         END DO
*
*        Reduce columns P + 1, ..., M - Q of X12, X22
*
         DO i = 1, m - p - q
*
            CALL cscal( m-p-q-i+1, cmplx( z2*z4, 0.0e0 ),
     $                  x22(q+i,p+i), ldx22 )
            CALL clacgv( m-p-q-i+1, x22(q+i,p+i), ldx22 )
            CALL clarfgp( m-p-q-i+1, x22(q+i,p+i), x22(q+i,p+i+1),
     $                    ldx22, tauq2(p+i) )
            x22(q+i,p+i) = one
            CALL clarf( 'R', m-p-q-i, m-p-q-i+1, x22(q+i,p+i), ldx22,
     $                  tauq2(p+i), x22(q+i+1,p+i), ldx22, work )
*
            CALL clacgv( m-p-q-i+1, x22(q+i,p+i), ldx22 )
*
         END DO
*
      ELSE
*
*        Row-major case (TRANS = 'T'): the same steps as above with
*        the roles of rows and columns exchanged.
*
*        Reduce columns 1, ..., Q of X11, X12, X21, X22
*
         DO i = 1, q
*
            IF( i .EQ. 1 ) THEN
               CALL cscal( p-i+1, cmplx( z1, 0.0e0 ), x11(i,i),
     $                     ldx11 )
            ELSE
               CALL cscal( p-i+1, cmplx( z1*cos(phi(i-1)), 0.0e0 ),
     $                     x11(i,i), ldx11 )
               CALL caxpy( p-i+1, cmplx( -z1*z3*z4*sin(phi(i-1)),
     $                     0.0e0 ), x12(i-1,i), ldx12, x11(i,i), ldx11 )
            END IF
            IF( i .EQ. 1 ) THEN
               CALL cscal( m-p-i+1, cmplx( z2, 0.0e0 ), x21(i,i),
     $                     ldx21 )
            ELSE
               CALL cscal( m-p-i+1, cmplx( z2*cos(phi(i-1)), 0.0e0 ),
     $                     x21(i,i), ldx21 )
               CALL caxpy( m-p-i+1, cmplx( -z2*z3*z4*sin(phi(i-1)),
     $                     0.0e0 ), x22(i-1,i), ldx22, x21(i,i), ldx21 )
            END IF
*
            theta(i) = atan2( scnrm2( m-p-i+1, x21(i,i), ldx21 ),
     $                 scnrm2( p-i+1, x11(i,i), ldx11 ) )
*
*           The rows are conjugated while the P1/P2 reflectors are
*           generated and applied, then conjugated back.
*
            CALL clacgv( p-i+1, x11(i,i), ldx11 )
            CALL clacgv( m-p-i+1, x21(i,i), ldx21 )
*
            CALL clarfgp( p-i+1, x11(i,i), x11(i,i+1), ldx11, taup1(i) )
            x11(i,i) = one
            IF ( i .EQ. m-p ) THEN
               CALL clarfgp( m-p-i+1, x21(i,i), x21(i,i), ldx21,
     $                       taup2(i) )
            ELSE
               CALL clarfgp( m-p-i+1, x21(i,i), x21(i,i+1), ldx21,
     $                       taup2(i) )
            END IF
            x21(i,i) = one
*
            CALL clarf( 'R', q-i, p-i+1, x11(i,i), ldx11, taup1(i),
     $                  x11(i+1,i), ldx11, work )
            CALL clarf( 'R', m-q-i+1, p-i+1, x11(i,i), ldx11, taup1(i),
     $                  x12(i,i), ldx12, work )
            CALL clarf( 'R', q-i, m-p-i+1, x21(i,i), ldx21, taup2(i),
     $                  x21(i+1,i), ldx21, work )
            CALL clarf( 'R', m-q-i+1, m-p-i+1, x21(i,i), ldx21,
     $                  taup2(i), x22(i,i), ldx22, work )
*
            CALL clacgv( p-i+1, x11(i,i), ldx11 )
            CALL clacgv( m-p-i+1, x21(i,i), ldx21 )
*
            IF( i .LT. q ) THEN
               CALL cscal( q-i, cmplx( -z1*z3*sin(theta(i)), 0.0e0 ),
     $                     x11(i+1,i), 1 )
               CALL caxpy( q-i, cmplx( z2*z3*cos(theta(i)), 0.0e0 ),
     $                     x21(i+1,i), 1, x11(i+1,i), 1 )
            END IF
            CALL cscal( m-q-i+1, cmplx( -z1*z4*sin(theta(i)), 0.0e0 ),
     $                  x12(i,i), 1 )
            CALL caxpy( m-q-i+1, cmplx( z2*z4*cos(theta(i)), 0.0e0 ),
     $                  x22(i,i), 1, x12(i,i), 1 )
*
            IF( i .LT. q )
     $         phi(i) = atan2( scnrm2( q-i, x11(i+1,i), 1 ),
     $                  scnrm2( m-q-i+1, x12(i,i), 1 ) )
*
            IF( i .LT. q ) THEN
               CALL clarfgp( q-i, x11(i+1,i), x11(i+2,i), 1, tauq1(i) )
               x11(i+1,i) = one
            END IF
            CALL clarfgp( m-q-i+1, x12(i,i), x12(i+1,i), 1, tauq2(i) )
            x12(i,i) = one
*
            IF( i .LT. q ) THEN
               CALL clarf( 'L', q-i, p-i, x11(i+1,i), 1,
     $                     conjg(tauq1(i)), x11(i+1,i+1), ldx11, work )
               CALL clarf( 'L', q-i, m-p-i, x11(i+1,i), 1,
     $                     conjg(tauq1(i)), x21(i+1,i+1), ldx21, work )
            END IF
            CALL clarf( 'L', m-q-i+1, p-i, x12(i,i), 1, conjg(tauq2(i)),
     $                  x12(i,i+1), ldx12, work )
*
            IF ( m-p .GT. i ) THEN
               CALL clarf( 'L', m-q-i+1, m-p-i, x12(i,i), 1,
     $                     conjg(tauq2(i)), x22(i,i+1), ldx22, work )
            END IF
         END DO
*
*        Reduce columns Q + 1, ..., P of X12, X22
*
         DO i = q + 1, p
*
            CALL cscal( m-q-i+1, cmplx( -z1*z4, 0.0e0 ), x12(i,i), 1 )
            CALL clarfgp( m-q-i+1, x12(i,i), x12(i+1,i), 1, tauq2(i) )
            x12(i,i) = one
*
            IF ( p .GT. i ) THEN
               CALL clarf( 'L', m-q-i+1, p-i, x12(i,i), 1,
     $                     conjg(tauq2(i)), x12(i,i+1), ldx12, work )
            END IF
            IF( m-p-q .GE. 1 )
     $         CALL clarf( 'L', m-q-i+1, m-p-q, x12(i,i), 1,
     $                     conjg(tauq2(i)), x22(i,q+1), ldx22, work )
*
         END DO
*
*        Reduce columns P + 1, ..., M - Q of X12, X22
*
         DO i = 1, m - p - q
*
            CALL cscal( m-p-q-i+1, cmplx( z2*z4, 0.0e0 ),
     $                  x22(p+i,q+i), 1 )
            CALL clarfgp( m-p-q-i+1, x22(p+i,q+i), x22(p+i+1,q+i), 1,
     $                    tauq2(p+i) )
            x22(p+i,q+i) = one
            IF ( m-p-q .NE. i ) THEN
               CALL clarf( 'L', m-p-q-i+1, m-p-q-i, x22(p+i,q+i), 1,
     $                     conjg(tauq2(p+i)), x22(p+i,q+i+1), ldx22,
     $                     work )
            END IF
         END DO
*
      END IF
*
      RETURN
*
*     End of CUNBDB
*

◆ cunbdb1()

subroutine cunbdb1	(	integer	m,
		integer	p,
		integer	q,
		complex, dimension(ldx11,*)	x11,
		integer	ldx11,
		complex, dimension(ldx21,*)	x21,
		integer	ldx21,
		real, dimension(*)	theta,
		real, dimension(*)	phi,
		complex, dimension(*)	taup1,
		complex, dimension(*)	taup2,
		complex, dimension(*)	tauq1,
		complex, dimension(*)	work,
		integer	lwork,
		integer	info )

CUNBDB1

Download CUNBDB1 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNBDB1 simultaneously bidiagonalizes the blocks of a tall and skinny
!> matrix X with orthonormal columns:
!>
!>                            [ B11 ]
!>      [ X11 ]   [ P1 |    ] [  0  ]
!>      [-----] = [---------] [-----] Q1**T .
!>      [ X21 ]   [    | P2 ] [ B21 ]
!>                            [  0  ]
!>
!> X11 is P-by-Q, and X21 is (M-P)-by-Q. Q must be no larger than P,
!> M-P, or M-Q. Routines CUNBDB2, CUNBDB3, and CUNBDB4 handle cases in
!> which Q is not the minimum dimension.
!>
!> The unitary matrices P1, P2, and Q1 are P-by-P, (M-P)-by-(M-P),
!> and (M-Q)-by-(M-Q), respectively. They are represented implicitly by
!> Householder vectors.
!>
!> B11 and B21 are Q-by-Q bidiagonal matrices represented implicitly by
!> angles THETA, PHI.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows in X11 plus the number of rows in X21. !>
[in]	P	!> P is INTEGER !> The number of rows in X11. 0 <= P <= M. !>
[in]	Q	!> Q is INTEGER !> The number of columns in X11 and X21. 0 <= Q <= !> MIN(P,M-P,M-Q). !>
[in,out]	X11	!> X11 is COMPLEX array, dimension (LDX11,Q) !> On entry, the top block of the matrix X to be reduced. On !> exit, the columns of tril(X11) specify reflectors for P1 and !> the rows of triu(X11,1) specify reflectors for Q1. !>
[in]	LDX11	!> LDX11 is INTEGER !> The leading dimension of X11. LDX11 >= P. !>
[in,out]	X21	!> X21 is COMPLEX array, dimension (LDX21,Q) !> On entry, the bottom block of the matrix X to be reduced. On !> exit, the columns of tril(X21) specify reflectors for P2. !>
[in]	LDX21	!> LDX21 is INTEGER !> The leading dimension of X21. LDX21 >= M-P. !>
[out]	THETA	!> THETA is REAL array, dimension (Q) !> The entries of the bidiagonal blocks B11, B21 are defined by !> THETA and PHI. See Further Details. !>
[out]	PHI	!> PHI is REAL array, dimension (Q-1) !> The entries of the bidiagonal blocks B11, B21 are defined by !> THETA and PHI. See Further Details. !>
[out]	TAUP1	!> TAUP1 is COMPLEX array, dimension (P) !> The scalar factors of the elementary reflectors that define !> P1. !>
[out]	TAUP2	!> TAUP2 is COMPLEX array, dimension (M-P) !> The scalar factors of the elementary reflectors that define !> P2. !>
[out]	TAUQ1	!> TAUQ1 is COMPLEX array, dimension (Q) !> The scalar factors of the elementary reflectors that define !> Q1. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (LWORK) !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= M-Q. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The upper-bidiagonal blocks B11, B21 are represented implicitly by
!>  angles THETA(1), ..., THETA(Q) and PHI(1), ..., PHI(Q-1). Every entry
!>  in each bidiagonal band is a product of a sine or cosine of a THETA
!>  with a sine or cosine of a PHI. See [1] or CUNCSD for details.
!>
!>  P1, P2, and Q1 are represented as products of elementary reflectors.
!>  See CUNCSD2BY1 for details on generating P1, P2, and Q1 using CUNGQR
!>  and CUNGLQ.
!>

References:: [1] Brian D. Sutton. Computing the complete CS decomposition. Numer. Algorithms, 50(1):33-65, 2009.

Definition at line 200 of file cunbdb1.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CUNBDB1.  It checks M, P, Q, LDX11, LDX21 and LWORK,
*     stores the workspace size in WORK(1), and then sweeps over
*     columns 1, ..., Q of X11 and X21, filling THETA, PHI, TAUP1,
*     TAUP2 and TAUQ1 and overwriting X11 and X21 in place.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LWORK, M, P, Q, LDX11, LDX21
*     ..
*     .. Array Arguments ..
      REAL               PHI(*), THETA(*)
      COMPLEX            TAUP1(*), TAUP2(*), TAUQ1(*), WORK(*),
     $                   X11(LDX11,*), X21(LDX21,*)
*     ..
*
*  ====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE
      parameter( one = (1.0e0,0.0e0) )
*     ..
*     .. Local Scalars ..
*     C, S       cosine/sine pair handed to CSROT; also reused as
*                scratch for the ATAN2 arguments of PHI(I)
*     ILARF      first WORK index used as CLARF scratch
*     IORBDB5    first WORK index used as CUNBDB5 scratch
*     LLARF      length of the CLARF scratch area
*     LORBDB5    length of the CUNBDB5 scratch area
*     CHILDINFO  INFO returned by CUNBDB5 (not examined here)
      REAL               C, S
      INTEGER            CHILDINFO, I, ILARF, IORBDB5, LLARF, LORBDB5,
     $                   LWORKMIN, LWORKOPT
      LOGICAL            LQUERY
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarf, clarfgp, cunbdb5, csrot, xerbla
      EXTERNAL           clacgv
*     ..
*     .. External Functions ..
      REAL               SCNRM2
      EXTERNAL           scnrm2
*     ..
*     .. Intrinsic Function ..
      INTRINSIC          atan2, cos, max, sin, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test input arguments
*
*     LWORK = -1 requests a workspace query only.
*
      info = 0
      lquery = lwork .EQ. -1
*
*     The first failing test wins; INFO = -k flags argument k.
*     Q must not exceed P, M-P or M-Q.
*
      IF( m .LT. 0 ) THEN
         info = -1
      ELSE IF( p .LT. q .OR. m-p .LT. q ) THEN
         info = -2
      ELSE IF( q .LT. 0 .OR. m-q .LT. q ) THEN
         info = -3
      ELSE IF( ldx11 .LT. max( 1, p ) ) THEN
         info = -5
      ELSE IF( ldx21 .LT. max( 1, m-p ) ) THEN
         info = -7
      END IF
*
*     Compute workspace
*
*     WORK(1) receives LWORKOPT.  The CLARF and CUNBDB5 scratch areas
*     both start at WORK(2), so they occupy the same storage.  The
*     minimum and optimal sizes are identical.
*
      IF( info .EQ. 0 ) THEN
         ilarf = 2
         llarf = max( p-1, m-p-1, q-1 )
         iorbdb5 = 2
         lorbdb5 = q-2
         lworkopt = max( ilarf+llarf-1, iorbdb5+lorbdb5-1 )
         lworkmin = lworkopt
         work(1) = lworkopt
         IF( lwork .LT. lworkmin .AND. .NOT.lquery ) THEN
           info = -14
         END IF
      END IF
*
*     Report an illegal argument through XERBLA, or return right
*     after a workspace query with WORK(1) already set.
*
      IF( info .NE. 0 ) THEN
         CALL xerbla( 'CUNBDB1', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Reduce columns 1, ..., Q of X11 and X21
*
      DO i = 1, q
*
*        Generate reflectors from column I of X11 (rows I..P) and of
*        X21 (rows I..M-P); the scalar factors go to TAUP1(I) and
*        TAUP2(I).
*
         CALL clarfgp( p-i+1, x11(i,i), x11(i+1,i), 1, taup1(i) )
         CALL clarfgp( m-p-i+1, x21(i,i), x21(i+1,i), 1, taup2(i) )
*
*        THETA(I) comes from the real parts of the two diagonal
*        entries; they must be read before being overwritten by ONE.
*
         theta(i) = atan2( real( x21(i,i) ), real( x11(i,i) ) )
         c = cos( theta(i) )
         s = sin( theta(i) )
*
*        Put an explicit one on the diagonal so that column I can be
*        passed to CLARF as the reflector vector, then apply both
*        reflectors from the left to the trailing Q-I columns.
*
         x11(i,i) = one
         x21(i,i) = one
         CALL clarf( 'L', p-i+1, q-i, x11(i,i), 1, conjg(taup1(i)),
     $               x11(i,i+1), ldx11, work(ilarf) )
         CALL clarf( 'L', m-p-i+1, q-i, x21(i,i), 1, conjg(taup2(i)),
     $               x21(i,i+1), ldx21, work(ilarf) )
*
         IF( i .LT. q ) THEN
*
*           Rotate row I of X11 against row I of X21 (columns
*           I+1..Q) using C = COS(THETA(I)), S = SIN(THETA(I)).
*
            CALL csrot( q-i, x11(i,i+1), ldx11, x21(i,i+1), ldx21, c,
     $                  s )
*
*           Conjugate row I of X21, build a reflector from it
*           (factor in TAUQ1(I)), and keep the real part of its
*           leading entry in S before that entry is set to ONE.
*
            CALL clacgv( q-i, x21(i,i+1), ldx21 )
            CALL clarfgp( q-i, x21(i,i+1), x21(i,i+2), ldx21, tauq1(i) )
            s = real( x21(i,i+1) )
            x21(i,i+1) = one
*
*           Apply that reflector from the right to the rows below
*           row I in both blocks, then undo the conjugation.
*
            CALL clarf( 'R', p-i, q-i, x21(i,i+1), ldx21, tauq1(i),
     $                  x11(i+1,i+1), ldx11, work(ilarf) )
            CALL clarf( 'R', m-p-i, q-i, x21(i,i+1), ldx21, tauq1(i),
     $                  x21(i+1,i+1), ldx21, work(ilarf) )
            CALL clacgv( q-i, x21(i,i+1), ldx21 )
*
*           C is the 2-norm of column I+1 stacked over both blocks
*           (rows I+1 and below); PHI(I) = ATAN2( S, C ).
*
            c = sqrt( scnrm2( p-i, x11(i+1,i+1), 1 )**2
     $              + scnrm2( m-p-i, x21(i+1,i+1), 1 )**2 )
            phi(i) = atan2( s, c )
*
*           Hand column I+1 (both blocks) to CUNBDB5 together with
*           the trailing Q-I-1 columns.  CHILDINFO is not checked.
*
            CALL cunbdb5( p-i, m-p-i, q-i-1, x11(i+1,i+1), 1,
     $                    x21(i+1,i+1), 1, x11(i+1,i+2), ldx11,
     $                    x21(i+1,i+2), ldx21, work(iorbdb5), lorbdb5,
     $                    childinfo )
         END IF
*
      END DO
*
      RETURN
*
*     End of CUNBDB1
*

◆ cunbdb2()

subroutine cunbdb2	(	integer	m,
		integer	p,
		integer	q,
		complex, dimension(ldx11,*)	x11,
		integer	ldx11,
		complex, dimension(ldx21,*)	x21,
		integer	ldx21,
		real, dimension(*)	theta,
		real, dimension(*)	phi,
		complex, dimension(*)	taup1,
		complex, dimension(*)	taup2,
		complex, dimension(*)	tauq1,
		complex, dimension(*)	work,
		integer	lwork,
		integer	info )

CUNBDB2

Download CUNBDB2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNBDB2 simultaneously bidiagonalizes the blocks of a tall and skinny
!> matrix X with orthonormal columns:
!>
!>                            [ B11 ]
!>      [ X11 ]   [ P1 |    ] [  0  ]
!>      [-----] = [---------] [-----] Q1**T .
!>      [ X21 ]   [    | P2 ] [ B21 ]
!>                            [  0  ]
!>
!> X11 is P-by-Q, and X21 is (M-P)-by-Q. P must be no larger than M-P,
!> Q, or M-Q. Routines CUNBDB1, CUNBDB3, and CUNBDB4 handle cases in
!> which P is not the minimum dimension.
!>
!> The unitary matrices P1, P2, and Q1 are P-by-P, (M-P)-by-(M-P),
!> and (M-Q)-by-(M-Q), respectively. They are represented implicitly by
!> Householder vectors.
!>
!> B11 and B21 are P-by-P bidiagonal matrices represented implicitly by
!> angles THETA, PHI.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows in X11 plus the number of rows in X21. !>
[in]	P	!> P is INTEGER !> The number of rows in X11. 0 <= P <= min(M-P,Q,M-Q). !>
[in]	Q	!> Q is INTEGER !> The number of columns in X11 and X21. 0 <= Q <= M. !>
[in,out]	X11	!> X11 is COMPLEX array, dimension (LDX11,Q) !> On entry, the top block of the matrix X to be reduced. On !> exit, the columns of tril(X11) specify reflectors for P1 and !> the rows of triu(X11,1) specify reflectors for Q1. !>
[in]	LDX11	!> LDX11 is INTEGER !> The leading dimension of X11. LDX11 >= P. !>
[in,out]	X21	!> X21 is COMPLEX array, dimension (LDX21,Q) !> On entry, the bottom block of the matrix X to be reduced. On !> exit, the columns of tril(X21) specify reflectors for P2. !>
[in]	LDX21	!> LDX21 is INTEGER !> The leading dimension of X21. LDX21 >= M-P. !>
[out]	THETA	!> THETA is REAL array, dimension (Q) !> The entries of the bidiagonal blocks B11, B21 are defined by !> THETA and PHI. See Further Details. !>
[out]	PHI	!> PHI is REAL array, dimension (Q-1) !> The entries of the bidiagonal blocks B11, B21 are defined by !> THETA and PHI. See Further Details. !>
[out]	TAUP1	!> TAUP1 is COMPLEX array, dimension (P) !> The scalar factors of the elementary reflectors that define !> P1. !>
[out]	TAUP2	!> TAUP2 is COMPLEX array, dimension (M-P) !> The scalar factors of the elementary reflectors that define !> P2. !>
[out]	TAUQ1	!> TAUQ1 is COMPLEX array, dimension (Q) !> The scalar factors of the elementary reflectors that define !> Q1. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (LWORK) !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= M-Q. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The upper-bidiagonal blocks B11, B21 are represented implicitly by
!>  angles THETA(1), ..., THETA(Q) and PHI(1), ..., PHI(Q-1). Every entry
!>  in each bidiagonal band is a product of a sine or cosine of a THETA
!>  with a sine or cosine of a PHI. See [1] or CUNCSD for details.
!>
!>  P1, P2, and Q1 are represented as products of elementary reflectors.
!>  See CUNCSD2BY1 for details on generating P1, P2, and Q1 using CUNGQR
!>  and CUNGLQ.
!>

References:: [1] Brian D. Sutton. Computing the complete CS decomposition. Numer. Algorithms, 50(1):33-65, 2009.

Definition at line 200 of file cunbdb2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CUNBDB2.  It checks M, P, Q, LDX11, LDX21 and LWORK,
*     stores the workspace size in WORK(1), sweeps over rows
*     1, ..., P of X11 and X21 filling THETA, PHI, TAUP1, TAUP2 and
*     TAUQ1, and finally processes columns P+1, ..., Q of X21.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LWORK, M, P, Q, LDX11, LDX21
*     ..
*     .. Array Arguments ..
      REAL               PHI(*), THETA(*)
      COMPLEX            TAUP1(*), TAUP2(*), TAUQ1(*), WORK(*),
     $                   X11(LDX11,*), X21(LDX21,*)
*     ..
*
*  ====================================================================
*
*     .. Parameters ..
      COMPLEX            NEGONE, ONE
      parameter( negone = (-1.0e0,0.0e0),
     $                     one = (1.0e0,0.0e0) )
*     ..
*     .. Local Scalars ..
*     C, S       cosine/sine pair handed to CSROT on the next row;
*                also reused as scratch for the ATAN2 arguments of
*                THETA(I)
*     ILARF      first WORK index used as CLARF scratch
*     IORBDB5    first WORK index used as CUNBDB5 scratch
*     LLARF      length of the CLARF scratch area
*     LORBDB5    length of the CUNBDB5 scratch area
*     CHILDINFO  INFO returned by CUNBDB5 (not examined here)
      REAL               C, S
      INTEGER            CHILDINFO, I, ILARF, IORBDB5, LLARF, LORBDB5,
     $                   LWORKMIN, LWORKOPT
      LOGICAL            LQUERY
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarf, clarfgp, cunbdb5, csrot, cscal, clacgv,
     $                   xerbla
*     ..
*     .. External Functions ..
      REAL               SCNRM2
      EXTERNAL           scnrm2
*     ..
*     .. Intrinsic Function ..
      INTRINSIC          atan2, cos, max, sin, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test input arguments
*
*     LWORK = -1 requests a workspace query only.
*
      info = 0
      lquery = lwork .EQ. -1
*
*     The first failing test wins; INFO = -k flags argument k.
*     P must not exceed M-P, Q or M-Q.
*
      IF( m .LT. 0 ) THEN
         info = -1
      ELSE IF( p .LT. 0 .OR. p .GT. m-p ) THEN
         info = -2
      ELSE IF( q .LT. 0 .OR. q .LT. p .OR. m-q .LT. p ) THEN
         info = -3
      ELSE IF( ldx11 .LT. max( 1, p ) ) THEN
         info = -5
      ELSE IF( ldx21 .LT. max( 1, m-p ) ) THEN
         info = -7
      END IF
*
*     Compute workspace
*
*     WORK(1) receives LWORKOPT.  The CLARF and CUNBDB5 scratch areas
*     both start at WORK(2), so they occupy the same storage.  The
*     minimum and optimal sizes are identical.
*
      IF( info .EQ. 0 ) THEN
         ilarf = 2
         llarf = max( p-1, m-p, q-1 )
         iorbdb5 = 2
         lorbdb5 = q-1
         lworkopt = max( ilarf+llarf-1, iorbdb5+lorbdb5-1 )
         lworkmin = lworkopt
         work(1) = lworkopt
         IF( lwork .LT. lworkmin .AND. .NOT.lquery ) THEN
           info = -14
         END IF
      END IF
*
*     Report an illegal argument through XERBLA, or return right
*     after a workspace query with WORK(1) already set.
*
      IF( info .NE. 0 ) THEN
         CALL xerbla( 'CUNBDB2', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Reduce rows 1, ..., P of X11 and X21
*
      DO i = 1, p
*
*        From the second row on, rotate row I of X11 against row I-1
*        of X21 (columns I..Q).  C and S are COS(PHI(I-1)) and
*        SIN(PHI(I-1)), set at the end of the previous iteration.
*
         IF( i .GT. 1 ) THEN
            CALL csrot( q-i+1, x11(i,i), ldx11, x21(i-1,i), ldx21, c,
     $                  s )
         END IF
*
*        Conjugate row I of X11, build a reflector from it (factor
*        in TAUQ1(I)), and keep the real part of its leading entry
*        in C before that entry is set to ONE.
*
         CALL clacgv( q-i+1, x11(i,i), ldx11 )
         CALL clarfgp( q-i+1, x11(i,i), x11(i,i+1), ldx11, tauq1(i) )
         c = real( x11(i,i) )
         x11(i,i) = one
*
*        Apply the row reflector from the right to the rows of X11
*        below row I and to rows I..M-P of X21, then undo the
*        conjugation.
*
         CALL clarf( 'R', p-i, q-i+1, x11(i,i), ldx11, tauq1(i),
     $               x11(i+1,i), ldx11, work(ilarf) )
         CALL clarf( 'R', m-p-i+1, q-i+1, x11(i,i), ldx11, tauq1(i),
     $               x21(i,i), ldx21, work(ilarf) )
         CALL clacgv( q-i+1, x11(i,i), ldx11 )
*
*        S is the 2-norm of column I stacked over X11(I+1:P,I) and
*        X21(I:M-P,I); THETA(I) = ATAN2( S, C ).
*
         s = sqrt( scnrm2( p-i, x11(i+1,i), 1 )**2
     $           + scnrm2( m-p-i+1, x21(i,i), 1 )**2 )
         theta(i) = atan2( s, c )
*
*        Hand column I (both blocks) to CUNBDB5 together with the
*        trailing Q-I columns (CHILDINFO is not checked), then negate
*        the X11 part of that column.
*
         CALL cunbdb5( p-i, m-p-i+1, q-i, x11(i+1,i), 1, x21(i,i), 1,
     $                 x11(i+1,i+1), ldx11, x21(i,i+1), ldx21,
     $                 work(iorbdb5), lorbdb5, childinfo )
         CALL cscal( p-i, negone, x11(i+1,i), 1 )
*
*        Column reflector for X21 (factor in TAUP2(I)).
*
         CALL clarfgp( m-p-i+1, x21(i,i), x21(i+1,i), 1, taup2(i) )
         IF( i .LT. p ) THEN
*
*           Column reflector for X11 (factor in TAUP1(I)).  PHI(I)
*           uses the real parts of X11(I+1,I) and X21(I,I), which
*           must be read before those entries are set to ONE.
*
            CALL clarfgp( p-i, x11(i+1,i), x11(i+2,i), 1, taup1(i) )
            phi(i) = atan2( real( x11(i+1,i) ), real( x21(i,i) ) )
            c = cos( phi(i) )
            s = sin( phi(i) )
            x11(i+1,i) = one
            CALL clarf( 'L', p-i, q-i, x11(i+1,i), 1, conjg(taup1(i)),
     $                  x11(i+1,i+1), ldx11, work(ilarf) )
         END IF
*
*        Apply the X21 column reflector from the left to the
*        trailing Q-I columns of X21.
*
         x21(i,i) = one
         CALL clarf( 'L', m-p-i+1, q-i, x21(i,i), 1, conjg(taup2(i)),
     $               x21(i,i+1), ldx21, work(ilarf) )
*
      END DO
*
*     Reduce the bottom-right portion of X21 to the identity matrix
*
*     Only column reflectors on X21 remain; no angles are produced.
*
      DO i = p + 1, q
         CALL clarfgp( m-p-i+1, x21(i,i), x21(i+1,i), 1, taup2(i) )
         x21(i,i) = one
         CALL clarf( 'L', m-p-i+1, q-i, x21(i,i), 1, conjg(taup2(i)),
     $               x21(i,i+1), ldx21, work(ilarf) )
      END DO
*
      RETURN
*
*     End of CUNBDB2
*

◆ cunbdb3()

subroutine cunbdb3	(	integer	m,
		integer	p,
		integer	q,
		complex, dimension(ldx11,*)	x11,
		integer	ldx11,
		complex, dimension(ldx21,*)	x21,
		integer	ldx21,
		real, dimension(*)	theta,
		real, dimension(*)	phi,
		complex, dimension(*)	taup1,
		complex, dimension(*)	taup2,
		complex, dimension(*)	tauq1,
		complex, dimension(*)	work,
		integer	lwork,
		integer	info )

CUNBDB3

Download CUNBDB3 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNBDB3 simultaneously bidiagonalizes the blocks of a tall and skinny
!> matrix X with orthonormal columns:
!>
!>                            [ B11 ]
!>      [ X11 ]   [ P1 |    ] [  0  ]
!>      [-----] = [---------] [-----] Q1**T .
!>      [ X21 ]   [    | P2 ] [ B21 ]
!>                            [  0  ]
!>
!> X11 is P-by-Q, and X21 is (M-P)-by-Q. M-P must be no larger than P,
!> Q, or M-Q. Routines CUNBDB1, CUNBDB2, and CUNBDB4 handle cases in
!> which M-P is not the minimum dimension.
!>
!> The unitary matrices P1, P2, and Q1 are P-by-P, (M-P)-by-(M-P),
!> and (M-Q)-by-(M-Q), respectively. They are represented implicitly by
!> Householder vectors.
!>
!> B11 and B21 are (M-P)-by-(M-P) bidiagonal matrices represented
!> implicitly by angles THETA, PHI.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows in X11 plus the number of rows in X21. !>
[in]	P	!> P is INTEGER !> The number of rows in X11. 0 <= P <= M. M-P <= min(P,Q,M-Q). !>
[in]	Q	!> Q is INTEGER !> The number of columns in X11 and X21. 0 <= Q <= M. !>
[in,out]	X11	!> X11 is COMPLEX array, dimension (LDX11,Q) !> On entry, the top block of the matrix X to be reduced. On !> exit, the columns of tril(X11) specify reflectors for P1 and !> the rows of triu(X11,1) specify reflectors for Q1. !>
[in]	LDX11	!> LDX11 is INTEGER !> The leading dimension of X11. LDX11 >= P. !>
[in,out]	X21	!> X21 is COMPLEX array, dimension (LDX21,Q) !> On entry, the bottom block of the matrix X to be reduced. On !> exit, the columns of tril(X21) specify reflectors for P2. !>
[in]	LDX21	!> LDX21 is INTEGER !> The leading dimension of X21. LDX21 >= M-P. !>
[out]	THETA	!> THETA is REAL array, dimension (Q) !> The entries of the bidiagonal blocks B11, B21 are defined by !> THETA and PHI. See Further Details. !>
[out]	PHI	!> PHI is REAL array, dimension (Q-1) !> The entries of the bidiagonal blocks B11, B21 are defined by !> THETA and PHI. See Further Details. !>
[out]	TAUP1	!> TAUP1 is COMPLEX array, dimension (P) !> The scalar factors of the elementary reflectors that define !> P1. !>
[out]	TAUP2	!> TAUP2 is COMPLEX array, dimension (M-P) !> The scalar factors of the elementary reflectors that define !> P2. !>
[out]	TAUQ1	!> TAUQ1 is COMPLEX array, dimension (Q) !> The scalar factors of the elementary reflectors that define !> Q1. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (LWORK) !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= M-Q. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The upper-bidiagonal blocks B11, B21 are represented implicitly by
!>  angles THETA(1), ..., THETA(Q) and PHI(1), ..., PHI(Q-1). Every entry
!>  in each bidiagonal band is a product of a sine or cosine of a THETA
!>  with a sine or cosine of a PHI. See [1] or CUNCSD for details.
!>
!>  P1, P2, and Q1 are represented as products of elementary reflectors.
!>  See CUNCSD2BY1 for details on generating P1, P2, and Q1 using CUNGQR
!>  and CUNGLQ.
!>

References:: [1] Brian D. Sutton. Computing the complete CS decomposition. Numer. Algorithms, 50(1):33-65, 2009.

Definition at line 200 of file cunbdb3.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CUNBDB3.  It checks M, P, Q, LDX11, LDX21 and LWORK,
*     stores the workspace size in WORK(1), sweeps over rows
*     1, ..., M-P of X11 and X21 filling THETA, PHI, TAUP1, TAUP2
*     and TAUQ1, and finally processes columns M-P+1, ..., Q of X11.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LWORK, M, P, Q, LDX11, LDX21
*     ..
*     .. Array Arguments ..
      REAL               PHI(*), THETA(*)
      COMPLEX            TAUP1(*), TAUP2(*), TAUQ1(*), WORK(*),
     $                   X11(LDX11,*), X21(LDX21,*)
*     ..
*
*  ====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE
      parameter( one = (1.0e0,0.0e0) )
*     ..
*     .. Local Scalars ..
*     C, S       cosine/sine pair handed to CSROT on the next row;
*                also reused as scratch for the ATAN2 arguments of
*                THETA(I)
*     ILARF      first WORK index used as CLARF scratch
*     IORBDB5    first WORK index used as CUNBDB5 scratch
*     LLARF      length of the CLARF scratch area
*     LORBDB5    length of the CUNBDB5 scratch area
*     CHILDINFO  INFO returned by CUNBDB5 (not examined here)
      REAL               C, S
      INTEGER            CHILDINFO, I, ILARF, IORBDB5, LLARF, LORBDB5,
     $                   LWORKMIN, LWORKOPT
      LOGICAL            LQUERY
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarf, clarfgp, cunbdb5, csrot, clacgv, xerbla
*     ..
*     .. External Functions ..
      REAL               SCNRM2
      EXTERNAL           scnrm2
*     ..
*     .. Intrinsic Function ..
      INTRINSIC          atan2, cos, max, sin, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test input arguments
*
*     LWORK = -1 requests a workspace query only.
*
      info = 0
      lquery = lwork .EQ. -1
*
*     The first failing test wins; INFO = -k flags argument k.
*     M-P must not exceed P, Q or M-Q.
*
      IF( m .LT. 0 ) THEN
         info = -1
      ELSE IF( 2*p .LT. m .OR. p .GT. m ) THEN
         info = -2
      ELSE IF( q .LT. m-p .OR. m-q .LT. m-p ) THEN
         info = -3
      ELSE IF( ldx11 .LT. max( 1, p ) ) THEN
         info = -5
      ELSE IF( ldx21 .LT. max( 1, m-p ) ) THEN
         info = -7
      END IF
*
*     Compute workspace
*
*     WORK(1) receives LWORKOPT.  The CLARF and CUNBDB5 scratch areas
*     both start at WORK(2), so they occupy the same storage.  The
*     minimum and optimal sizes are identical.
*
      IF( info .EQ. 0 ) THEN
         ilarf = 2
         llarf = max( p, m-p-1, q-1 )
         iorbdb5 = 2
         lorbdb5 = q-1
         lworkopt = max( ilarf+llarf-1, iorbdb5+lorbdb5-1 )
         lworkmin = lworkopt
         work(1) = lworkopt
         IF( lwork .LT. lworkmin .AND. .NOT.lquery ) THEN
           info = -14
         END IF
      END IF
*
*     Report an illegal argument through XERBLA, or return right
*     after a workspace query with WORK(1) already set.
*
      IF( info .NE. 0 ) THEN
         CALL xerbla( 'CUNBDB3', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Reduce rows 1, ..., M-P of X11 and X21
*
      DO i = 1, m-p
*
*        From the second row on, rotate row I-1 of X11 against row I
*        of X21 (columns I..Q).  C and S are COS(PHI(I-1)) and
*        SIN(PHI(I-1)), set at the end of the previous iteration.
*        X21 is declared X21(LDX21,*), so stepping along one of its
*        rows requires stride LDX21, not LDX11.
*
         IF( i .GT. 1 ) THEN
            CALL csrot( q-i+1, x11(i-1,i), ldx11, x21(i,i), ldx21, c,
     $                  s )
         END IF
*
*        Conjugate row I of X21, build a reflector from it (factor
*        in TAUQ1(I)), and keep the real part of its leading entry
*        in S before that entry is set to ONE.
*
         CALL clacgv( q-i+1, x21(i,i), ldx21 )
         CALL clarfgp( q-i+1, x21(i,i), x21(i,i+1), ldx21, tauq1(i) )
         s = real( x21(i,i) )
         x21(i,i) = one
*
*        Apply the row reflector from the right to rows I..P of X11
*        and to the rows of X21 below row I, then undo the
*        conjugation.
*
         CALL clarf( 'R', p-i+1, q-i+1, x21(i,i), ldx21, tauq1(i),
     $               x11(i,i), ldx11, work(ilarf) )
         CALL clarf( 'R', m-p-i, q-i+1, x21(i,i), ldx21, tauq1(i),
     $               x21(i+1,i), ldx21, work(ilarf) )
         CALL clacgv( q-i+1, x21(i,i), ldx21 )
*
*        C is the 2-norm of column I stacked over X11(I:P,I) and
*        X21(I+1:M-P,I); THETA(I) = ATAN2( S, C ).
*
         c = sqrt( scnrm2( p-i+1, x11(i,i), 1 )**2
     $           + scnrm2( m-p-i, x21(i+1,i), 1 )**2 )
         theta(i) = atan2( s, c )
*
*        Hand column I (both blocks) to CUNBDB5 together with the
*        trailing Q-I columns.  CHILDINFO is not checked.
*
         CALL cunbdb5( p-i+1, m-p-i, q-i, x11(i,i), 1, x21(i+1,i), 1,
     $                 x11(i,i+1), ldx11, x21(i+1,i+1), ldx21,
     $                 work(iorbdb5), lorbdb5, childinfo )
*
*        Column reflector for X11 (factor in TAUP1(I)).
*
         CALL clarfgp( p-i+1, x11(i,i), x11(i+1,i), 1, taup1(i) )
         IF( i .LT. m-p ) THEN
*
*           Column reflector for X21 (factor in TAUP2(I)).  PHI(I)
*           uses the real parts of X21(I+1,I) and X11(I,I), which
*           must be read before those entries are set to ONE.
*
            CALL clarfgp( m-p-i, x21(i+1,i), x21(i+2,i), 1, taup2(i) )
            phi(i) = atan2( real( x21(i+1,i) ), real( x11(i,i) ) )
            c = cos( phi(i) )
            s = sin( phi(i) )
            x21(i+1,i) = one
            CALL clarf( 'L', m-p-i, q-i, x21(i+1,i), 1, conjg(taup2(i)),
     $                  x21(i+1,i+1), ldx21, work(ilarf) )
         END IF
*
*        Apply the X11 column reflector from the left to the
*        trailing Q-I columns of X11.
*
         x11(i,i) = one
         CALL clarf( 'L', p-i+1, q-i, x11(i,i), 1, conjg(taup1(i)),
     $               x11(i,i+1), ldx11, work(ilarf) )
*
      END DO
*
*     Reduce the bottom-right portion of X11 to the identity matrix
*
*     Only column reflectors on X11 remain; no angles are produced.
*
      DO i = m-p + 1, q
         CALL clarfgp( p-i+1, x11(i,i), x11(i+1,i), 1, taup1(i) )
         x11(i,i) = one
         CALL clarf( 'L', p-i+1, q-i, x11(i,i), 1, conjg(taup1(i)),
     $               x11(i,i+1), ldx11, work(ilarf) )
      END DO
*
      RETURN
*
*     End of CUNBDB3
*

◆ cunbdb4()

subroutine cunbdb4	(	integer	m,
		integer	p,
		integer	q,
		complex, dimension(ldx11,*)	x11,
		integer	ldx11,
		complex, dimension(ldx21,*)	x21,
		integer	ldx21,
		real, dimension(*)	theta,
		real, dimension(*)	phi,
		complex, dimension(*)	taup1,
		complex, dimension(*)	taup2,
		complex, dimension(*)	tauq1,
		complex, dimension(*)	phantom,
		complex, dimension(*)	work,
		integer	lwork,
		integer	info )

CUNBDB4

Download CUNBDB4 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNBDB4 simultaneously bidiagonalizes the blocks of a tall and skinny
!> matrix X with orthonormal columns:
!>
!>                            [ B11 ]
!>      [ X11 ]   [ P1 |    ] [  0  ]
!>      [-----] = [---------] [-----] Q1**T .
!>      [ X21 ]   [    | P2 ] [ B21 ]
!>                            [  0  ]
!>
!> X11 is P-by-Q, and X21 is (M-P)-by-Q. M-Q must be no larger than P,
!> M-P, or Q. Routines CUNBDB1, CUNBDB2, and CUNBDB3 handle cases in
!> which M-Q is not the minimum dimension.
!>
!> The unitary matrices P1, P2, and Q1 are P-by-P, (M-P)-by-(M-P),
!> and (M-Q)-by-(M-Q), respectively. They are represented implicitly by
!> Householder vectors.
!>
!> B11 and B21 are (M-Q)-by-(M-Q) bidiagonal matrices represented
!> implicitly by angles THETA, PHI.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows in X11 plus the number of rows in X21. !>
[in]	P	!> P is INTEGER !> The number of rows in X11. 0 <= P <= M. !>
[in]	Q	!> Q is INTEGER !> The number of columns in X11 and X21. 0 <= Q <= M and !> M-Q <= min(P,M-P,Q). !>
[in,out]	X11	!> X11 is COMPLEX array, dimension (LDX11,Q) !> On entry, the top block of the matrix X to be reduced. On !> exit, the columns of tril(X11) specify reflectors for P1 and !> the rows of triu(X11,1) specify reflectors for Q1. !>
[in]	LDX11	!> LDX11 is INTEGER !> The leading dimension of X11. LDX11 >= P. !>
[in,out]	X21	!> X21 is COMPLEX array, dimension (LDX21,Q) !> On entry, the bottom block of the matrix X to be reduced. On !> exit, the columns of tril(X21) specify reflectors for P2. !>
[in]	LDX21	!> LDX21 is INTEGER !> The leading dimension of X21. LDX21 >= M-P. !>
[out]	THETA	!> THETA is REAL array, dimension (Q) !> The entries of the bidiagonal blocks B11, B21 are defined by !> THETA and PHI. See Further Details. !>
[out]	PHI	!> PHI is REAL array, dimension (Q-1) !> The entries of the bidiagonal blocks B11, B21 are defined by !> THETA and PHI. See Further Details. !>
[out]	TAUP1	!> TAUP1 is COMPLEX array, dimension (P) !> The scalar factors of the elementary reflectors that define !> P1. !>
[out]	TAUP2	!> TAUP2 is COMPLEX array, dimension (M-P) !> The scalar factors of the elementary reflectors that define !> P2. !>
[out]	TAUQ1	!> TAUQ1 is COMPLEX array, dimension (Q) !> The scalar factors of the elementary reflectors that define !> Q1. !>
[out]	PHANTOM	!> PHANTOM is COMPLEX array, dimension (M) !> The routine computes an M-by-1 column vector Y that is !> orthogonal to the columns of [ X11; X21 ]. PHANTOM(1:P) and !> PHANTOM(P+1:M) contain Householder vectors for Y(1:P) and !> Y(P+1:M), respectively. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (LWORK) !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= M-Q. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The upper-bidiagonal blocks B11, B21 are represented implicitly by
!>  angles THETA(1), ..., THETA(Q) and PHI(1), ..., PHI(Q-1). Every entry
!>  in each bidiagonal band is a product of a sine or cosine of a THETA
!>  with a sine or cosine of a PHI. See [1] or CUNCSD for details.
!>
!>  P1, P2, and Q1 are represented as products of elementary reflectors.
!>  See CUNCSD2BY1 for details on generating P1, P2, and Q1 using CUNGQR
!>  and CUNGLQ.
!>

References:: [1] Brian D. Sutton. Computing the complete CS decomposition. Numer. Algorithms, 50(1):33-65, 2009.

Definition at line 210 of file cunbdb4.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LWORK, M, P, Q, LDX11, LDX21
*     ..
*     .. Array Arguments ..
      REAL               PHI(*), THETA(*)
      COMPLEX            PHANTOM(*), TAUP1(*), TAUP2(*), TAUQ1(*),
     $                   WORK(*), X11(LDX11,*), X21(LDX21,*)
*     ..
*
*  ====================================================================
*
*     .. Parameters ..
      COMPLEX            NEGONE, ONE, ZERO
      parameter( negone = (-1.0e0,0.0e0), one = (1.0e0,0.0e0),
     $                     zero = (0.0e0,0.0e0) )
*     ..
*     .. Local Scalars ..
      REAL               C, S
      INTEGER            CHILDINFO, I, ILARF, IORBDB5, J, LLARF,
     $                   LORBDB5, LWORKMIN, LWORKOPT
      LOGICAL            LQUERY
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarf, clarfgp, cunbdb5, csrot, cscal, clacgv,
     $                   xerbla
*     ..
*     .. External Functions ..
      REAL               SCNRM2
      EXTERNAL           scnrm2
*     ..
*     .. Intrinsic Function ..
      INTRINSIC          atan2, cos, max, sin, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test input arguments
*
      info = 0
      lquery = lwork .EQ. -1
*
      IF( m .LT. 0 ) THEN
         info = -1
      ELSE IF( p .LT. m-q .OR. m-p .LT. m-q ) THEN
         info = -2
      ELSE IF( q .LT. m-q .OR. q .GT. m ) THEN
         info = -3
      ELSE IF( ldx11 .LT. max( 1, p ) ) THEN
         info = -5
      ELSE IF( ldx21 .LT. max( 1, m-p ) ) THEN
         info = -7
      END IF
*
*     Compute workspace
*
      IF( info .EQ. 0 ) THEN
         ilarf = 2
         llarf = max( q-1, p-1, m-p-1 )
         iorbdb5 = 2
         lorbdb5 = q
         lworkopt = ilarf + llarf - 1
         lworkopt = max( lworkopt, iorbdb5 + lorbdb5 - 1 )
         lworkmin = lworkopt
         work(1) = lworkopt
         IF( lwork .LT. lworkmin .AND. .NOT.lquery ) THEN
           info = -14
         END IF
      END IF
      IF( info .NE. 0 ) THEN
         CALL xerbla( 'CUNBDB4', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Reduce columns 1, ..., M-Q of X11 and X21
*
      DO i = 1, m-q
*
         IF( i .EQ. 1 ) THEN
            DO j = 1, m
               phantom(j) = zero
            END DO
            CALL cunbdb5( p, m-p, q, phantom(1), 1, phantom(p+1), 1,
     $                    x11, ldx11, x21, ldx21, work(iorbdb5),
     $                    lorbdb5, childinfo )
            CALL cscal( p, negone, phantom(1), 1 )
            CALL clarfgp( p, phantom(1), phantom(2), 1, taup1(1) )
            CALL clarfgp( m-p, phantom(p+1), phantom(p+2), 1, taup2(1) )
            theta(i) = atan2( real( phantom(1) ), real( phantom(p+1) ) )
            c = cos( theta(i) )
            s = sin( theta(i) )
            phantom(1) = one
            phantom(p+1) = one
            CALL clarf( 'L', p, q, phantom(1), 1, conjg(taup1(1)), x11,
     $                  ldx11, work(ilarf) )
            CALL clarf( 'L', m-p, q, phantom(p+1), 1, conjg(taup2(1)),
     $                  x21, ldx21, work(ilarf) )
         ELSE
            CALL cunbdb5( p-i+1, m-p-i+1, q-i+1, x11(i,i-1), 1,
     $                    x21(i,i-1), 1, x11(i,i), ldx11, x21(i,i),
     $                    ldx21, work(iorbdb5), lorbdb5, childinfo )
            CALL cscal( p-i+1, negone, x11(i,i-1), 1 )
            CALL clarfgp( p-i+1, x11(i,i-1), x11(i+1,i-1), 1, taup1(i) )
            CALL clarfgp( m-p-i+1, x21(i,i-1), x21(i+1,i-1), 1,
     $                    taup2(i) )
            theta(i) = atan2( real( x11(i,i-1) ), real( x21(i,i-1) ) )
            c = cos( theta(i) )
            s = sin( theta(i) )
            x11(i,i-1) = one
            x21(i,i-1) = one
            CALL clarf( 'L', p-i+1, q-i+1, x11(i,i-1), 1,
     $                  conjg(taup1(i)), x11(i,i), ldx11, work(ilarf) )
            CALL clarf( 'L', m-p-i+1, q-i+1, x21(i,i-1), 1,
     $                  conjg(taup2(i)), x21(i,i), ldx21, work(ilarf) )
         END IF
*
         CALL csrot( q-i+1, x11(i,i), ldx11, x21(i,i), ldx21, s, -c )
         CALL clacgv( q-i+1, x21(i,i), ldx21 )
         CALL clarfgp( q-i+1, x21(i,i), x21(i,i+1), ldx21, tauq1(i) )
         c = real( x21(i,i) )
         x21(i,i) = one
         CALL clarf( 'R', p-i, q-i+1, x21(i,i), ldx21, tauq1(i),
     $               x11(i+1,i), ldx11, work(ilarf) )
         CALL clarf( 'R', m-p-i, q-i+1, x21(i,i), ldx21, tauq1(i),
     $               x21(i+1,i), ldx21, work(ilarf) )
         CALL clacgv( q-i+1, x21(i,i), ldx21 )
         IF( i .LT. m-q ) THEN
            s = sqrt( scnrm2( p-i, x11(i+1,i), 1 )**2
     $              + scnrm2( m-p-i, x21(i+1,i), 1 )**2 )
            phi(i) = atan2( s, c )
         END IF
*
      END DO
*
*     Reduce the bottom-right portion of X11 to [ I 0 ]
*
      DO i = m - q + 1, p
         CALL clacgv( q-i+1, x11(i,i), ldx11 )
         CALL clarfgp( q-i+1, x11(i,i), x11(i,i+1), ldx11, tauq1(i) )
         x11(i,i) = one
         CALL clarf( 'R', p-i, q-i+1, x11(i,i), ldx11, tauq1(i),
     $               x11(i+1,i), ldx11, work(ilarf) )
         CALL clarf( 'R', q-p, q-i+1, x11(i,i), ldx11, tauq1(i),
     $               x21(m-q+1,i), ldx21, work(ilarf) )
         CALL clacgv( q-i+1, x11(i,i), ldx11 )
      END DO
*
*     Reduce the bottom-right portion of X21 to [ 0 I ]
*
      DO i = p + 1, q
         CALL clacgv( q-i+1, x21(m-q+i-p,i), ldx21 )
         CALL clarfgp( q-i+1, x21(m-q+i-p,i), x21(m-q+i-p,i+1), ldx21,
     $                 tauq1(i) )
         x21(m-q+i-p,i) = one
         CALL clarf( 'R', q-i, q-i+1, x21(m-q+i-p,i), ldx21, tauq1(i),
     $               x21(m-q+i-p+1,i), ldx21, work(ilarf) )
         CALL clacgv( q-i+1, x21(m-q+i-p,i), ldx21 )
      END DO
*
      RETURN
*
*     End of CUNBDB4
*

◆ cunbdb5()

subroutine cunbdb5	(	integer	m1,
		integer	m2,
		integer	n,
		complex, dimension(*)	x1,
		integer	incx1,
		complex, dimension(*)	x2,
		integer	incx2,
		complex, dimension(ldq1,*)	q1,
		integer	ldq1,
		complex, dimension(ldq2,*)	q2,
		integer	ldq2,
		complex, dimension(*)	work,
		integer	lwork,
		integer	info )

CUNBDB5

Download CUNBDB5 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNBDB5 orthogonalizes the column vector
!>      X = [ X1 ]
!>          [ X2 ]
!> with respect to the columns of
!>      Q = [ Q1 ] .
!>          [ Q2 ]
!> The columns of Q must be orthonormal.
!>
!> If the projection is zero according to Kahan's "twice is enough"
!> criterion, then some other vector from the orthogonal complement
!> is returned. This vector is chosen in an arbitrary but deterministic
!> way.
!>
!>

Parameters

[in]	M1	!> M1 is INTEGER !> The dimension of X1 and the number of rows in Q1. 0 <= M1. !>
[in]	M2	!> M2 is INTEGER !> The dimension of X2 and the number of rows in Q2. 0 <= M2. !>
[in]	N	!> N is INTEGER !> The number of columns in Q1 and Q2. 0 <= N. !>
[in,out]	X1	!> X1 is COMPLEX array, dimension (M1) !> On entry, the top part of the vector to be orthogonalized. !> On exit, the top part of the projected vector. !>
[in]	INCX1	!> INCX1 is INTEGER !> Increment for entries of X1. !>
[in,out]	X2	!> X2 is COMPLEX array, dimension (M2) !> On entry, the bottom part of the vector to be !> orthogonalized. On exit, the bottom part of the projected !> vector. !>
[in]	INCX2	!> INCX2 is INTEGER !> Increment for entries of X2. !>
[in]	Q1	!> Q1 is COMPLEX array, dimension (LDQ1, N) !> The top part of the orthonormal basis matrix. !>
[in]	LDQ1	!> LDQ1 is INTEGER !> The leading dimension of Q1. LDQ1 >= MAX(1,M1). !>
[in]	Q2	!> Q2 is COMPLEX array, dimension (LDQ2, N) !> The bottom part of the orthonormal basis matrix. !>
[in]	LDQ2	!> LDQ2 is INTEGER !> The leading dimension of Q2. LDQ2 >= MAX(1,M2). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (LWORK) !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= N. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 154 of file cunbdb5.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Orthogonalizes X = [ X1; X2 ] against the columns of
*     Q = [ Q1; Q2 ] by calling CUNBDB6.  If CUNBDB6 hands back the
*     zero vector, the standard basis vectors e_1, e_2, ... are
*     projected one at a time and the first nonzero projection is
*     returned in X.
*
*     Logical entry k of X1 is stored at X1(1+(k-1)*INCX1), and
*     likewise for X2 with INCX2.  The fallback loops below use that
*     addressing so they agree with SCNRM2 and CUNBDB6, which are
*     passed the same increments.
*
*     .. Scalar Arguments ..
      INTEGER            INCX1, INCX2, INFO, LDQ1, LDQ2, LWORK, M1, M2,
     $                   N
*     ..
*     .. Array Arguments ..
      COMPLEX            Q1(LDQ1,*), Q2(LDQ2,*), WORK(*), X1(*), X2(*)
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE, ZERO
      parameter( one = (1.0e0,0.0e0), zero = (0.0e0,0.0e0) )
*     ..
*     .. Local Scalars ..
      INTEGER            CHILDINFO, I, J
*     ..
*     .. External Subroutines ..
      EXTERNAL           cunbdb6, xerbla
*     ..
*     .. External Functions ..
      REAL               SCNRM2
      EXTERNAL           scnrm2
*     ..
*     .. Intrinsic Function ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Test input arguments (INFO = -k flags the k-th argument)
*
      info = 0
      IF( m1 .LT. 0 ) THEN
         info = -1
      ELSE IF( m2 .LT. 0 ) THEN
         info = -2
      ELSE IF( n .LT. 0 ) THEN
         info = -3
      ELSE IF( incx1 .LT. 1 ) THEN
         info = -5
      ELSE IF( incx2 .LT. 1 ) THEN
         info = -7
      ELSE IF( ldq1 .LT. max( 1, m1 ) ) THEN
         info = -9
      ELSE IF( ldq2 .LT. max( 1, m2 ) ) THEN
         info = -11
      ELSE IF( lwork .LT. n ) THEN
         info = -13
      END IF
*
      IF( info .NE. 0 ) THEN
         CALL xerbla( 'CUNBDB5', -info )
         RETURN
      END IF
*
*     Project X onto the orthogonal complement of Q
*
      CALL cunbdb6( m1, m2, n, x1, incx1, x2, incx2, q1, ldq1, q2, ldq2,
     $              work, lwork, childinfo )
*
*     If the projection is nonzero, then return
*
      IF( scnrm2(m1,x1,incx1) .NE. zero
     $    .OR. scnrm2(m2,x2,incx2) .NE. zero ) THEN
         RETURN
      END IF
*
*     Project each standard basis vector e_1,...,e_M1 in turn, stopping
*     when a nonzero projection is found.  X is rebuilt from scratch on
*     every pass because CUNBDB6 overwrites it.
*
      DO i = 1, m1
         DO j = 1, m1
            x1(1+(j-1)*incx1) = zero
         END DO
         x1(1+(i-1)*incx1) = one
         DO j = 1, m2
            x2(1+(j-1)*incx2) = zero
         END DO
         CALL cunbdb6( m1, m2, n, x1, incx1, x2, incx2, q1, ldq1, q2,
     $                 ldq2, work, lwork, childinfo )
         IF( scnrm2(m1,x1,incx1) .NE. zero
     $       .OR. scnrm2(m2,x2,incx2) .NE. zero ) THEN
            RETURN
         END IF
      END DO
*
*     Project each standard basis vector e_(M1+1),...,e_(M1+M2) in turn,
*     stopping when a nonzero projection is found
*
      DO i = 1, m2
         DO j = 1, m1
            x1(1+(j-1)*incx1) = zero
         END DO
         DO j = 1, m2
            x2(1+(j-1)*incx2) = zero
         END DO
         x2(1+(i-1)*incx2) = one
         CALL cunbdb6( m1, m2, n, x1, incx1, x2, incx2, q1, ldq1, q2,
     $                 ldq2, work, lwork, childinfo )
         IF( scnrm2(m1,x1,incx1) .NE. zero
     $       .OR. scnrm2(m2,x2,incx2) .NE. zero ) THEN
            RETURN
         END IF
      END DO
*
      RETURN
*
*     End of CUNBDB5
*

◆ cunbdb6()

subroutine cunbdb6	(	integer	m1,
		integer	m2,
		integer	n,
		complex, dimension(*)	x1,
		integer	incx1,
		complex, dimension(*)	x2,
		integer	incx2,
		complex, dimension(ldq1,*)	q1,
		integer	ldq1,
		complex, dimension(ldq2,*)	q2,
		integer	ldq2,
		complex, dimension(*)	work,
		integer	lwork,
		integer	info )

CUNBDB6

Download CUNBDB6 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNBDB6 orthogonalizes the column vector
!>      X = [ X1 ]
!>          [ X2 ]
!> with respect to the columns of
!>      Q = [ Q1 ] .
!>          [ Q2 ]
!> The columns of Q must be orthonormal.
!>
!> If the projection is zero according to Kahan's "twice is enough"
!> criterion, then the zero vector is returned.
!>
!>

Parameters

[in]	M1	!> M1 is INTEGER !> The dimension of X1 and the number of rows in Q1. 0 <= M1. !>
[in]	M2	!> M2 is INTEGER !> The dimension of X2 and the number of rows in Q2. 0 <= M2. !>
[in]	N	!> N is INTEGER !> The number of columns in Q1 and Q2. 0 <= N. !>
[in,out]	X1	!> X1 is COMPLEX array, dimension (M1) !> On entry, the top part of the vector to be orthogonalized. !> On exit, the top part of the projected vector. !>
[in]	INCX1	!> INCX1 is INTEGER !> Increment for entries of X1. !>
[in,out]	X2	!> X2 is COMPLEX array, dimension (M2) !> On entry, the bottom part of the vector to be !> orthogonalized. On exit, the bottom part of the projected !> vector. !>
[in]	INCX2	!> INCX2 is INTEGER !> Increment for entries of X2. !>
[in]	Q1	!> Q1 is COMPLEX array, dimension (LDQ1, N) !> The top part of the orthonormal basis matrix. !>
[in]	LDQ1	!> LDQ1 is INTEGER !> The leading dimension of Q1. LDQ1 >= MAX(1,M1). !>
[in]	Q2	!> Q2 is COMPLEX array, dimension (LDQ2, N) !> The bottom part of the orthonormal basis matrix. !>
[in]	LDQ2	!> LDQ2 is INTEGER !> The leading dimension of Q2. LDQ2 >= MAX(1,M2). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (LWORK) !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= N. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 152 of file cunbdb6.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Projects X = [ X1; X2 ] onto the orthogonal complement of the
*     column space of Q = [ Q1; Q2 ] with at most two Gram-Schmidt
*     passes:
*        WORK := Q1**H * X1 + Q2**H * X2,   X := X - Q * WORK.
*     After each pass the squared norm of X is compared with ALPHASQ
*     times the squared norm before the pass.  If the second pass
*     still shrinks X below that threshold, X is set to zero.
*
*     Logical entry k of X1 is stored at X1(1+(k-1)*INCX1), and
*     likewise for X2 with INCX2.
*
*     .. Scalar Arguments ..
      INTEGER            INCX1, INCX2, INFO, LDQ1, LDQ2, LWORK, M1, M2,
     $                   N
*     ..
*     .. Array Arguments ..
      COMPLEX            Q1(LDQ1,*), Q2(LDQ2,*), WORK(*), X1(*), X2(*)
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ALPHASQ, REALONE, REALZERO
      parameter( alphasq = 0.01e0, realone = 1.0e0,
     $                     realzero = 0.0e0 )
      COMPLEX            NEGONE, ONE, ZERO
      parameter( negone = (-1.0e0,0.0e0), one = (1.0e0,0.0e0),
     $                     zero = (0.0e0,0.0e0) )
*     ..
*     .. Local Scalars ..
      INTEGER            I
      REAL               NORMSQ1, NORMSQ2, SCL1, SCL2, SSQ1, SSQ2
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgemv, classq, xerbla
*     ..
*     .. Intrinsic Function ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Test input arguments (INFO = -k flags the k-th argument)
*
      info = 0
      IF( m1 .LT. 0 ) THEN
         info = -1
      ELSE IF( m2 .LT. 0 ) THEN
         info = -2
      ELSE IF( n .LT. 0 ) THEN
         info = -3
      ELSE IF( incx1 .LT. 1 ) THEN
         info = -5
      ELSE IF( incx2 .LT. 1 ) THEN
         info = -7
      ELSE IF( ldq1 .LT. max( 1, m1 ) ) THEN
         info = -9
      ELSE IF( ldq2 .LT. max( 1, m2 ) ) THEN
         info = -11
      ELSE IF( lwork .LT. n ) THEN
         info = -13
      END IF
*
      IF( info .NE. 0 ) THEN
         CALL xerbla( 'CUNBDB6', -info )
         RETURN
      END IF
*
*     First, project X onto the orthogonal complement of Q's column
*     space
*
*     NORMSQ1 = ||X1||**2 + ||X2||**2 before the first pass
*
      scl1 = realzero
      ssq1 = realone
      CALL classq( m1, x1, incx1, scl1, ssq1 )
      scl2 = realzero
      ssq2 = realone
      CALL classq( m2, x2, incx2, scl2, ssq2 )
      normsq1 = scl1**2*ssq1 + scl2**2*ssq2
*
*     WORK := Q1**H * X1.  WORK is cleared by hand when M1 = 0 so that
*     the accumulating CGEMV below starts from zero.
*
      IF( m1 .EQ. 0 ) THEN
         DO i = 1, n
            work(i) = zero
         END DO
      ELSE
         CALL cgemv( 'C', m1, n, one, q1, ldq1, x1, incx1, zero, work,
     $               1 )
      END IF
*
*     WORK := WORK + Q2**H * X2
*
      CALL cgemv( 'C', m2, n, one, q2, ldq2, x2, incx2, one, work, 1 )
*
*     X := X - Q * WORK
*
      CALL cgemv( 'N', m1, n, negone, q1, ldq1, work, 1, one, x1,
     $            incx1 )
      CALL cgemv( 'N', m2, n, negone, q2, ldq2, work, 1, one, x2,
     $            incx2 )
*
*     NORMSQ2 = ||X1||**2 + ||X2||**2 after the first pass
*
      scl1 = realzero
      ssq1 = realone
      CALL classq( m1, x1, incx1, scl1, ssq1 )
      scl2 = realzero
      ssq2 = realone
      CALL classq( m2, x2, incx2, scl2, ssq2 )
      normsq2 = scl1**2*ssq1 + scl2**2*ssq2
*
*     If projection is sufficiently large in norm, then stop.
*     If projection is zero, then stop.
*     Otherwise, project again.
*
      IF( normsq2 .GE. alphasq*normsq1 ) THEN
         RETURN
      END IF
*
      IF( normsq2 .EQ. realzero ) THEN
         RETURN
      END IF
*
      normsq1 = normsq2
*
      DO i = 1, n
         work(i) = zero
      END DO
*
      IF( m1 .EQ. 0 ) THEN
         DO i = 1, n
            work(i) = zero
         END DO
      ELSE
         CALL cgemv( 'C', m1, n, one, q1, ldq1, x1, incx1, zero, work,
     $               1 )
      END IF
*
      CALL cgemv( 'C', m2, n, one, q2, ldq2, x2, incx2, one, work, 1 )
*
      CALL cgemv( 'N', m1, n, negone, q1, ldq1, work, 1, one, x1,
     $            incx1 )
      CALL cgemv( 'N', m2, n, negone, q2, ldq2, work, 1, one, x2,
     $            incx2 )
*
*     NORMSQ2 after the second pass.  Both halves of X must enter the
*     sum: X1 through (SCL1,SSQ1) and X2 through (SCL2,SSQ2).
*
      scl1 = realzero
      ssq1 = realone
      CALL classq( m1, x1, incx1, scl1, ssq1 )
      scl2 = realzero
      ssq2 = realone
      CALL classq( m2, x2, incx2, scl2, ssq2 )
      normsq2 = scl1**2*ssq1 + scl2**2*ssq2
*
*     If second projection is sufficiently large in norm, then do
*     nothing more. Alternatively, if it shrunk significantly, then
*     truncate it to zero.
*
      IF( normsq2 .LT. alphasq*normsq1 ) THEN
         DO i = 1, m1
            x1(1+(i-1)*incx1) = zero
         END DO
         DO i = 1, m2
            x2(1+(i-1)*incx2) = zero
         END DO
      END IF
*
      RETURN
*
*     End of CUNBDB6
*

◆ cuncsd()

recursive subroutine cuncsd	(	character	jobu1,
		character	jobu2,
		character	jobv1t,
		character	jobv2t,
		character	trans,
		character	signs,
		integer	m,
		integer	p,
		integer	q,
		complex, dimension( ldx11, * )	x11,
		integer	ldx11,
		complex, dimension( ldx12, * )	x12,
		integer	ldx12,
		complex, dimension( ldx21, * )	x21,
		integer	ldx21,
		complex, dimension( ldx22, * )	x22,
		integer	ldx22,
		real, dimension( * )	theta,
		complex, dimension( ldu1, * )	u1,
		integer	ldu1,
		complex, dimension( ldu2, * )	u2,
		integer	ldu2,
		complex, dimension( ldv1t, * )	v1t,
		integer	ldv1t,
		complex, dimension( ldv2t, * )	v2t,
		integer	ldv2t,
		complex, dimension( * )	work,
		integer	lwork,
		real, dimension( * )	rwork,
		integer	lrwork,
		integer, dimension( * )	iwork,
		integer	info )

CUNCSD

Download CUNCSD + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNCSD computes the CS decomposition of an M-by-M partitioned
!> unitary matrix X:
!>
!>                                 [  I  0  0 |  0  0  0 ]
!>                                 [  0  C  0 |  0 -S  0 ]
!>     [ X11 | X12 ]   [ U1 |    ] [  0  0  0 |  0  0 -I ] [ V1 |    ]**H
!> X = [-----------] = [---------] [---------------------] [---------]   .
!>     [ X21 | X22 ]   [    | U2 ] [  0  0  0 |  I  0  0 ] [    | V2 ]
!>                                 [  0  S  0 |  0  C  0 ]
!>                                 [  0  0  I |  0  0  0 ]
!>
!> X11 is P-by-Q. The unitary matrices U1, U2, V1, and V2 are P-by-P,
!> (M-P)-by-(M-P), Q-by-Q, and (M-Q)-by-(M-Q), respectively. C and S are
!> R-by-R nonnegative diagonal matrices satisfying C^2 + S^2 = I, in
!> which R = MIN(P,M-P,Q,M-Q).
!>

Parameters

[in]	JOBU1	!> JOBU1 is CHARACTER !> = 'Y': U1 is computed; !> otherwise: U1 is not computed. !>
[in]	JOBU2	!> JOBU2 is CHARACTER !> = 'Y': U2 is computed; !> otherwise: U2 is not computed. !>
[in]	JOBV1T	!> JOBV1T is CHARACTER !> = 'Y': V1T is computed; !> otherwise: V1T is not computed. !>
[in]	JOBV2T	!> JOBV2T is CHARACTER !> = 'Y': V2T is computed; !> otherwise: V2T is not computed. !>
[in]	TRANS	!> TRANS is CHARACTER !> = 'T': X, U1, U2, V1T, and V2T are stored in row-major !> order; !> otherwise: X, U1, U2, V1T, and V2T are stored in column- !> major order. !>
[in]	SIGNS	!> SIGNS is CHARACTER !> = 'O': The lower-left block is made nonpositive (the !> "other" convention); !> otherwise: The upper-right block is made nonpositive (the !> "default" convention). !>
[in]	M	!> M is INTEGER !> The number of rows and columns in X. !>
[in]	P	!> P is INTEGER !> The number of rows in X11 and X12. 0 <= P <= M. !>
[in]	Q	!> Q is INTEGER !> The number of columns in X11 and X21. 0 <= Q <= M. !>
[in,out]	X11	!> X11 is COMPLEX array, dimension (LDX11,Q) !> On entry, part of the unitary matrix whose CSD is desired. !>
[in]	LDX11	!> LDX11 is INTEGER !> The leading dimension of X11. LDX11 >= MAX(1,P). !>
[in,out]	X12	!> X12 is COMPLEX array, dimension (LDX12,M-Q) !> On entry, part of the unitary matrix whose CSD is desired. !>
[in]	LDX12	!> LDX12 is INTEGER !> The leading dimension of X12. LDX12 >= MAX(1,P). !>
[in,out]	X21	!> X21 is COMPLEX array, dimension (LDX21,Q) !> On entry, part of the unitary matrix whose CSD is desired. !>
[in]	LDX21	!> LDX21 is INTEGER !> The leading dimension of X21. LDX21 >= MAX(1,M-P). !>
[in,out]	X22	!> X22 is COMPLEX array, dimension (LDX22,M-Q) !> On entry, part of the unitary matrix whose CSD is desired. !>
[in]	LDX22	!> LDX22 is INTEGER !> The leading dimension of X22. LDX22 >= MAX(1,M-P). !>
[out]	THETA	!> THETA is REAL array, dimension (R), in which R = !> MIN(P,M-P,Q,M-Q). !> C = DIAG( COS(THETA(1)), ... , COS(THETA(R)) ) and !> S = DIAG( SIN(THETA(1)), ... , SIN(THETA(R)) ). !>
[out]	U1	!> U1 is COMPLEX array, dimension (LDU1,P) !> If JOBU1 = 'Y', U1 contains the P-by-P unitary matrix U1. !>
[in]	LDU1	!> LDU1 is INTEGER !> The leading dimension of U1. If JOBU1 = 'Y', LDU1 >= !> MAX(1,P). !>
[out]	U2	!> U2 is COMPLEX array, dimension (LDU2,M-P) !> If JOBU2 = 'Y', U2 contains the (M-P)-by-(M-P) unitary !> matrix U2. !>
[in]	LDU2	!> LDU2 is INTEGER !> The leading dimension of U2. If JOBU2 = 'Y', LDU2 >= !> MAX(1,M-P). !>
[out]	V1T	!> V1T is COMPLEX array, dimension (LDV1T,Q) !> If JOBV1T = 'Y', V1T contains the Q-by-Q unitary !> matrix V1**H. !>
[in]	LDV1T	!> LDV1T is INTEGER !> The leading dimension of V1T. If JOBV1T = 'Y', LDV1T >= !> MAX(1,Q). !>
[out]	V2T	!> V2T is COMPLEX array, dimension (LDV2T,M-Q) !> If JOBV2T = 'Y', V2T contains the (M-Q)-by-(M-Q) unitary !> matrix V2**H. !>
[in]	LDV2T	!> LDV2T is INTEGER !> The leading dimension of V2T. If JOBV2T = 'Y', LDV2T >= !> MAX(1,M-Q). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the work array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	RWORK	!> RWORK is REAL array, dimension MAX(1,LRWORK) !> On exit, if INFO = 0, RWORK(1) returns the optimal LRWORK. !> If INFO > 0 on exit, RWORK(2:R) contains the values PHI(1), !> ..., PHI(R-1) that, together with THETA(1), ..., THETA(R), !> define the matrix in intermediate bidiagonal-block form !> remaining after nonconvergence. INFO specifies the number !> of nonzero PHI's. !>
[in]	LRWORK	!> LRWORK is INTEGER !> The dimension of the array RWORK. !> !> If LRWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the RWORK array, returns !> this value as the first entry of the RWORK array, and no error !> message related to LRWORK is issued by XERBLA. !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (M-MIN(P,M-P,Q,M-Q)) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: CBBCSD did not converge. See the description of RWORK !> above for details. !>

References:: [1] Brian D. Sutton. Computing the complete CS decomposition. Numer. Algorithms, 50(1):33-65, 2009.

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 314 of file cuncsd.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Driver outline:
*       1. validate the arguments;
*       2. if MIN(P,M-P) < MIN(Q,M-Q), or if M-Q < Q, recurse on a
*          transposed / block-permuted problem;
*       3. size the real and complex workspaces through workspace
*          queries to CBBCSD, CUNGQR, CUNGLQ and CUNBDB;
*       4. reduce X to bidiagonal-block form (CUNBDB);
*       5. form the requested unitary factors (CUNGQR / CUNGLQ);
*       6. compute the CSD of the bidiagonal-block form (CBBCSD);
*       7. permute U2 and V2T (CLAPMT / CLAPMR).
*
*     .. Scalar Arguments ..
      CHARACTER          JOBU1, JOBU2, JOBV1T, JOBV2T, SIGNS, TRANS
      INTEGER            INFO, LDU1, LDU2, LDV1T, LDV2T, LDX11, LDX12,
     $                   LDX21, LDX22, LRWORK, LWORK, M, P, Q
*     ..
*     .. Array Arguments ..
      INTEGER            IWORK( * )
      REAL               THETA( * )
      REAL               RWORK( * )
      COMPLEX            U1( LDU1, * ), U2( LDU2, * ), V1T( LDV1T, * ),
     $                   V2T( LDV2T, * ), WORK( * ), X11( LDX11, * ),
     $                   X12( LDX12, * ), X21( LDX21, * ), X22( LDX22,
     $                   * )
*     ..
*
*  ===================================================================
*
*     .. Parameters ..
      COMPLEX            ONE, ZERO
      parameter( one = (1.0e0,0.0e0),
     $                     zero = (0.0e0,0.0e0) )
*     ..
*     .. Local Scalars ..
      CHARACTER          TRANST, SIGNST
      INTEGER            CHILDINFO, I, IB11D, IB11E, IB12D, IB12E,
     $                   IB21D, IB21E, IB22D, IB22E, IBBCSD, IORBDB,
     $                   IORGLQ, IORGQR, IPHI, ITAUP1, ITAUP2, ITAUQ1,
     $                   ITAUQ2, J, LBBCSDWORK, LBBCSDWORKMIN,
     $                   LBBCSDWORKOPT, LORBDBWORK, LORBDBWORKMIN,
     $                   LORBDBWORKOPT, LORGLQWORK, LORGLQWORKMIN,
     $                   LORGLQWORKOPT, LORGQRWORK, LORGQRWORKMIN,
     $                   LORGQRWORKOPT, LWORKMIN, LWORKOPT, P1, Q1
      LOGICAL            COLMAJOR, DEFAULTSIGNS, LQUERY, WANTU1, WANTU2,
     $                   WANTV1T, WANTV2T
      INTEGER            LRWORKMIN, LRWORKOPT
      LOGICAL            LRQUERY
*     ..
*     .. External Subroutines ..
      EXTERNAL           xerbla, cbbcsd, clacpy, clapmr, clapmt,
     $                   cunbdb, cunglq, cungqr
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. Intrinsic Functions
      INTRINSIC          int, max, min
*     ..
*     .. Executable Statements ..
*
*     Test input arguments (INFO = -k flags the k-th argument)
*
      info = 0
      wantu1 = lsame( jobu1, 'Y' )
      wantu2 = lsame( jobu2, 'Y' )
      wantv1t = lsame( jobv1t, 'Y' )
      wantv2t = lsame( jobv2t, 'Y' )
      colmajor = .NOT. lsame( trans, 'T' )
      defaultsigns = .NOT. lsame( signs, 'O' )
      lquery = lwork .EQ. -1
      lrquery = lrwork .EQ. -1
      IF( m .LT. 0 ) THEN
         info = -7
      ELSE IF( p .LT. 0 .OR. p .GT. m ) THEN
         info = -8
      ELSE IF( q .LT. 0 .OR. q .GT. m ) THEN
         info = -9
      ELSE IF ( colmajor .AND.  ldx11 .LT. max( 1, p ) ) THEN
        info = -11
      ELSE IF (.NOT. colmajor .AND. ldx11 .LT. max( 1, q ) ) THEN
        info = -11
      ELSE IF (colmajor .AND. ldx12 .LT. max( 1, p ) ) THEN
        info = -13
      ELSE IF (.NOT. colmajor .AND. ldx12 .LT. max( 1, m-q ) ) THEN
        info = -13
      ELSE IF (colmajor .AND. ldx21 .LT. max( 1, m-p ) ) THEN
        info = -15
      ELSE IF (.NOT. colmajor .AND. ldx21 .LT. max( 1, q ) ) THEN
        info = -15
      ELSE IF (colmajor .AND. ldx22 .LT. max( 1, m-p ) ) THEN
        info = -17
      ELSE IF (.NOT. colmajor .AND. ldx22 .LT. max( 1, m-q ) ) THEN
        info = -17
      ELSE IF( wantu1 .AND. ldu1 .LT. p ) THEN
         info = -20
      ELSE IF( wantu2 .AND. ldu2 .LT. m-p ) THEN
         info = -22
      ELSE IF( wantv1t .AND. ldv1t .LT. q ) THEN
         info = -24
      ELSE IF( wantv2t .AND. ldv2t .LT. m-q ) THEN
         info = -26
      END IF
*
*     Work with transpose if convenient
*
      IF( info .EQ. 0 .AND. min( p, m-p ) .LT. min( q, m-q ) ) THEN
         IF( colmajor ) THEN
            transt = 'T'
         ELSE
            transt = 'N'
         END IF
         IF( defaultsigns ) THEN
            signst = 'O'
         ELSE
            signst = 'D'
         END IF
         CALL cuncsd( jobv1t, jobv2t, jobu1, jobu2, transt, signst, m,
     $                q, p, x11, ldx11, x21, ldx21, x12, ldx12, x22,
     $                ldx22, theta, v1t, ldv1t, v2t, ldv2t, u1, ldu1,
     $                u2, ldu2, work, lwork, rwork, lrwork, iwork,
     $                info )
         RETURN
      END IF
*
*     Work with permutation [ 0 I; I 0 ] * X * [ 0 I; I 0 ] if
*     convenient
*
      IF( info .EQ. 0 .AND. m-q .LT. q ) THEN
         IF( defaultsigns ) THEN
            signst = 'O'
         ELSE
            signst = 'D'
         END IF
         CALL cuncsd( jobu2, jobu1, jobv2t, jobv1t, trans, signst, m,
     $                m-p, m-q, x22, ldx22, x21, ldx21, x12, ldx12, x11,
     $                ldx11, theta, u2, ldu2, u1, ldu1, v2t, ldv2t, v1t,
     $                ldv1t, work, lwork, rwork, lrwork, iwork, info )
         RETURN
      END IF
*
*     Compute workspace
*
      IF( info .EQ. 0 ) THEN
*
*        Real workspace
*
*        RWORK(1) holds the size returned to the caller; PHI and the
*        eight bidiagonal arrays passed to CBBCSD follow, then the
*        CBBCSD scratch area.
*
         iphi = 2
         ib11d = iphi + max( 1, q - 1 )
         ib11e = ib11d + max( 1, q )
         ib12d = ib11e + max( 1, q - 1 )
         ib12e = ib12d + max( 1, q )
         ib21d = ib12e + max( 1, q - 1 )
         ib21e = ib21d + max( 1, q )
         ib22d = ib21e + max( 1, q - 1 )
         ib22e = ib22d + max( 1, q )
         ibbcsd = ib22e + max( 1, q - 1 )
         CALL cbbcsd( jobu1, jobu2, jobv1t, jobv2t, trans, m, p, q,
     $                theta, theta, u1, ldu1, u2, ldu2, v1t, ldv1t,
     $                v2t, ldv2t, theta, theta, theta, theta, theta,
     $                theta, theta, theta, rwork, -1, childinfo )
         lbbcsdworkopt = int( rwork(1) )
         lbbcsdworkmin = lbbcsdworkopt
         lrworkopt = ibbcsd + lbbcsdworkopt - 1
         lrworkmin = ibbcsd + lbbcsdworkmin - 1
         rwork(1) = lrworkopt
*
*        Complex workspace
*
*        WORK(1) holds the size returned to the caller; TAUP1, TAUP2,
*        TAUQ1 and TAUQ2 follow.  CUNGQR, CUNGLQ and CUNBDB all start
*        their scratch area at the same offset after TAUQ2.
*
         itaup1 = 2
         itaup2 = itaup1 + max( 1, p )
         itauq1 = itaup2 + max( 1, m - p )
         itauq2 = itauq1 + max( 1, q )
         iorgqr = itauq2 + max( 1, m - q )
         CALL cungqr( m-q, m-q, m-q, u1, max(1,m-q), u1, work, -1,
     $                childinfo )
         lorgqrworkopt = int( work(1) )
         lorgqrworkmin = max( 1, m - q )
         iorglq = itauq2 + max( 1, m - q )
         CALL cunglq( m-q, m-q, m-q, u1, max(1,m-q), u1, work, -1,
     $                childinfo )
         lorglqworkopt = int( work(1) )
         lorglqworkmin = max( 1, m - q )
         iorbdb = itauq2 + max( 1, m - q )
         CALL cunbdb( trans, signs, m, p, q, x11, ldx11, x12, ldx12,
     $                x21, ldx21, x22, ldx22, theta, theta, u1, u2,
     $                v1t, v2t, work, -1, childinfo )
         lorbdbworkopt = int( work(1) )
         lorbdbworkmin = lorbdbworkopt
         lworkopt = max( iorgqr + lorgqrworkopt, iorglq + lorglqworkopt,
     $              iorbdb + lorbdbworkopt ) - 1
         lworkmin = max( iorgqr + lorgqrworkmin, iorglq + lorglqworkmin,
     $              iorbdb + lorbdbworkmin ) - 1
         work(1) = max(lworkopt,lworkmin)
*
*        LWORK and LRWORK are the 28th and 30th arguments of CUNCSD,
*        so a too-small workspace is reported as -28 / -30.  (-22 and
*        -24 are already used above for LDU2 and LDV1T.)
*
         IF( lwork .LT. lworkmin
     $       .AND. .NOT. ( lquery .OR. lrquery ) ) THEN
            info = -28
         ELSE IF( lrwork .LT. lrworkmin
     $            .AND. .NOT. ( lquery .OR. lrquery ) ) THEN
            info = -30
         ELSE
            lorgqrwork = lwork - iorgqr + 1
            lorglqwork = lwork - iorglq + 1
            lorbdbwork = lwork - iorbdb + 1
            lbbcsdwork = lrwork - ibbcsd + 1
         END IF
      END IF
*
*     Abort if any illegal arguments
*
      IF( info .NE. 0 ) THEN
         CALL xerbla( 'CUNCSD', -info )
         RETURN
      ELSE IF( lquery .OR. lrquery ) THEN
         RETURN
      END IF
*
*     Transform to bidiagonal block form
*
      CALL cunbdb( trans, signs, m, p, q, x11, ldx11, x12, ldx12, x21,
     $             ldx21, x22, ldx22, theta, rwork(iphi), work(itaup1),
     $             work(itaup2), work(itauq1), work(itauq2),
     $             work(iorbdb), lorbdbwork, childinfo )
*
*     Accumulate Householder reflectors
*
      IF( colmajor ) THEN
         IF( wantu1 .AND. p .GT. 0 ) THEN
            CALL clacpy( 'L', p, q, x11, ldx11, u1, ldu1 )
            CALL cungqr( p, p, q, u1, ldu1, work(itaup1), work(iorgqr),
     $                   lorgqrwork, info)
         END IF
         IF( wantu2 .AND. m-p .GT. 0 ) THEN
            CALL clacpy( 'L', m-p, q, x21, ldx21, u2, ldu2 )
            CALL cungqr( m-p, m-p, q, u2, ldu2, work(itaup2),
     $                   work(iorgqr), lorgqrwork, info )
         END IF
         IF( wantv1t .AND. q .GT. 0 ) THEN
            CALL clacpy( 'U', q-1, q-1, x11(1,2), ldx11, v1t(2,2),
     $                   ldv1t )
*           First row and column of V1T are set to those of the
*           identity; only the trailing (Q-1)-by-(Q-1) block is
*           generated by CUNGLQ.
            v1t(1, 1) = one
            DO j = 2, q
               v1t(1,j) = zero
               v1t(j,1) = zero
            END DO
            CALL cunglq( q-1, q-1, q-1, v1t(2,2), ldv1t, work(itauq1),
     $                   work(iorglq), lorglqwork, info )
         END IF
         IF( wantv2t .AND. m-q .GT. 0 ) THEN
            CALL clacpy( 'U', p, m-q, x12, ldx12, v2t, ldv2t )
            IF( m-p .GT. q ) THEN
               CALL clacpy( 'U', m-p-q, m-p-q, x22(q+1,p+1), ldx22,
     $                      v2t(p+1,p+1), ldv2t )
            END IF
            IF( m .GT. q ) THEN
               CALL cunglq( m-q, m-q, m-q, v2t, ldv2t, work(itauq2),
     $                      work(iorglq), lorglqwork, info )
            END IF
         END IF
      ELSE
         IF( wantu1 .AND. p .GT. 0 ) THEN
            CALL clacpy( 'U', q, p, x11, ldx11, u1, ldu1 )
            CALL cunglq( p, p, q, u1, ldu1, work(itaup1), work(iorglq),
     $                   lorglqwork, info)
         END IF
         IF( wantu2 .AND. m-p .GT. 0 ) THEN
            CALL clacpy( 'U', q, m-p, x21, ldx21, u2, ldu2 )
            CALL cunglq( m-p, m-p, q, u2, ldu2, work(itaup2),
     $                   work(iorglq), lorglqwork, info )
         END IF
         IF( wantv1t .AND. q .GT. 0 ) THEN
            CALL clacpy( 'L', q-1, q-1, x11(2,1), ldx11, v1t(2,2),
     $                   ldv1t )
            v1t(1, 1) = one
            DO j = 2, q
               v1t(1,j) = zero
               v1t(j,1) = zero
            END DO
            CALL cungqr( q-1, q-1, q-1, v1t(2,2), ldv1t, work(itauq1),
     $                   work(iorgqr), lorgqrwork, info )
         END IF
         IF( wantv2t .AND. m-q .GT. 0 ) THEN
*           P1 and Q1 are P+1 and Q+1 capped at M
            p1 = min( p+1, m )
            q1 = min( q+1, m )
            CALL clacpy( 'L', m-q, p, x12, ldx12, v2t, ldv2t )
            IF ( m .GT. p+q ) THEN
               CALL clacpy( 'L', m-p-q, m-p-q, x22(p1,q1), ldx22,
     $                      v2t(p+1,p+1), ldv2t )
            END IF
            CALL cungqr( m-q, m-q, m-q, v2t, ldv2t, work(itauq2),
     $                   work(iorgqr), lorgqrwork, info )
         END IF
      END IF
*
*     Compute the CSD of the matrix in bidiagonal-block form
*
      CALL cbbcsd( jobu1, jobu2, jobv1t, jobv2t, trans, m, p, q, theta,
     $             rwork(iphi), u1, ldu1, u2, ldu2, v1t, ldv1t, v2t,
     $             ldv2t, rwork(ib11d), rwork(ib11e), rwork(ib12d),
     $             rwork(ib12e), rwork(ib21d), rwork(ib21e),
     $             rwork(ib22d), rwork(ib22e), rwork(ibbcsd),
     $             lbbcsdwork, info )
*
*     Permute rows and columns to place identity submatrices in top-
*     left corner of (1,1)-block and/or bottom-right corner of (1,2)-
*     block and/or bottom-right corner of (2,1)-block and/or top-left
*     corner of (2,2)-block
*
      IF( q .GT. 0 .AND. wantu2 ) THEN
         DO i = 1, q
            iwork(i) = m - p - q + i
         END DO
         DO i = q + 1, m - p
            iwork(i) = i - q
         END DO
         IF( colmajor ) THEN
            CALL clapmt( .false., m-p, m-p, u2, ldu2, iwork )
         ELSE
            CALL clapmr( .false., m-p, m-p, u2, ldu2, iwork )
         END IF
      END IF
      IF( m .GT. 0 .AND. wantv2t ) THEN
         DO i = 1, p
            iwork(i) = m - p - q + i
         END DO
         DO i = p + 1, m - q
            iwork(i) = i - p
         END DO
         IF( .NOT. colmajor ) THEN
            CALL clapmt( .false., m-q, m-q, v2t, ldv2t, iwork )
         ELSE
            CALL clapmr( .false., m-q, m-q, v2t, ldv2t, iwork )
         END IF
      END IF
*
      RETURN
*
*     End CUNCSD
*

◆ cuncsd2by1()

subroutine cuncsd2by1	(	character	jobu1,
		character	jobu2,
		character	jobv1t,
		integer	m,
		integer	p,
		integer	q,
		complex, dimension(ldx11,*)	x11,
		integer	ldx11,
		complex, dimension(ldx21,*)	x21,
		integer	ldx21,
		real, dimension(*)	theta,
		complex, dimension(ldu1,*)	u1,
		integer	ldu1,
		complex, dimension(ldu2,*)	u2,
		integer	ldu2,
		complex, dimension(ldv1t,*)	v1t,
		integer	ldv1t,
		complex, dimension(*)	work,
		integer	lwork,
		real, dimension(*)	rwork,
		integer	lrwork,
		integer, dimension(*)	iwork,
		integer	info )

CUNCSD2BY1

Download CUNCSD2BY1 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNCSD2BY1 computes the CS decomposition of an M-by-Q matrix X with
!> orthonormal columns that has been partitioned into a 2-by-1 block
!> structure:
!>
!>                                [  I1 0  0 ]
!>                                [  0  C  0 ]
!>          [ X11 ]   [ U1 |    ] [  0  0  0 ]
!>      X = [-----] = [---------] [----------] V1**T .
!>          [ X21 ]   [    | U2 ] [  0  0  0 ]
!>                                [  0  S  0 ]
!>                                [  0  0  I2]
!>
!> X11 is P-by-Q. The unitary matrices U1, U2, and V1 are P-by-P,
!> (M-P)-by-(M-P), and Q-by-Q, respectively. C and S are R-by-R
!> nonnegative diagonal matrices satisfying C^2 + S^2 = I, in which
!> R = MIN(P,M-P,Q,M-Q). I1 is a K1-by-K1 identity matrix and I2 is a
!> K2-by-K2 identity matrix, where K1 = MAX(Q+P-M,0), K2 = MAX(Q-P,0).
!>
!>

Parameters

[in]	JOBU1	!> JOBU1 is CHARACTER !> = 'Y': U1 is computed; !> otherwise: U1 is not computed. !>
[in]	JOBU2	!> JOBU2 is CHARACTER !> = 'Y': U2 is computed; !> otherwise: U2 is not computed. !>
[in]	JOBV1T	!> JOBV1T is CHARACTER !> = 'Y': V1T is computed; !> otherwise: V1T is not computed. !>
[in]	M	!> M is INTEGER !> The number of rows in X. !>
[in]	P	!> P is INTEGER !> The number of rows in X11. 0 <= P <= M. !>
[in]	Q	!> Q is INTEGER !> The number of columns in X11 and X21. 0 <= Q <= M. !>
[in,out]	X11	!> X11 is COMPLEX array, dimension (LDX11,Q) !> On entry, part of the unitary matrix whose CSD is desired. !>
[in]	LDX11	!> LDX11 is INTEGER !> The leading dimension of X11. LDX11 >= MAX(1,P). !>
[in,out]	X21	!> X21 is COMPLEX array, dimension (LDX21,Q) !> On entry, part of the unitary matrix whose CSD is desired. !>
[in]	LDX21	!> LDX21 is INTEGER !> The leading dimension of X21. LDX21 >= MAX(1,M-P). !>
[out]	THETA	!> THETA is REAL array, dimension (R), in which R = !> MIN(P,M-P,Q,M-Q). !> C = DIAG( COS(THETA(1)), ... , COS(THETA(R)) ) and !> S = DIAG( SIN(THETA(1)), ... , SIN(THETA(R)) ). !>
[out]	U1	!> U1 is COMPLEX array, dimension (LDU1,P) !> If JOBU1 = 'Y', U1 contains the P-by-P unitary matrix U1. !>
[in]	LDU1	!> LDU1 is INTEGER !> The leading dimension of U1. If JOBU1 = 'Y', LDU1 >= !> MAX(1,P). !>
[out]	U2	!> U2 is COMPLEX array, dimension (LDU2,M-P) !> If JOBU2 = 'Y', U2 contains the (M-P)-by-(M-P) unitary !> matrix U2. !>
[in]	LDU2	!> LDU2 is INTEGER !> The leading dimension of U2. If JOBU2 = 'Y', LDU2 >= !> MAX(1,M-P). !>
[out]	V1T	!> V1T is COMPLEX array, dimension (LDV1T,Q) !> If JOBV1T = 'Y', V1T contains the Q-by-Q unitary !> matrix V1**T. !>
[in]	LDV1T	!> LDV1T is INTEGER !> The leading dimension of V1T. If JOBV1T = 'Y', LDV1T >= !> MAX(1,Q). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK and RWORK !> arrays, returns this value as the first entry of the WORK !> and RWORK array, respectively, and no error message related !> to LWORK or LRWORK is issued by XERBLA. !>
[out]	RWORK	!> RWORK is REAL array, dimension (MAX(1,LRWORK)) !> On exit, if INFO = 0, RWORK(1) returns the optimal LRWORK. !> If INFO > 0 on exit, RWORK(2:R) contains the values PHI(1), !> ..., PHI(R-1) that, together with THETA(1), ..., THETA(R), !> define the matrix in intermediate bidiagonal-block form !> remaining after nonconvergence. INFO specifies the number !> of nonzero PHI's. !>
[in]	LRWORK	!> LRWORK is INTEGER !> The dimension of the array RWORK. !> !> If LRWORK=-1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK and RWORK !> arrays, returns this value as the first entry of the WORK !> and RWORK array, respectively, and no error message related !> to LWORK or LRWORK is issued by XERBLA. !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (M-MIN(P,M-P,Q,M-Q)) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> < 0: if INFO = -i, the i-th argument had an illegal value. !> > 0: CBBCSD did not converge. See the description of RWORK !> above for details. !>

References:: [1] Brian D. Sutton. Computing the complete CS decomposition. Numer. Algorithms, 50(1):33-65, 2009.

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 253 of file cuncsd2by1.f.

*
*  Purpose
*  =======
*
*  CUNCSD2BY1 computes the CS decomposition of an M-by-Q matrix X
*  with orthonormal columns, partitioned as [ X11 ; X21 ] with X11
*  being P-by-Q.  The computation is split into four cases selected
*  by R = MIN(P,M-P,Q,M-Q).  Each case
*    1. bidiagonalizes X11 and X21 simultaneously (CUNBDB1..4),
*    2. accumulates the Householder reflectors into U1, U2 and V1T
*       (CUNGQR / CUNGLQ) when they are requested,
*    3. diagonalizes the bidiagonal blocks with CBBCSD, and
*    4. permutes rows/columns of the requested factors.
*
*  Arguments (summary)
*  ===================
*
*    JOBU1, JOBU2, JOBV1T  'Y' requests U1, U2, V1T respectively.
*    M, P, Q               rows of X, rows of X11, columns of X.
*    X11, X21              (in/out) the two blocks of X.
*    LDX11, LDX21          leading dimensions of X11 and X21.
*    THETA                 (out) angles defining C and S.
*    U1, U2, V1T           (out) the requested unitary factors.
*    LDU1, LDU2, LDV1T     leading dimensions of U1, U2 and V1T.
*    WORK, LWORK           complex workspace; LWORK = -1 is a query.
*    RWORK, LRWORK         real workspace; LRWORK = -1 is a query.
*    IWORK                 integer workspace for the permutations.
*    INFO                  = 0: success.
*                          < 0: argument -INFO had an illegal value.
*                          > 0: value returned by CBBCSD when it
*                               did not converge.
*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          JOBU1, JOBU2, JOBV1T
      INTEGER            INFO, LDU1, LDU2, LDV1T, LWORK, LDX11, LDX21,
     $                   M, P, Q
      INTEGER            LRWORK, LRWORKMIN, LRWORKOPT
*     ..
*     .. Array Arguments ..
      REAL               RWORK(*)
      REAL               THETA(*)
      COMPLEX            U1(LDU1,*), U2(LDU2,*), V1T(LDV1T,*), WORK(*),
     $                   X11(LDX11,*), X21(LDX21,*)
      INTEGER            IWORK(*)
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE, ZERO
      parameter( one = (1.0e0,0.0e0), zero = (0.0e0,0.0e0) )
*     ..
*     .. Local Scalars ..
      INTEGER            CHILDINFO, I, IB11D, IB11E, IB12D, IB12E,
     $                   IB21D, IB21E, IB22D, IB22E, IBBCSD, IORBDB,
     $                   IORGLQ, IORGQR, IPHI, ITAUP1, ITAUP2, ITAUQ1,
     $                   J, LBBCSD, LORBDB, LORGLQ, LORGLQMIN,
     $                   LORGLQOPT, LORGQR, LORGQRMIN, LORGQROPT,
     $                   LWORKMIN, LWORKOPT, R
      LOGICAL            LQUERY, WANTU1, WANTU2, WANTV1T
*     ..
*     .. Local Arrays ..
      REAL               DUM( 1 )
      COMPLEX            CDUM( 1, 1 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           cbbcsd, ccopy, clacpy, clapmr, clapmt, cunbdb1,
     $                   cunbdb2, cunbdb3, cunbdb4, cunglq, cungqr,
     $                   xerbla
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. Intrinsic Function ..
      INTRINSIC          int, max, min
*     ..
*     .. Executable Statements ..
*
*     Test input arguments
*
      info = 0
      wantu1 = lsame( jobu1, 'Y' )
      wantu2 = lsame( jobu2, 'Y' )
      wantv1t = lsame( jobv1t, 'Y' )
*     Either workspace length equal to -1 turns the call into a query
      lquery = ( lwork.EQ.-1 ) .OR. ( lrwork.EQ.-1 )
*
      IF( m .LT. 0 ) THEN
         info = -4
      ELSE IF( p .LT. 0 .OR. p .GT. m ) THEN
         info = -5
      ELSE IF( q .LT. 0 .OR. q .GT. m ) THEN
         info = -6
      ELSE IF( ldx11 .LT. max( 1, p ) ) THEN
         info = -8
      ELSE IF( ldx21 .LT. max( 1, m-p ) ) THEN
         info = -10
      ELSE IF( wantu1 .AND. ldu1 .LT. max( 1, p ) ) THEN
         info = -13
      ELSE IF( wantu2 .AND. ldu2 .LT. max( 1, m - p ) ) THEN
         info = -15
      ELSE IF( wantv1t .AND. ldv1t .LT. max( 1, q ) ) THEN
         info = -17
      END IF
*
      r = min( p, m-p, q, m-q )
*
*     Compute workspace
*
*       WORK layout:
*     |-----------------------------------------|
*     | LWORKOPT (1)                            |
*     |-----------------------------------------|
*     | TAUP1 (MAX(1,P))                        |
*     | TAUP2 (MAX(1,M-P))                      |
*     | TAUQ1 (MAX(1,Q))                        |
*     |-----------------------------------------|
*     | CUNBDB WORK | CUNGQR WORK | CUNGLQ WORK |
*     |             |             |             |
*     |             |             |             |
*     |             |             |             |
*     |             |             |             |
*     |-----------------------------------------|
*       RWORK layout:
*     |------------------|
*     | LRWORKOPT (1)    |
*     |------------------|
*     | PHI (MAX(1,R-1)) |
*     |------------------|
*     | B11D (R)         |
*     | B11E (R-1)       |
*     | B12D (R)         |
*     | B12E (R-1)       |
*     | B21D (R)         |
*     | B21E (R-1)       |
*     | B22D (R)         |
*     | B22E (R-1)       |
*     | CBBCSD RWORK     |
*     |------------------|
*
      IF( info .EQ. 0 ) THEN
*
*        Offsets into RWORK
*
         iphi = 2
         ib11d = iphi + max( 1, r-1 )
         ib11e = ib11d + max( 1, r )
         ib12d = ib11e + max( 1, r - 1 )
         ib12e = ib12d + max( 1, r )
         ib21d = ib12e + max( 1, r - 1 )
         ib21e = ib21d + max( 1, r )
         ib22d = ib21e + max( 1, r - 1 )
         ib22e = ib22d + max( 1, r )
         ibbcsd = ib22e + max( 1, r - 1 )
*
*        Offsets into WORK.  The CUNBDB, CUNGQR and CUNGLQ scratch
*        areas all start at the same position (they share storage).
*
         itaup1 = 2
         itaup2 = itaup1 + max( 1, p )
         itauq1 = itaup2 + max( 1, m-p )
         iorbdb = itauq1 + max( 1, q )
         iorgqr = itauq1 + max( 1, q )
         iorglq = itauq1 + max( 1, q )
         lorgqrmin = 1
         lorgqropt = 1
         lorglqmin = 1
         lorglqopt = 1
*
*        Workspace queries, using the same case split as the
*        computation below
*
         IF( r .EQ. q ) THEN
            CALL cunbdb1( m, p, q, x11, ldx11, x21, ldx21, theta,
     $                    dum, cdum, cdum, cdum, work, -1,
     $                    childinfo )
            lorbdb = int( work(1) )
            IF( wantu1 .AND. p .GT. 0 ) THEN
               CALL cungqr( p, p, q, u1, ldu1, cdum, work(1), -1,
     $                      childinfo )
               lorgqrmin = max( lorgqrmin, p )
               lorgqropt = max( lorgqropt, int( work(1) ) )
            ENDIF
            IF( wantu2 .AND. m-p .GT. 0 ) THEN
               CALL cungqr( m-p, m-p, q, u2, ldu2, cdum, work(1), -1,
     $                      childinfo )
               lorgqrmin = max( lorgqrmin, m-p )
               lorgqropt = max( lorgqropt, int( work(1) ) )
            END IF
            IF( wantv1t .AND. q .GT. 0 ) THEN
               CALL cunglq( q-1, q-1, q-1, v1t, ldv1t,
     $                      cdum, work(1), -1, childinfo )
               lorglqmin = max( lorglqmin, q-1 )
               lorglqopt = max( lorglqopt, int( work(1) ) )
            END IF
            CALL cbbcsd( jobu1, jobu2, jobv1t, 'N', 'N', m, p, q, theta,
     $                   dum(1), u1, ldu1, u2, ldu2, v1t, ldv1t, cdum,
     $                   1, dum, dum, dum, dum, dum, dum, dum, dum,
     $                   rwork(1), -1, childinfo )
            lbbcsd = int( rwork(1) )
         ELSE IF( r .EQ. p ) THEN
            CALL cunbdb2( m, p, q, x11, ldx11, x21, ldx21, theta, dum,
     $                    cdum, cdum, cdum, work(1), -1, childinfo )
            lorbdb = int( work(1) )
            IF( wantu1 .AND. p .GT. 0 ) THEN
               CALL cungqr( p-1, p-1, p-1, u1(2,2), ldu1, cdum, work(1),
     $                      -1, childinfo )
               lorgqrmin = max( lorgqrmin, p-1 )
               lorgqropt = max( lorgqropt, int( work(1) ) )
            END IF
            IF( wantu2 .AND. m-p .GT. 0 ) THEN
               CALL cungqr( m-p, m-p, q, u2, ldu2, cdum, work(1), -1,
     $                      childinfo )
               lorgqrmin = max( lorgqrmin, m-p )
               lorgqropt = max( lorgqropt, int( work(1) ) )
            END IF
            IF( wantv1t .AND. q .GT. 0 ) THEN
               CALL cunglq( q, q, r, v1t, ldv1t, cdum, work(1), -1,
     $                      childinfo )
               lorglqmin = max( lorglqmin, q )
               lorglqopt = max( lorglqopt, int( work(1) ) )
            END IF
            CALL cbbcsd( jobv1t, 'N', jobu1, jobu2, 'T', m, q, p, theta,
     $                   dum, v1t, ldv1t, cdum, 1, u1, ldu1, u2, ldu2,
     $                   dum, dum, dum, dum, dum, dum, dum, dum,
     $                   rwork(1), -1, childinfo )
            lbbcsd = int( rwork(1) )
         ELSE IF( r .EQ. m-p ) THEN
            CALL cunbdb3( m, p, q, x11, ldx11, x21, ldx21, theta, dum,
     $                    cdum, cdum, cdum, work(1), -1, childinfo )
            lorbdb = int( work(1) )
            IF( wantu1 .AND. p .GT. 0 ) THEN
               CALL cungqr( p, p, q, u1, ldu1, cdum, work(1), -1,
     $                      childinfo )
               lorgqrmin = max( lorgqrmin, p )
               lorgqropt = max( lorgqropt, int( work(1) ) )
            END IF
            IF( wantu2 .AND. m-p .GT. 0 ) THEN
               CALL cungqr( m-p-1, m-p-1, m-p-1, u2(2,2), ldu2, cdum,
     $                      work(1), -1, childinfo )
               lorgqrmin = max( lorgqrmin, m-p-1 )
               lorgqropt = max( lorgqropt, int( work(1) ) )
            END IF
            IF( wantv1t .AND. q .GT. 0 ) THEN
               CALL cunglq( q, q, r, v1t, ldv1t, cdum, work(1), -1,
     $                      childinfo )
               lorglqmin = max( lorglqmin, q )
               lorglqopt = max( lorglqopt, int( work(1) ) )
            END IF
            CALL cbbcsd( 'N', jobv1t, jobu2, jobu1, 'T', m, m-q, m-p,
     $                   theta, dum, cdum, 1, v1t, ldv1t, u2, ldu2, u1,
     $                   ldu1, dum, dum, dum, dum, dum, dum, dum, dum,
     $                   rwork(1), -1, childinfo )
            lbbcsd = int( rwork(1) )
         ELSE
            CALL cunbdb4( m, p, q, x11, ldx11, x21, ldx21, theta, dum,
     $                    cdum, cdum, cdum, cdum, work(1), -1, childinfo
     $                  )
*           Case 4 reserves M extra entries ahead of the CUNBDB4
*           scratch area (passed below as WORK(IORBDB))
            lorbdb = m + int( work(1) )
            IF( wantu1 .AND. p .GT. 0 ) THEN
               CALL cungqr( p, p, m-q, u1, ldu1, cdum, work(1), -1,
     $                      childinfo )
               lorgqrmin = max( lorgqrmin, p )
               lorgqropt = max( lorgqropt, int( work(1) ) )
            END IF
            IF( wantu2 .AND. m-p .GT. 0 ) THEN
               CALL cungqr( m-p, m-p, m-q, u2, ldu2, cdum, work(1), -1,
     $                      childinfo )
               lorgqrmin = max( lorgqrmin, m-p )
               lorgqropt = max( lorgqropt, int( work(1) ) )
            END IF
            IF( wantv1t .AND. q .GT. 0 ) THEN
               CALL cunglq( q, q, q, v1t, ldv1t, cdum, work(1), -1,
     $                      childinfo )
               lorglqmin = max( lorglqmin, q )
               lorglqopt = max( lorglqopt, int( work(1) ) )
            END IF
            CALL cbbcsd( jobu2, jobu1, 'N', jobv1t, 'N', m, m-p, m-q,
     $                   theta, dum, u2, ldu2, u1, ldu1, cdum, 1, v1t,
     $                   ldv1t, dum, dum, dum, dum, dum, dum, dum, dum,
     $                   rwork(1), -1, childinfo )
            lbbcsd = int( rwork(1) )
         END IF
         lrworkmin = ibbcsd+lbbcsd-1
         lrworkopt = lrworkmin
         rwork(1) = lrworkopt
         lworkmin = max( iorbdb+lorbdb-1,
     $                   iorgqr+lorgqrmin-1,
     $                   iorglq+lorglqmin-1 )
         lworkopt = max( iorbdb+lorbdb-1,
     $                   iorgqr+lorgqropt-1,
     $                   iorglq+lorglqopt-1 )
         work(1) = lworkopt
         IF( lwork .LT. lworkmin .AND. .NOT.lquery ) THEN
            info = -19
         END IF
         IF( lrwork .LT. lrworkmin .AND. .NOT.lquery ) THEN
            info = -21
         END IF
      END IF
      IF( info .NE. 0 ) THEN
         CALL xerbla( 'CUNCSD2BY1', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Hand all remaining complex workspace to CUNGQR / CUNGLQ
*
      lorgqr = lwork-iorgqr+1
      lorglq = lwork-iorglq+1
*
*     Handle four cases separately: R = Q, R = P, R = M-P, and R = M-Q,
*     in which R = MIN(P,M-P,Q,M-Q)
*
      IF( r .EQ. q ) THEN
*
*        Case 1: R = Q
*
*        Simultaneously bidiagonalize X11 and X21
*
         CALL cunbdb1( m, p, q, x11, ldx11, x21, ldx21, theta,
     $                 rwork(iphi), work(itaup1), work(itaup2),
     $                 work(itauq1), work(iorbdb), lorbdb, childinfo )
*
*        Accumulate Householder reflectors
*
         IF( wantu1 .AND. p .GT. 0 ) THEN
            CALL clacpy( 'L', p, q, x11, ldx11, u1, ldu1 )
            CALL cungqr( p, p, q, u1, ldu1, work(itaup1), work(iorgqr),
     $                   lorgqr, childinfo )
         END IF
         IF( wantu2 .AND. m-p .GT. 0 ) THEN
            CALL clacpy( 'L', m-p, q, x21, ldx21, u2, ldu2 )
            CALL cungqr( m-p, m-p, q, u2, ldu2, work(itaup2),
     $                   work(iorgqr), lorgqr, childinfo )
         END IF
         IF( wantv1t .AND. q .GT. 0 ) THEN
            v1t(1,1) = one
            DO j = 2, q
               v1t(1,j) = zero
               v1t(j,1) = zero
            END DO
            CALL clacpy( 'U', q-1, q-1, x21(1,2), ldx21, v1t(2,2),
     $                   ldv1t )
            CALL cunglq( q-1, q-1, q-1, v1t(2,2), ldv1t, work(itauq1),
     $                   work(iorglq), lorglq, childinfo )
         END IF
*
*        Simultaneously diagonalize X11 and X21.
*
         CALL cbbcsd( jobu1, jobu2, jobv1t, 'N', 'N', m, p, q, theta,
     $                rwork(iphi), u1, ldu1, u2, ldu2, v1t, ldv1t, cdum,
     $                1, rwork(ib11d), rwork(ib11e), rwork(ib12d),
     $                rwork(ib12e), rwork(ib21d), rwork(ib21e),
     $                rwork(ib22d), rwork(ib22e), rwork(ibbcsd),
     $                lrwork-ibbcsd+1, childinfo )
*
*        Report non-convergence of CBBCSD to the caller (INFO > 0)
*
         IF( childinfo .GT. 0 ) info = childinfo
*
*        Permute rows and columns to place zero submatrices in
*        preferred positions
*
         IF( q .GT. 0 .AND. wantu2 ) THEN
            DO i = 1, q
               iwork(i) = m - p - q + i
            END DO
            DO i = q + 1, m - p
               iwork(i) = i - q
            END DO
            CALL clapmt( .false., m-p, m-p, u2, ldu2, iwork )
         END IF
      ELSE IF( r .EQ. p ) THEN
*
*        Case 2: R = P
*
*        Simultaneously bidiagonalize X11 and X21
*
         CALL cunbdb2( m, p, q, x11, ldx11, x21, ldx21, theta,
     $                 rwork(iphi), work(itaup1), work(itaup2),
     $                 work(itauq1), work(iorbdb), lorbdb, childinfo )
*
*        Accumulate Householder reflectors
*
         IF( wantu1 .AND. p .GT. 0 ) THEN
            u1(1,1) = one
            DO j = 2, p
               u1(1,j) = zero
               u1(j,1) = zero
            END DO
            CALL clacpy( 'L', p-1, p-1, x11(2,1), ldx11, u1(2,2), ldu1 )
            CALL cungqr( p-1, p-1, p-1, u1(2,2), ldu1, work(itaup1),
     $                   work(iorgqr), lorgqr, childinfo )
         END IF
         IF( wantu2 .AND. m-p .GT. 0 ) THEN
            CALL clacpy( 'L', m-p, q, x21, ldx21, u2, ldu2 )
            CALL cungqr( m-p, m-p, q, u2, ldu2, work(itaup2),
     $                   work(iorgqr), lorgqr, childinfo )
         END IF
         IF( wantv1t .AND. q .GT. 0 ) THEN
            CALL clacpy( 'U', p, q, x11, ldx11, v1t, ldv1t )
            CALL cunglq( q, q, r, v1t, ldv1t, work(itauq1),
     $                   work(iorglq), lorglq, childinfo )
         END IF
*
*        Simultaneously diagonalize X11 and X21.
*
         CALL cbbcsd( jobv1t, 'N', jobu1, jobu2, 'T', m, q, p, theta,
     $                rwork(iphi), v1t, ldv1t, cdum, 1, u1, ldu1, u2,
     $                ldu2, rwork(ib11d), rwork(ib11e), rwork(ib12d),
     $                rwork(ib12e), rwork(ib21d), rwork(ib21e),
     $                rwork(ib22d), rwork(ib22e), rwork(ibbcsd), lbbcsd,
     $                childinfo )
*
*        Report non-convergence of CBBCSD to the caller (INFO > 0)
*
         IF( childinfo .GT. 0 ) info = childinfo
*
*        Permute rows and columns to place identity submatrices in
*        preferred positions
*
         IF( q .GT. 0 .AND. wantu2 ) THEN
            DO i = 1, q
               iwork(i) = m - p - q + i
            END DO
            DO i = q + 1, m - p
               iwork(i) = i - q
            END DO
            CALL clapmt( .false., m-p, m-p, u2, ldu2, iwork )
         END IF
      ELSE IF( r .EQ. m-p ) THEN
*
*        Case 3: R = M-P
*
*        Simultaneously bidiagonalize X11 and X21
*
         CALL cunbdb3( m, p, q, x11, ldx11, x21, ldx21, theta,
     $                 rwork(iphi), work(itaup1), work(itaup2),
     $                 work(itauq1), work(iorbdb), lorbdb, childinfo )
*
*        Accumulate Householder reflectors
*
         IF( wantu1 .AND. p .GT. 0 ) THEN
            CALL clacpy( 'L', p, q, x11, ldx11, u1, ldu1 )
            CALL cungqr( p, p, q, u1, ldu1, work(itaup1), work(iorgqr),
     $                   lorgqr, childinfo )
         END IF
         IF( wantu2 .AND. m-p .GT. 0 ) THEN
            u2(1,1) = one
            DO j = 2, m-p
               u2(1,j) = zero
               u2(j,1) = zero
            END DO
            CALL clacpy( 'L', m-p-1, m-p-1, x21(2,1), ldx21, u2(2,2),
     $                   ldu2 )
            CALL cungqr( m-p-1, m-p-1, m-p-1, u2(2,2), ldu2,
     $                   work(itaup2), work(iorgqr), lorgqr, childinfo )
         END IF
         IF( wantv1t .AND. q .GT. 0 ) THEN
            CALL clacpy( 'U', m-p, q, x21, ldx21, v1t, ldv1t )
            CALL cunglq( q, q, r, v1t, ldv1t, work(itauq1),
     $                   work(iorglq), lorglq, childinfo )
         END IF
*
*        Simultaneously diagonalize X11 and X21.
*
         CALL cbbcsd( 'N', jobv1t, jobu2, jobu1, 'T', m, m-q, m-p,
     $                theta, rwork(iphi), cdum, 1, v1t, ldv1t, u2, ldu2,
     $                u1, ldu1, rwork(ib11d), rwork(ib11e),
     $                rwork(ib12d), rwork(ib12e), rwork(ib21d),
     $                rwork(ib21e), rwork(ib22d), rwork(ib22e),
     $                rwork(ibbcsd), lbbcsd, childinfo )
*
*        Report non-convergence of CBBCSD to the caller (INFO > 0)
*
         IF( childinfo .GT. 0 ) info = childinfo
*
*        Permute rows and columns to place identity submatrices in
*        preferred positions
*
         IF( q .GT. r ) THEN
            DO i = 1, r
               iwork(i) = q - r + i
            END DO
            DO i = r + 1, q
               iwork(i) = i - r
            END DO
            IF( wantu1 ) THEN
               CALL clapmt( .false., p, q, u1, ldu1, iwork )
            END IF
            IF( wantv1t ) THEN
               CALL clapmr( .false., q, q, v1t, ldv1t, iwork )
            END IF
         END IF
      ELSE
*
*        Case 4: R = M-Q
*
*        Simultaneously bidiagonalize X11 and X21
*
         CALL cunbdb4( m, p, q, x11, ldx11, x21, ldx21, theta,
     $                 rwork(iphi), work(itaup1), work(itaup2),
     $                 work(itauq1), work(iorbdb), work(iorbdb+m),
     $                 lorbdb-m, childinfo )
*
*        Accumulate Householder reflectors
*
*        U2's first column is copied out of WORK(IORBDB+P:) before
*        the CUNGQR call for U1 below, because that call uses
*        WORK(IORGQR:) as scratch and IORGQR equals IORBDB.
*
         IF( wantu2 .AND. m-p .GT. 0 ) THEN
            CALL ccopy( m-p, work(iorbdb+p), 1, u2, 1 )
         END IF
         IF( wantu1 .AND. p .GT. 0 ) THEN
            CALL ccopy( p, work(iorbdb), 1, u1, 1 )
            DO j = 2, p
               u1(1,j) = zero
            END DO
            CALL clacpy( 'L', p-1, m-q-1, x11(2,1), ldx11, u1(2,2),
     $                   ldu1 )
            CALL cungqr( p, p, m-q, u1, ldu1, work(itaup1),
     $                   work(iorgqr), lorgqr, childinfo )
         END IF
         IF( wantu2 .AND. m-p .GT. 0 ) THEN
            DO j = 2, m-p
               u2(1,j) = zero
            END DO
            CALL clacpy( 'L', m-p-1, m-q-1, x21(2,1), ldx21, u2(2,2),
     $                   ldu2 )
            CALL cungqr( m-p, m-p, m-q, u2, ldu2, work(itaup2),
     $                   work(iorgqr), lorgqr, childinfo )
         END IF
         IF( wantv1t .AND. q .GT. 0 ) THEN
            CALL clacpy( 'U', m-q, q, x21, ldx21, v1t, ldv1t )
            CALL clacpy( 'U', p-(m-q), q-(m-q), x11(m-q+1,m-q+1), ldx11,
     $                   v1t(m-q+1,m-q+1), ldv1t )
            CALL clacpy( 'U', -p+q, q-p, x21(m-q+1,p+1), ldx21,
     $                   v1t(p+1,p+1), ldv1t )
            CALL cunglq( q, q, q, v1t, ldv1t, work(itauq1),
     $                   work(iorglq), lorglq, childinfo )
         END IF
*
*        Simultaneously diagonalize X11 and X21.
*
         CALL cbbcsd( jobu2, jobu1, 'N', jobv1t, 'N', m, m-p, m-q,
     $                theta, rwork(iphi), u2, ldu2, u1, ldu1, cdum, 1,
     $                v1t, ldv1t, rwork(ib11d), rwork(ib11e),
     $                rwork(ib12d), rwork(ib12e), rwork(ib21d),
     $                rwork(ib21e), rwork(ib22d), rwork(ib22e),
     $                rwork(ibbcsd), lbbcsd, childinfo )
*
*        Report non-convergence of CBBCSD to the caller (INFO > 0)
*
         IF( childinfo .GT. 0 ) info = childinfo
*
*        Permute rows and columns to place identity submatrices in
*        preferred positions
*
         IF( p .GT. r ) THEN
            DO i = 1, r
               iwork(i) = p - r + i
            END DO
            DO i = r + 1, p
               iwork(i) = i - r
            END DO
            IF( wantu1 ) THEN
               CALL clapmt( .false., p, p, u1, ldu1, iwork )
            END IF
            IF( wantv1t ) THEN
               CALL clapmr( .false., p, q, v1t, ldv1t, iwork )
            END IF
         END IF
      END IF
*
      RETURN
*
*     End of CUNCSD2BY1
*

◆ cung2l()

subroutine cung2l	(	integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	info )

CUNG2L generates all or part of the unitary matrix Q from a QL factorization determined by cgeqlf (unblocked algorithm).

Download CUNG2L + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNG2L generates an m by n complex matrix Q with orthonormal columns,
!> which is defined as the last n columns of a product of k elementary
!> reflectors of order m
!>
!>       Q  =  H(k) . . . H(2) H(1)
!>
!> as returned by CGEQLF.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix Q. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix Q. M >= N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines the !> matrix Q. N >= K >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the (n-k+i)-th column must contain the vector which !> defines the elementary reflector H(i), for i = 1,2,...,k, as !> returned by CGEQLF in the last k columns of its array !> argument A. !> On exit, the m-by-n matrix Q. !>
[in]	LDA	!> LDA is INTEGER !> The first dimension of the array A. LDA >= max(1,M). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGEQLF. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument has an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 113 of file cung2l.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Builds the m-by-n matrix Q (last n columns of H(k)...H(1))
*     in place in A, one reflector at a time (unblocked).
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, LDA, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE, ZERO
      parameter( one = ( 1.0e+0, 0.0e+0 ),
     $                   zero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      INTEGER            COL, PIVROW, REFL, ROW
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarf, cscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  The checks run from the last argument
*     to the first so that the lowest-numbered offending argument is
*     the one finally recorded in INFO.
*
      info = 0
      IF( lda.LT.max( 1, m ) ) info = -5
      IF( k.LT.0 .OR. k.GT.n ) info = -3
      IF( n.LT.0 .OR. n.GT.m ) info = -2
      IF( m.LT.0 ) info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNG2L', -info )
         RETURN
      END IF
*
*     Nothing to generate when Q has no columns
*
      IF( n.LE.0 ) RETURN
*
*     Columns 1:n-k start out as columns of the unit matrix
*
      DO col = 1, n - k
         DO row = 1, m
            a( row, col ) = zero
         END DO
         a( m-n+col, col ) = one
      END DO
*
*     Fold in the reflectors H(1), ..., H(k) in turn
*
      DO refl = 1, k
*
*        Column holding reflector REFL and the row of its unit entry
*
         col = n - k + refl
         pivrow = m - n + col
*
*        Apply H(refl) to A(1:pivrow,1:col-1) from the left
*
         a( pivrow, col ) = one
         CALL clarf( 'Left', pivrow, col-1, a( 1, col ), 1,
     $               tau( refl ), a, lda, work )
*
*        Turn the reflector vector into the matching column of Q
*
         CALL cscal( pivrow-1, -tau( refl ), a( 1, col ), 1 )
         a( pivrow, col ) = one - tau( refl )
*
*        Clear the entries below the pivot row in this column
*
         DO row = pivrow + 1, m
            a( row, col ) = zero
         END DO
      END DO
      RETURN
*
*     End of CUNG2L
*

◆ cung2r()

subroutine cung2r	(	integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	info )

CUNG2R

Download CUNG2R + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNG2R generates an m by n complex matrix Q with orthonormal columns,
!> which is defined as the first n columns of a product of k elementary
!> reflectors of order m
!>
!>       Q  =  H(1) H(2) . . . H(k)
!>
!> as returned by CGEQRF.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix Q. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix Q. M >= N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines the !> matrix Q. N >= K >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the i-th column must contain the vector which !> defines the elementary reflector H(i), for i = 1,2,...,k, as !> returned by CGEQRF in the first k columns of its array !> argument A. !> On exit, the m by n matrix Q. !>
[in]	LDA	!> LDA is INTEGER !> The first dimension of the array A. LDA >= max(1,M). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGEQRF. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument has an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 113 of file cung2r.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Builds the m-by-n matrix Q (first n columns of H(1)...H(k))
*     in place in A, one reflector at a time (unblocked).
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, LDA, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE, ZERO
      parameter( one = ( 1.0e+0, 0.0e+0 ),
     $                   zero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      INTEGER            COL, REFL, ROW
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarf, cscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  The checks run from the last argument
*     to the first so that the lowest-numbered offending argument is
*     the one finally recorded in INFO.
*
      info = 0
      IF( lda.LT.max( 1, m ) ) info = -5
      IF( k.LT.0 .OR. k.GT.n ) info = -3
      IF( n.LT.0 .OR. n.GT.m ) info = -2
      IF( m.LT.0 ) info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNG2R', -info )
         RETURN
      END IF
*
*     Nothing to generate when Q has no columns
*
      IF( n.LE.0 ) RETURN
*
*     Columns k+1:n start out as columns of the unit matrix
*
      DO col = k + 1, n
         DO row = 1, m
            a( row, col ) = zero
         END DO
         a( col, col ) = one
      END DO
*
*     Fold in the reflectors H(k), ..., H(1), last one first
*
      DO refl = k, 1, -1
*
*        Apply H(refl) to A(refl:m,refl+1:n) from the left
*
         IF( refl.LT.n ) THEN
            a( refl, refl ) = one
            CALL clarf( 'Left', m-refl+1, n-refl, a( refl, refl ), 1,
     $                  tau( refl ), a( refl, refl+1 ), lda, work )
         END IF
*
*        Turn the reflector vector into the matching column of Q
*
         IF( refl.LT.m ) THEN
            CALL cscal( m-refl, -tau( refl ), a( refl+1, refl ), 1 )
         END IF
         a( refl, refl ) = one - tau( refl )
*
*        Clear the entries above the diagonal in this column
*
         DO row = 1, refl - 1
            a( row, refl ) = zero
         END DO
      END DO
      RETURN
*
*     End of CUNG2R
*

◆ cunghr()

subroutine cunghr	(	integer	n,
		integer	ilo,
		integer	ihi,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNGHR

Download CUNGHR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNGHR generates a complex unitary matrix Q which is defined as the
!> product of IHI-ILO elementary reflectors of order N, as returned by
!> CGEHRD:
!>
!> Q = H(ilo) H(ilo+1) . . . H(ihi-1).
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the matrix Q. N >= 0. !>
[in]	ILO	!> ILO is INTEGER !>
[in]	IHI	!> IHI is INTEGER !> !> ILO and IHI must have the same values as in the previous call !> of CGEHRD. Q is equal to the unit matrix except in the !> submatrix Q(ilo+1:ihi,ilo+1:ihi). !> 1 <= ILO <= IHI <= N, if N > 0; ILO=1 and IHI=0, if N=0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the vectors which define the elementary reflectors, !> as returned by CGEHRD. !> On exit, the N-by-N unitary matrix Q. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (N-1) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGEHRD. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= IHI-ILO. !> For optimum performance LWORK >= (IHI-ILO)*NB, where NB is !> the optimal blocksize. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 125 of file cunghr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd. --
*
*     Rearranges the reflector vectors stored in A, fills the rest of
*     A with rows and columns of the unit matrix, and then lets CUNGQR
*     build the active block of order IHI-ILO.
*
*     .. Scalar Arguments ..
      INTEGER            IHI, ILO, INFO, LDA, LWORK, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CZERO, CONE
      PARAMETER          ( czero = ( 0.0e+0, 0.0e+0 ),
     $                   cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            WSQRY
      INTEGER            IERR, JC, LWOPT, NB, NH
*     ..
*     .. External Subroutines ..
      EXTERNAL           cungqr, xerbla
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  LWORK = -1 requests a workspace query
*     and is therefore exempt from the size check.
*
      info = 0
      nh = ihi - ilo
      wsqry = ( lwork.EQ.-1 )
      IF( n.LT.0 ) THEN
         info = -1
      ELSE IF( ilo.LT.1 .OR. ilo.GT.max( 1, n ) ) THEN
         info = -2
      ELSE IF( ihi.LT.min( ilo, n ) .OR. ihi.GT.n ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, n ) ) THEN
         info = -5
      ELSE IF( .NOT.wsqry .AND. lwork.LT.max( 1, nh ) ) THEN
         info = -8
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNGHR', -info )
         RETURN
      END IF
*
*     Arguments are valid: report the workspace size derived from the
*     CUNGQR block size in WORK(1)
*
      nb = ilaenv( 1, 'CUNGQR', ' ', nh, nh, nh, -1 )
      lwopt = nb*max( 1, nh )
      work( 1 ) = lwopt
      IF( wsqry ) RETURN
*
*     Nothing to generate for an empty matrix
*
      IF( n.EQ.0 ) THEN
         work( 1 ) = 1
         RETURN
      END IF
*
*     Move each reflector vector one column to the right, going from
*     column ihi down to ilo+1 so that no source column is overwritten
*     before it has been copied.  Everything outside rows j+1:ihi of
*     those columns is cleared.
*
      DO jc = ihi, ilo + 1, -1
         a( 1:jc-1, jc ) = czero
         a( jc+1:ihi, jc ) = a( jc+1:ihi, jc-1 )
         a( ihi+1:n, jc ) = czero
      END DO
*
*     The first ilo and the last n-ihi columns are unit vectors
*
      DO jc = 1, ilo
         a( 1:n, jc ) = czero
         a( jc, jc ) = cone
      END DO
      DO jc = ihi + 1, n
         a( 1:n, jc ) = czero
         a( jc, jc ) = cone
      END DO
*
      IF( nh.GT.0 ) THEN
*
*        Generate Q(ilo+1:ihi,ilo+1:ihi)
*
         CALL cungqr( nh, nh, nh, a( ilo+1, ilo+1 ), lda,
     $                tau( ilo ), work, lwork, ierr )
      END IF
      work( 1 ) = lwopt
      RETURN
*
*     End of CUNGHR
*

◆ cungl2()

subroutine cungl2	(	integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	info )

CUNGL2 generates all or part of the unitary matrix Q from an LQ factorization determined by cgelqf (unblocked algorithm).

Download CUNGL2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNGL2 generates an m-by-n complex matrix Q with orthonormal rows,
!> which is defined as the first m rows of a product of k elementary
!> reflectors of order n
!>
!>       Q  =  H(k)**H . . . H(2)**H H(1)**H
!>
!> as returned by CGELQF.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix Q. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix Q. N >= M. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines the !> matrix Q. M >= K >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the i-th row must contain the vector which defines !> the elementary reflector H(i), for i = 1,2,...,k, as returned !> by CGELQF in the first k rows of its array argument A. !> On exit, the m by n matrix Q. !>
[in]	LDA	!> LDA is INTEGER !> The first dimension of the array A. LDA >= max(1,M). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGELQF. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (M) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument has an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 112 of file cungl2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd. --
*
*     Unblocked generation of Q: A is overwritten row by row, working
*     backwards from reflector H(k) down to H(1).
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, LDA, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CONE, CZERO
      PARAMETER          ( cone = ( 1.0e+0, 0.0e+0 ),
     $                   czero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      INTEGER            IH, JC
*     ..
*     .. External Subroutines ..
      EXTERNAL           clacgv, clarf, cscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; INFO = -i flags the i-th argument and
*     only the first offending argument is reported.
*
      info = 0
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.m ) THEN
         info = -2
      ELSE IF( k.LT.0 .OR. k.GT.m ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -5
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNGL2', -info )
         RETURN
      END IF
*
*     An empty matrix needs no work
*
      IF( m.LE.0 ) RETURN
*
      IF( k.LT.m ) THEN
*
*        Rows k+1:m carry no reflector: start them as rows of the
*        unit matrix
*
         DO jc = 1, n
            a( k+1:m, jc ) = czero
            IF( jc.GT.k .AND. jc.LE.m ) a( jc, jc ) = cone
         END DO
      END IF
*
      DO ih = k, 1, -1
*
*        Apply H(ih)**H to A(ih:m,ih:n) from the right.  Row ih is
*        conjugated in place for the duration of the update and
*        conjugated back afterwards.
*
         IF( ih.LT.n ) THEN
            CALL clacgv( n-ih, a( ih, ih+1 ), lda )
            IF( ih.LT.m ) THEN
               a( ih, ih ) = cone
               CALL clarf( 'Right', m-ih, n-ih+1, a( ih, ih ), lda,
     $                     conjg( tau( ih ) ), a( ih+1, ih ), lda,
     $                     work )
            END IF
            CALL cscal( n-ih, -tau( ih ), a( ih, ih+1 ), lda )
            CALL clacgv( n-ih, a( ih, ih+1 ), lda )
         END IF
         a( ih, ih ) = cone - conjg( tau( ih ) )
*
*        Set A(ih,1:ih-1) to zero
*
         a( ih, 1:ih-1 ) = czero
      END DO
      RETURN
*
*     End of CUNGL2
*

◆ cunglq()

subroutine cunglq	(	integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNGLQ

Download CUNGLQ + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNGLQ generates an M-by-N complex matrix Q with orthonormal rows,
!> which is defined as the first M rows of a product of K elementary
!> reflectors of order N
!>
!>       Q  =  H(k)**H . . . H(2)**H H(1)**H
!>
!> as returned by CGELQF.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix Q. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix Q. N >= M. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines the !> matrix Q. M >= K >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the i-th row must contain the vector which defines !> the elementary reflector H(i), for i = 1,2,...,k, as returned !> by CGELQF in the first k rows of its array argument A. !> On exit, the M-by-N matrix Q. !>
[in]	LDA	!> LDA is INTEGER !> The first dimension of the array A. LDA >= max(1,M). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGELQF. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,M). !> For optimum performance LWORK >= M*NB, where NB is !> the optimal blocksize. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit; !> < 0: if INFO = -i, the i-th argument has an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 126 of file cunglq.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Blocked driver.  The rows beyond the first KK are generated by
*     the unblocked routine CUNGL2; the first KK rows are then
*     generated block by block, from the last block to the first,
*     using CLARFT, CLARFB and CUNGL2.  KK = 0 selects the purely
*     unblocked path.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, LDA, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ZERO
      parameter( zero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LQUERY
      INTEGER            I, IB, IINFO, IWS, J, KI, KK, L, LDWORK,
     $                   LWKOPT, NB, NBMIN, NX
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarfb, clarft, cungl2, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
*     NB is the value ILAENV returns for ISPEC = 1 and serves as the
*     block size below.  WORK(1) is written here, ahead of the
*     argument checks, so it is set on every path including the error
*     return.
*
      info = 0
      nb = ilaenv( 1, 'CUNGLQ', ' ', m, n, k, -1 )
      lwkopt = max( 1, m )*nb
      work( 1 ) = lwkopt
      lquery = ( lwork.EQ.-1 )
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.m ) THEN
         info = -2
      ELSE IF( k.LT.0 .OR. k.GT.m ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -5
      ELSE IF( lwork.LT.max( 1, m ) .AND. .NOT.lquery ) THEN
         info = -8
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNGLQ', -info )
         RETURN
      ELSE IF( lquery ) THEN
*
*        Workspace query: WORK(1) already holds LWKOPT
*
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.LE.0 ) THEN
         work( 1 ) = 1
         RETURN
      END IF
*
*     Defaults for the unblocked path: IWS = M is the value reported
*     in WORK(1) on exit unless the blocked sizing below replaces it.
*
      nbmin = 2
      nx = 0
      iws = m
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
*
*        Determine when to cross over from blocked to unblocked code.
*
         nx = max( 0, ilaenv( 3, 'CUNGLQ', ' ', m, n, k, -1 ) )
         IF( nx.LT.k ) THEN
*
*           Determine if workspace is large enough for blocked code.
*
*           LDWORK is assigned only on this branch.  Its only uses are
*           inside the KK > 0 loop, which is reached only when
*           NB > 1, NB < K and NX < K, i.e. after this assignment.
*           IWS is computed from NB before NB is possibly reduced.
*
            ldwork = m
            iws = ldwork*nb
            IF( lwork.LT.iws ) THEN
*
*              Not enough workspace to use optimal NB:  reduce NB and
*              determine the minimum value of NB.
*
*              Integer division: the largest NB with
*              LDWORK*NB <= LWORK.
*
               nb = lwork / ldwork
               nbmin = max( 2, ilaenv( 2, 'CUNGLQ', ' ', m, n, k, -1 ) )
            END IF
         END IF
      END IF
*
      IF( nb.GE.nbmin .AND. nb.LT.k .AND. nx.LT.k ) THEN
*
*        Use blocked code after the last block.
*        The first kk rows are handled by the block method.
*
*        KI is the zero-based starting offset of the last block that
*        the blocked loop below processes.
*
         ki = ( ( k-nx-1 ) / nb )*nb
         kk = min( k, ki+nb )
*
*        Set A(kk+1:m,1:kk) to zero.
*
         DO 20 j = 1, kk
            DO 10 i = kk + 1, m
               a( i, j ) = zero
   10       CONTINUE
   20    CONTINUE
      ELSE
         kk = 0
      END IF
*
*     Use unblocked code for the last or only block.
*
*     IINFO returned by CUNGL2 is not examined.
*
      IF( kk.LT.m )
     $   CALL cungl2( m-kk, n-kk, k-kk, a( kk+1, kk+1 ), lda,
     $                tau( kk+1 ), work, iinfo )
*
      IF( kk.GT.0 ) THEN
*
*        Use blocked code
*
*        Blocks are visited from the last (starting at row KI+1) back
*        to the first; IB is the number of reflectors in the block.
*
         DO 50 i = ki + 1, 1, -nb
            ib = min( nb, k-i+1 )
            IF( i+ib.LE.m ) THEN
*
*              Rows i+ib:m exist below the current block and must be
*              updated with the block reflector.
*
*              Form the triangular factor of the block reflector
*              H = H(i) H(i+1) . . . H(i+ib-1)
*
               CALL clarft( 'Forward', 'Rowwise', n-i+1, ib, a( i, i ),
     $                      lda, tau( i ), work, ldwork )
*
*              Apply H**H to A(i+ib:m,i:n) from the right
*
*              WORK(1:...) holds the triangular factor from CLARFT;
*              WORK(IB+1) is passed to CLARFB as its scratch array.
*
               CALL clarfb( 'Right', 'Conjugate transpose', 'Forward',
     $                      'Rowwise', m-i-ib+1, n-i+1, ib, a( i, i ),
     $                      lda, work, ldwork, a( i+ib, i ), lda,
     $                      work( ib+1 ), ldwork )
            END IF
*
*           Apply H**H to columns i:n of current block
*
            CALL cungl2( ib, n-i+1, ib, a( i, i ), lda, tau( i ), work,
     $                   iinfo )
*
*           Set columns 1:i-1 of current block to zero
*
            DO 40 j = 1, i - 1
               DO 30 l = i, i + ib - 1
                  a( l, j ) = zero
   30          CONTINUE
   40       CONTINUE
   50    CONTINUE
      END IF
*
*     Report IWS (M, or M times the NB obtained from ILAENV) in WORK(1)
*
      work( 1 ) = iws
      RETURN
*
*     End of CUNGLQ
*

◆ cungql()

subroutine cungql	(	integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNGQL

Download CUNGQL + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNGQL generates an M-by-N complex matrix Q with orthonormal columns,
!> which is defined as the last N columns of a product of K elementary
!> reflectors of order M
!>
!>       Q  =  H(k) . . . H(2) H(1)
!>
!> as returned by CGEQLF.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix Q. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix Q. M >= N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines the !> matrix Q. N >= K >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the (n-k+i)-th column must contain the vector which !> defines the elementary reflector H(i), for i = 1,2,...,k, as !> returned by CGEQLF in the last k columns of its array !> argument A. !> On exit, the M-by-N matrix Q. !>
[in]	LDA	!> LDA is INTEGER !> The first dimension of the array A. LDA >= max(1,M). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGEQLF. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,N). !> For optimum performance LWORK >= N*NB, where NB is the !> optimal blocksize. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument has an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 127 of file cungql.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Blocked driver.  The leading (M-KK)-by-(N-KK) part is generated
*     by the unblocked routine CUNG2L; the last KK columns are then
*     generated block by block, from the first block to the last,
*     using CLARFT, CLARFB and CUNG2L.  KK = 0 selects the purely
*     unblocked path.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, LDA, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ZERO
      parameter( zero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LQUERY
      INTEGER            I, IB, IINFO, IWS, J, KK, L, LDWORK, LWKOPT,
     $                   NB, NBMIN, NX
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarfb, clarft, cung2l, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      info = 0
      lquery = ( lwork.EQ.-1 )
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 .OR. n.GT.m ) THEN
         info = -2
      ELSE IF( k.LT.0 .OR. k.GT.n ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -5
      END IF
*
*     The workspace size is computed, and LWORK checked, only once
*     the other arguments are known to be valid.  NB is assigned only
*     when N > 0; for N = 0 the quick return below is taken before NB
*     is read.
*
      IF( info.EQ.0 ) THEN
         IF( n.EQ.0 ) THEN
            lwkopt = 1
         ELSE
            nb = ilaenv( 1, 'CUNGQL', ' ', m, n, k, -1 )
            lwkopt = n*nb
         END IF
         work( 1 ) = lwkopt
*
         IF( lwork.LT.max( 1, n ) .AND. .NOT.lquery ) THEN
            info = -8
         END IF
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNGQL', -info )
         RETURN
      ELSE IF( lquery ) THEN
*
*        Workspace query: WORK(1) already holds LWKOPT
*
         RETURN
      END IF
*
*     Quick return if possible
*
*     WORK(1) keeps the value LWKOPT = 1 stored above.
*
      IF( n.LE.0 ) THEN
         RETURN
      END IF
*
*     Defaults for the unblocked path: IWS = N is the value reported
*     in WORK(1) on exit unless the blocked sizing below replaces it.
*
      nbmin = 2
      nx = 0
      iws = n
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
*
*        Determine when to cross over from blocked to unblocked code.
*
         nx = max( 0, ilaenv( 3, 'CUNGQL', ' ', m, n, k, -1 ) )
         IF( nx.LT.k ) THEN
*
*           Determine if workspace is large enough for blocked code.
*
*           LDWORK is assigned only on this branch.  Its only uses are
*           inside the KK > 0 loop, which is reached only when
*           NB > 1, NB < K and NX < K, i.e. after this assignment.
*           IWS is computed from NB before NB is possibly reduced.
*
            ldwork = n
            iws = ldwork*nb
            IF( lwork.LT.iws ) THEN
*
*              Not enough workspace to use optimal NB:  reduce NB and
*              determine the minimum value of NB.
*
*              Integer division: the largest NB with
*              LDWORK*NB <= LWORK.
*
               nb = lwork / ldwork
               nbmin = max( 2, ilaenv( 2, 'CUNGQL', ' ', m, n, k, -1 ) )
            END IF
         END IF
      END IF
*
      IF( nb.GE.nbmin .AND. nb.LT.k .AND. nx.LT.k ) THEN
*
*        Use blocked code after the first block.
*        The last kk columns are handled by the block method.
*
*        KK is K-NX rounded up to a multiple of NB, capped at K.
*
         kk = min( k, ( ( k-nx+nb-1 ) / nb )*nb )
*
*        Set A(m-kk+1:m,1:n-kk) to zero.
*
         DO 20 j = 1, n - kk
            DO 10 i = m - kk + 1, m
               a( i, j ) = zero
   10       CONTINUE
   20    CONTINUE
      ELSE
         kk = 0
      END IF
*
*     Use unblocked code for the first or only block.
*
*     This call is unconditional; IINFO returned by CUNG2L is not
*     examined.
*
      CALL cung2l( m-kk, n-kk, k-kk, a, lda, tau, work, iinfo )
*
      IF( kk.GT.0 ) THEN
*
*        Use blocked code
*
*        Blocks are visited in increasing reflector index, starting at
*        reflector K-KK+1; IB is the number of reflectors in the
*        block, whose columns start at column N-K+I of A.
*
         DO 50 i = k - kk + 1, k, nb
            ib = min( nb, k-i+1 )
            IF( n-k+i.GT.1 ) THEN
*
*              Columns 1:n-k+i-1 exist to the left of the current
*              block and must be updated with the block reflector.
*
*              Form the triangular factor of the block reflector
*              H = H(i+ib-1) . . . H(i+1) H(i)
*
               CALL clarft( 'Backward', 'Columnwise', m-k+i+ib-1, ib,
     $                      a( 1, n-k+i ), lda, tau( i ), work, ldwork )
*
*              Apply H to A(1:m-k+i+ib-1,1:n-k+i-1) from the left
*
*              WORK(1:...) holds the triangular factor from CLARFT;
*              WORK(IB+1) is passed to CLARFB as its scratch array.
*
               CALL clarfb( 'Left', 'No transpose', 'Backward',
     $                      'Columnwise', m-k+i+ib-1, n-k+i-1, ib,
     $                      a( 1, n-k+i ), lda, work, ldwork, a, lda,
     $                      work( ib+1 ), ldwork )
            END IF
*
*           Apply H to rows 1:m-k+i+ib-1 of current block
*
            CALL cung2l( m-k+i+ib-1, ib, ib, a( 1, n-k+i ), lda,
     $                   tau( i ), work, iinfo )
*
*           Set rows m-k+i+ib:m of current block to zero
*
            DO 40 j = n - k + i, n - k + i + ib - 1
               DO 30 l = m - k + i + ib, m
                  a( l, j ) = zero
   30          CONTINUE
   40       CONTINUE
   50    CONTINUE
      END IF
*
*     Report IWS (N, or N times the NB obtained from ILAENV) in WORK(1)
*
      work( 1 ) = iws
      RETURN
*
*     End of CUNGQL
*

◆ cungqr()

subroutine cungqr	(	integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNGQR

Download CUNGQR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNGQR generates an M-by-N complex matrix Q with orthonormal columns,
!> which is defined as the first N columns of a product of K elementary
!> reflectors of order M
!>
!>       Q  =  H(1) H(2) . . . H(k)
!>
!> as returned by CGEQRF.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix Q. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix Q. M >= N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines the !> matrix Q. N >= K >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the i-th column must contain the vector which !> defines the elementary reflector H(i), for i = 1,2,...,k, as !> returned by CGEQRF in the first k columns of its array !> argument A. !> On exit, the M-by-N matrix Q. !>
[in]	LDA	!> LDA is INTEGER !> The first dimension of the array A. LDA >= max(1,M). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGEQRF. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,N). !> For optimum performance LWORK >= N*NB, where NB is the !> optimal blocksize. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument has an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 127 of file cungqr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Blocked driver.  The columns beyond the first KK are generated
*     by the unblocked routine CUNG2R; the first KK columns are then
*     generated block by block, from the last block to the first,
*     using CLARFT, CLARFB and CUNG2R.  KK = 0 selects the purely
*     unblocked path.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, LDA, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ZERO
      parameter( zero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LQUERY
      INTEGER            I, IB, IINFO, IWS, J, KI, KK, L, LDWORK,
     $                   LWKOPT, NB, NBMIN, NX
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarfb, clarft, cung2r, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
*     NB is the value ILAENV returns for ISPEC = 1 and serves as the
*     block size below.  WORK(1) is written here, ahead of the
*     argument checks, so it is set on every path including the error
*     return.
*
      info = 0
      nb = ilaenv( 1, 'CUNGQR', ' ', m, n, k, -1 )
      lwkopt = max( 1, n )*nb
      work( 1 ) = lwkopt
      lquery = ( lwork.EQ.-1 )
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 .OR. n.GT.m ) THEN
         info = -2
      ELSE IF( k.LT.0 .OR. k.GT.n ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -5
      ELSE IF( lwork.LT.max( 1, n ) .AND. .NOT.lquery ) THEN
         info = -8
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNGQR', -info )
         RETURN
      ELSE IF( lquery ) THEN
*
*        Workspace query: WORK(1) already holds LWKOPT
*
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.LE.0 ) THEN
         work( 1 ) = 1
         RETURN
      END IF
*
*     Defaults for the unblocked path: IWS = N is the value reported
*     in WORK(1) on exit unless the blocked sizing below replaces it.
*
      nbmin = 2
      nx = 0
      iws = n
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
*
*        Determine when to cross over from blocked to unblocked code.
*
         nx = max( 0, ilaenv( 3, 'CUNGQR', ' ', m, n, k, -1 ) )
         IF( nx.LT.k ) THEN
*
*           Determine if workspace is large enough for blocked code.
*
*           LDWORK is assigned only on this branch.  Its only uses are
*           inside the KK > 0 loop, which is reached only when
*           NB > 1, NB < K and NX < K, i.e. after this assignment.
*           IWS is computed from NB before NB is possibly reduced.
*
            ldwork = n
            iws = ldwork*nb
            IF( lwork.LT.iws ) THEN
*
*              Not enough workspace to use optimal NB:  reduce NB and
*              determine the minimum value of NB.
*
*              Integer division: the largest NB with
*              LDWORK*NB <= LWORK.
*
               nb = lwork / ldwork
               nbmin = max( 2, ilaenv( 2, 'CUNGQR', ' ', m, n, k, -1 ) )
            END IF
         END IF
      END IF
*
      IF( nb.GE.nbmin .AND. nb.LT.k .AND. nx.LT.k ) THEN
*
*        Use blocked code after the last block.
*        The first kk columns are handled by the block method.
*
*        KI is the zero-based starting offset of the last block that
*        the blocked loop below processes.
*
         ki = ( ( k-nx-1 ) / nb )*nb
         kk = min( k, ki+nb )
*
*        Set A(1:kk,kk+1:n) to zero.
*
         DO 20 j = kk + 1, n
            DO 10 i = 1, kk
               a( i, j ) = zero
   10       CONTINUE
   20    CONTINUE
      ELSE
         kk = 0
      END IF
*
*     Use unblocked code for the last or only block.
*
*     IINFO returned by CUNG2R is not examined.
*
      IF( kk.LT.n )
     $   CALL cung2r( m-kk, n-kk, k-kk, a( kk+1, kk+1 ), lda,
     $                tau( kk+1 ), work, iinfo )
*
      IF( kk.GT.0 ) THEN
*
*        Use blocked code
*
*        Blocks are visited from the last (starting at column KI+1)
*        back to the first; IB is the number of reflectors in the
*        block.
*
         DO 50 i = ki + 1, 1, -nb
            ib = min( nb, k-i+1 )
            IF( i+ib.LE.n ) THEN
*
*              Columns i+ib:n exist to the right of the current block
*              and must be updated with the block reflector.
*
*              Form the triangular factor of the block reflector
*              H = H(i) H(i+1) . . . H(i+ib-1)
*
               CALL clarft( 'Forward', 'Columnwise', m-i+1, ib,
     $                      a( i, i ), lda, tau( i ), work, ldwork )
*
*              Apply H to A(i:m,i+ib:n) from the left
*
*              WORK(1:...) holds the triangular factor from CLARFT;
*              WORK(IB+1) is passed to CLARFB as its scratch array.
*
               CALL clarfb( 'Left', 'No transpose', 'Forward',
     $                      'Columnwise', m-i+1, n-i-ib+1, ib,
     $                      a( i, i ), lda, work, ldwork, a( i, i+ib ),
     $                      lda, work( ib+1 ), ldwork )
            END IF
*
*           Apply H to rows i:m of current block
*
            CALL cung2r( m-i+1, ib, ib, a( i, i ), lda, tau( i ), work,
     $                   iinfo )
*
*           Set rows 1:i-1 of current block to zero
*
            DO 40 j = i, i + ib - 1
               DO 30 l = 1, i - 1
                  a( l, j ) = zero
   30          CONTINUE
   40       CONTINUE
   50    CONTINUE
      END IF
*
*     Report IWS (N, or N times the NB obtained from ILAENV) in WORK(1)
*
      work( 1 ) = iws
      RETURN
*
*     End of CUNGQR
*

◆ cungr2()

subroutine cungr2	(	integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	info )

CUNGR2 generates all or part of the unitary matrix Q from an RQ factorization determined by cgerqf (unblocked algorithm).

Download CUNGR2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNGR2 generates an m by n complex matrix Q with orthonormal rows,
!> which is defined as the last m rows of a product of k elementary
!> reflectors of order n
!>
!>       Q  =  H(1)**H H(2)**H . . . H(k)**H
!>
!> as returned by CGERQF.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix Q. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix Q. N >= M. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines the !> matrix Q. M >= K >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the (m-k+i)-th row must contain the vector which !> defines the elementary reflector H(i), for i = 1,2,...,k, as !> returned by CGERQF in the last k rows of its array argument !> A. !> On exit, the m-by-n matrix Q. !>
[in]	LDA	!> LDA is INTEGER !> The first dimension of the array A. LDA >= max(1,M). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGERQF. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (M) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument has an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 113 of file cungr2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd. --
*
*     Unblocked generation of Q: A is overwritten row by row, working
*     forwards from reflector H(1) up to H(k).  Reflector H(i) lives
*     in row m-k+i of A.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, LDA, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CONE, CZERO
      PARAMETER          ( cone = ( 1.0e+0, 0.0e+0 ),
     $                   czero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      INTEGER            IH, IROW, JC, JDIAG
*     ..
*     .. External Subroutines ..
      EXTERNAL           clacgv, clarf, cscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; INFO = -i flags the i-th argument and
*     only the first offending argument is reported.
*
      info = 0
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.m ) THEN
         info = -2
      ELSE IF( k.LT.0 .OR. k.GT.m ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -5
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNGR2', -info )
         RETURN
      END IF
*
*     An empty matrix needs no work
*
      IF( m.LE.0 ) RETURN
*
      IF( k.LT.m ) THEN
*
*        Rows 1:m-k carry no reflector: start them as rows of the
*        unit matrix, with the one of row l placed in column n-m+l
*
         DO jc = 1, n
            a( 1:m-k, jc ) = czero
            IF( jc.GT.n-m .AND. jc.LE.n-k ) a( m-n+jc, jc ) = cone
         END DO
      END IF
*
      DO ih = 1, k
*
*        Row of A holding H(ih) and the column of its unit entry
*
         irow = m - k + ih
         jdiag = n - m + irow
*
*        Apply H(ih)**H to A(1:m-k+ih,1:n-k+ih) from the right.  The
*        row is conjugated in place for the duration of the update
*        and conjugated back afterwards.
*
         CALL clacgv( jdiag-1, a( irow, 1 ), lda )
         a( irow, jdiag ) = cone
         CALL clarf( 'Right', irow-1, jdiag, a( irow, 1 ), lda,
     $               conjg( tau( ih ) ), a, lda, work )
         CALL cscal( jdiag-1, -tau( ih ), a( irow, 1 ), lda )
         CALL clacgv( jdiag-1, a( irow, 1 ), lda )
         a( irow, jdiag ) = cone - conjg( tau( ih ) )
*
*        Set A(m-k+ih,n-k+ih+1:n) to zero
*
         a( irow, jdiag+1:n ) = czero
      END DO
      RETURN
*
*     End of CUNGR2
*

◆ cungrq()

subroutine cungrq	(	integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNGRQ

Download CUNGRQ + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNGRQ generates an M-by-N complex matrix Q with orthonormal rows,
!> which is defined as the last M rows of a product of K elementary
!> reflectors of order N
!>
!>       Q  =  H(1)**H H(2)**H . . . H(k)**H
!>
!> as returned by CGERQF.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix Q. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix Q. N >= M. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines the !> matrix Q. M >= K >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the (m-k+i)-th row must contain the vector which !> defines the elementary reflector H(i), for i = 1,2,...,k, as !> returned by CGERQF in the last k rows of its array argument !> A. !> On exit, the M-by-N matrix Q. !>
[in]	LDA	!> LDA is INTEGER !> The first dimension of the array A. LDA >= max(1,M). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGERQF. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,M). !> For optimum performance LWORK >= M*NB, where NB is the !> optimal blocksize. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument has an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 127 of file cungrq.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Blocked driver: the last KK reflectors are applied in blocks of
*     NB rows via CLARFT/CLARFB, and everything else (or the whole
*     problem when blocking is not used) is delegated to the
*     unblocked routine CUNGR2.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, K, LDA, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ZERO
      parameter( zero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LQUERY
      INTEGER            I, IB, II, IINFO, IWS, J, KK, L, LDWORK,
     $                   LWKOPT, NB, NBMIN, NX
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarfb, clarft, cungr2, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
*     LWORK = -1 requests a workspace query instead of a computation.
*
      info = 0
      lquery = ( lwork.EQ.-1 )
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.m ) THEN
         info = -2
      ELSE IF( k.LT.0 .OR. k.GT.m ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -5
      END IF
*
*     With valid dimensions, compute the optimal workspace M*NB and
*     store it in WORK(1) before LWORK itself is validated, so that a
*     workspace query can return it.
*
      IF( info.EQ.0 ) THEN
         IF( m.LE.0 ) THEN
            lwkopt = 1
         ELSE
            nb = ilaenv( 1, 'CUNGRQ', ' ', m, n, k, -1 )
            lwkopt = m*nb
         END IF
         work( 1 ) = lwkopt
*
         IF( lwork.LT.max( 1, m ) .AND. .NOT.lquery ) THEN
            info = -8
         END IF
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNGRQ', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.LE.0 ) THEN
         RETURN
      END IF
*
*     Defaults for the unblocked path: NBMIN is the smallest block
*     size for which blocked code is used, NX the crossover point and
*     IWS the workspace size reported in WORK(1) on exit.
*
      nbmin = 2
      nx = 0
      iws = m
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
*
*        Determine when to cross over from blocked to unblocked code.
*
         nx = max( 0, ilaenv( 3, 'CUNGRQ', ' ', m, n, k, -1 ) )
         IF( nx.LT.k ) THEN
*
*           Determine if workspace is large enough for blocked code.
*
            ldwork = m
            iws = ldwork*nb
            IF( lwork.LT.iws ) THEN
*
*              Not enough workspace to use optimal NB:  reduce NB and
*              determine the minimum value of NB.
*
               nb = lwork / ldwork
               nbmin = max( 2, ilaenv( 2, 'CUNGRQ', ' ', m, n, k, -1 ) )
            END IF
         END IF
      END IF
*
      IF( nb.GE.nbmin .AND. nb.LT.k .AND. nx.LT.k ) THEN
*
*        Use blocked code after the first block.
*        The last kk rows are handled by the block method.
*
*        KK is K-NX rounded up to a multiple of NB, capped at K.
*
         kk = min( k, ( ( k-nx+nb-1 ) / nb )*nb )
*
*        Set A(1:m-kk,n-kk+1:n) to zero.
*
         DO 20 j = n - kk + 1, n
            DO 10 i = 1, m - kk
               a( i, j ) = zero
   10       CONTINUE
   20    CONTINUE
      ELSE
         kk = 0
      END IF
*
*     Use unblocked code for the first or only block.
*
      CALL cungr2( m-kk, n-kk, k-kk, a, lda, tau, work, iinfo )
*
      IF( kk.GT.0 ) THEN
*
*        Use blocked code
*
*        Each pass handles reflectors I:I+IB-1, stored in rows
*        II:II+IB-1 of A.
*
         DO 50 i = k - kk + 1, k, nb
            ib = min( nb, k-i+1 )
            ii = m - k + i
            IF( ii.GT.1 ) THEN
*
*              Form the triangular factor of the block reflector
*              H = H(i+ib-1) . . . H(i+1) H(i)
*
*              The factor is written to the start of WORK with
*              leading dimension LDWORK.
*
               CALL clarft( 'Backward', 'Rowwise', n-k+i+ib-1, ib,
     $                      a( ii, 1 ), lda, tau( i ), work, ldwork )
*
*              Apply H**H to A(1:m-k+i-1,1:n-k+i+ib-1) from the right
*
*              WORK(IB+1) onward is passed to CLARFB as its scratch
*              array, after the triangular factor.
*
               CALL clarfb( 'Right', 'Conjugate transpose', 'Backward',
     $                      'Rowwise', ii-1, n-k+i+ib-1, ib, a( ii, 1 ),
     $                      lda, work, ldwork, a, lda, work( ib+1 ),
     $                      ldwork )
            END IF
*
*           Apply H**H to columns 1:n-k+i+ib-1 of current block
*
            CALL cungr2( ib, n-k+i+ib-1, ib, a( ii, 1 ), lda, tau( i ),
     $                   work, iinfo )
*
*           Set columns n-k+i+ib:n of current block to zero
*
            DO 40 l = n - k + i + ib, n
               DO 30 j = ii, ii + ib - 1
                  a( j, l ) = zero
   30          CONTINUE
   40       CONTINUE
   50    CONTINUE
      END IF
*
*     Report IWS (M, or M*NB as set above on the blocked path) in
*     WORK(1).
*
      work( 1 ) = iws
      RETURN
*
*     End of CUNGRQ
*

◆ cungtr()

subroutine cungtr	(	character	uplo,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNGTR

Download CUNGTR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNGTR generates a complex unitary matrix Q which is defined as the
!> product of n-1 elementary reflectors of order N, as returned by
!> CHETRD:
!>
!> if UPLO = 'U', Q = H(n-1) . . . H(2) H(1),
!>
!> if UPLO = 'L', Q = H(1) H(2) . . . H(n-1).
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A contains elementary reflectors !> from CHETRD; !> = 'L': Lower triangle of A contains elementary reflectors !> from CHETRD. !>
[in]	N	!> N is INTEGER !> The order of the matrix Q. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the vectors which define the elementary reflectors, !> as returned by CHETRD. !> On exit, the N-by-N unitary matrix Q. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (N-1) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CHETRD. !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,N-1). !> For optimum performance LWORK >= (N-1)*NB, where NB is !> the optimal blocksize. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 122 of file cungtr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Builds the N-by-N matrix Q in A: the reflector vectors are
*     shifted by one column, the freed row and column are set to those
*     of the unit matrix, and the remaining (N-1)-by-(N-1) block is
*     generated by CUNGQL (UPLO = 'U') or CUNGQR (UPLO = 'L').
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDA, LWORK, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ZERO, ONE
      PARAMETER          ( ZERO = ( 0.0E+0, 0.0E+0 ),
     $                   ONE = ( 1.0E+0, 0.0E+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LQUERY, UPPER
      INTEGER            IINFO, IROW, JCOL, LWKOPT, NB, NM1
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      EXTERNAL           ILAENV, LSAME
*     ..
*     .. External Subroutines ..
      EXTERNAL           CUNGQL, CUNGQR, XERBLA
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments. The tests run from the last argument to
*     the first, so the lowest-numbered offending argument is the one
*     finally recorded in INFO.
*
      INFO = 0
      NM1 = N - 1
      LQUERY = ( LWORK.EQ.-1 )
      UPPER = LSAME( UPLO, 'U' )
      IF( LWORK.LT.MAX( 1, NM1 ) .AND. .NOT.LQUERY ) INFO = -7
      IF( LDA.LT.MAX( 1, N ) ) INFO = -4
      IF( N.LT.0 ) INFO = -2
      IF( .NOT.UPPER .AND. .NOT.LSAME( UPLO, 'L' ) ) INFO = -1
      IF( INFO.NE.0 ) THEN
         CALL XERBLA( 'CUNGTR', -INFO )
         RETURN
      END IF
*
*     Optimal workspace, using the block size of the routine that
*     will generate the (N-1)-by-(N-1) block
*
      IF( UPPER ) THEN
         NB = ILAENV( 1, 'CUNGQL', ' ', NM1, NM1, NM1, -1 )
      ELSE
         NB = ILAENV( 1, 'CUNGQR', ' ', NM1, NM1, NM1, -1 )
      END IF
      LWKOPT = MAX( 1, NM1 )*NB
      WORK( 1 ) = LWKOPT
*
*     A workspace query stops here
*
      IF( LQUERY ) RETURN
*
*     Nothing to generate for an empty matrix
*
      IF( N.EQ.0 ) THEN
         WORK( 1 ) = 1
         RETURN
      END IF
*
      IF( UPPER ) THEN
*
*        Reflectors come from CHETRD with UPLO = 'U'.
*
*        Move each reflector vector one column to the left. Columns
*        are visited left to right so that column j+1 is read before
*        it is overwritten. The last row and column of Q are set to
*        those of the unit matrix.
*
         DO JCOL = 1, NM1
            DO IROW = 1, JCOL - 1
               A( IROW, JCOL ) = A( IROW, JCOL+1 )
            END DO
            A( N, JCOL ) = ZERO
         END DO
         DO IROW = 1, NM1
            A( IROW, N ) = ZERO
         END DO
         A( N, N ) = ONE
*
*        Generate Q(1:n-1,1:n-1)
*
         CALL CUNGQL( NM1, NM1, NM1, A, LDA, TAU, WORK, LWORK, IINFO )
*
      ELSE
*
*        Reflectors come from CHETRD with UPLO = 'L'.
*
*        Move each reflector vector one column to the right. Columns
*        are visited right to left so that column j-1 is read before
*        it is overwritten. The first row and column of Q are set to
*        those of the unit matrix.
*
         DO JCOL = N, 2, -1
            A( 1, JCOL ) = ZERO
            DO IROW = JCOL + 1, N
               A( IROW, JCOL ) = A( IROW, JCOL-1 )
            END DO
         END DO
         A( 1, 1 ) = ONE
         DO IROW = 2, N
            A( IROW, 1 ) = ZERO
         END DO
         IF( N.GT.1 ) THEN
*
*           Generate Q(2:n,2:n)
*
            CALL CUNGQR( NM1, NM1, NM1, A( 2, 2 ), LDA, TAU, WORK,
     $                   LWORK, IINFO )
         END IF
      END IF
      WORK( 1 ) = LWKOPT
      RETURN
*
*     End of CUNGTR
*

◆ cungtsqr()

subroutine cungtsqr	(	integer	m,
		integer	n,
		integer	mb,
		integer	nb,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldt, * )	t,
		integer	ldt,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNGTSQR

Download CUNGTSQR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNGTSQR generates an M-by-N complex matrix Q_out with orthonormal
!> columns, which are the first N columns of a product of complex unitary
!> matrices of order M which are returned by CLATSQR
!>
!>      Q_out = first_N_columns_of( Q(1)_in * Q(2)_in * ... * Q(k)_in ).
!>
!> See the documentation for CLATSQR.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. M >= N >= 0. !>
[in]	MB	!> MB is INTEGER !> The row block size used by CLATSQR to return !> arrays A and T. MB > N. !> (Note that if MB > M, then M is used instead of MB !> as the row block size). !>
[in]	NB	!> NB is INTEGER !> The column block size used by CLATSQR to return !> arrays A and T. NB >= 1. !> (Note that if NB > N, then N is used instead of NB !> as the column block size). !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> !> On entry: !> !> The elements on and above the diagonal are not accessed. !> The elements below the diagonal represent the unit !> lower-trapezoidal blocked matrix V computed by CLATSQR !> that defines the input matrices Q_in(k) (ones on the !> diagonal are not stored) (same format as the output A !> below the diagonal in CLATSQR). !> !> On exit: !> !> The array A contains an M-by-N orthonormal matrix Q_out, !> i.e the columns of A are orthogonal unit vectors. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[in]	T	!> T is COMPLEX array, !> dimension (LDT, N * NIRB) !> where NIRB = Number_of_input_row_blocks !> = MAX( 1, CEIL((M-N)/(MB-N)) ) !> Let NICB = Number_of_input_col_blocks !> = CEIL(N/NB) !> !> The upper-triangular block reflectors used to define the !> input matrices Q_in(k), k=(1:NIRB*NICB). The block !> reflectors are stored in compact form in NIRB block !> reflector sequences. Each of NIRB block reflector sequences !> is stored in a larger NB-by-N column block of T and consists !> of NICB smaller NB-by-NB upper-triangular column blocks. !> (same format as the output T in CLATSQR). !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. !> LDT >= max(1,min(NB,N)). !>
[out]	WORK	!> (workspace) COMPLEX array, dimension (MAX(2,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> The dimension of the array WORK. LWORK >= (M+NB)*N. !> If LWORK = -1, then a workspace query is assumed. !> The routine only calculates the optimal size of the WORK !> array, returns this value as the first entry of the WORK !> array, and no error message related to LWORK is issued !> by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:

!>
!> November 2019, Igor Kozachenko,
!>                Computer Science Division,
!>                University of California, Berkeley
!>
!>

Definition at line 173 of file cungtsqr.f.

      IMPLICIT NONE
*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Forms Q_out by applying the stored reflectors to an M-by-N
*     identity-like matrix held in WORK (via CLAMTSQR) and then
*     copying the result into A.
*
*     .. Scalar Arguments ..
      INTEGER           INFO, LDA, LDT, LWORK, M, N, MB, NB
*     ..
*     .. Array Arguments ..
      COMPLEX        A( LDA, * ), T( LDT, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CONE, CZERO
      PARAMETER          ( CONE = ( 1.0E+0, 0.0E+0 ),
     $                     CZERO = ( 0.0E+0, 0.0E+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LQUERY
      INTEGER            IINFO, IOFF, JCOL, LDC, LENC, LENW,
     $                   LWORKOPT, NBLOCAL
*     ..
*     .. External Subroutines ..
      EXTERNAL           CCOPY, CLAMTSQR, CLASET, XERBLA
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          CMPLX, MAX, MIN
*     ..
*     .. Executable Statements ..
*
*     Check the arguments; LWORK = -1 is a workspace query.
*
      LQUERY = LWORK.EQ.-1
      INFO = 0
      IF( M.LT.0 ) THEN
         INFO = -1
      ELSE IF( N.LT.0 .OR. M.LT.N ) THEN
         INFO = -2
      ELSE IF( MB.LE.N ) THEN
         INFO = -3
      ELSE IF( NB.LT.1 ) THEN
         INFO = -4
      ELSE IF( LDA.LT.MAX( 1, M ) ) THEN
         INFO = -6
      ELSE IF( LDT.LT.MAX( 1, MIN( NB, N ) ) ) THEN
         INFO = -8
      ELSE IF( LWORK.LT.2 .AND. .NOT.LQUERY ) THEN
         INFO = -10
      ELSE
*
*        WORK is split in two for the CLAMTSQR call: the first LENC
*        entries hold the array C(LDC,N), the next LENW entries are
*        CLAMTSQR's own workspace. NBLOCAL is the column block size
*        actually used.
*
         NBLOCAL = MIN( NB, N )
         LDC = M
         LENC = LDC*N
         LENW = N*NBLOCAL
         LWORKOPT = LENC + LENW
*
         IF( LWORK.LT.MAX( 1, LWORKOPT ) .AND. .NOT.LQUERY ) THEN
            INFO = -10
         END IF
      END IF
*
*     Report an argument error, or answer the workspace query.
*
      IF( INFO.NE.0 ) THEN
         CALL XERBLA( 'CUNGTSQR', -INFO )
         RETURN
      END IF
      IF( LQUERY ) THEN
         WORK( 1 ) = CMPLX( LWORKOPT )
         RETURN
      END IF
*
*     Nothing to compute for an empty matrix
*
      IF( MIN( M, N ).EQ.0 ) THEN
         WORK( 1 ) = CMPLX( LWORKOPT )
         RETURN
      END IF
*
*     (1) Form explicitly the tall-skinny M-by-N left submatrix Q1_in
*     of the M-by-M matrix Q_in, which is stored implicitly in the
*     subdiagonal part of A and in T:
*
*         Q1_in = Q_in * ( I ), where I is a N-by-N identity matrix,
*                        ( 0 )        0 is a (M-N)-by-N zero matrix.
*
*     (1a) Fill WORK(1:LDC*N) with an M-by-N matrix that has ones on
*     the diagonal and zeros elsewhere.
*
      CALL CLASET( 'F', M, N, CZERO, CONE, WORK, LDC )
*
*     (1b) Apply Q_in from the left; on return WORK(1:LDC*N) holds
*     Q1_in.
*
      CALL CLAMTSQR( 'L', 'N', M, N, N, MB, NBLOCAL, A, LDA, T, LDT,
     $               WORK, LDC, WORK( LENC+1 ), LENW, IINFO )
*
*     (2) Copy the M-by-N result from WORK (leading dimension LDC)
*     into A(1:M,1:N), one column at a time. IOFF is the position in
*     WORK of the first entry of the current column.
*
      IOFF = 1
      DO JCOL = 1, N
         CALL CCOPY( M, WORK( IOFF ), 1, A( 1, JCOL ), 1 )
         IOFF = IOFF + LDC
      END DO
*
      WORK( 1 ) = CMPLX( LWORKOPT )
      RETURN
*
*     End of CUNGTSQR
*

◆ cungtsqr_row()

subroutine cungtsqr_row	(	integer	m,
		integer	n,
		integer	mb,
		integer	nb,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldt, * )	t,
		integer	ldt,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNGTSQR_ROW

Download CUNGTSQR_ROW + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNGTSQR_ROW generates an M-by-N complex matrix Q_out with
!> orthonormal columns from the output of CLATSQR. These N orthonormal
!> columns are the first N columns of a product of complex unitary
!> matrices Q(k)_in of order M, which are returned by CLATSQR in
!> a special format.
!>
!>      Q_out = first_N_columns_of( Q(1)_in * Q(2)_in * ... * Q(k)_in ).
!>
!> The input matrices Q(k)_in are stored in row and column blocks in A.
!> See the documentation of CLATSQR for more details on the format of
!> Q(k)_in, where each Q(k)_in is represented by block Householder
!> transformations. This routine calls an auxiliary routine CLARFB_GETT,
!> where the computation is performed on each individual block. The
!> algorithm first sweeps NB-sized column blocks from the right to left
!> starting in the bottom row block and continues to the top row block
!> (hence _ROW in the routine name). This sweep is in reverse order of
!> the order in which CLATSQR generates the output blocks.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. M >= N >= 0. !>
[in]	MB	!> MB is INTEGER !> The row block size used by CLATSQR to return !> arrays A and T. MB > N. !> (Note that if MB > M, then M is used instead of MB !> as the row block size). !>
[in]	NB	!> NB is INTEGER !> The column block size used by CLATSQR to return !> arrays A and T. NB >= 1. !> (Note that if NB > N, then N is used instead of NB !> as the column block size). !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> !> On entry: !> !> The elements on and above the diagonal are not used as !> input. The elements below the diagonal represent the unit !> lower-trapezoidal blocked matrix V computed by CLATSQR !> that defines the input matrices Q_in(k) (ones on the !> diagonal are not stored). See CLATSQR for more details. !> !> On exit: !> !> The array A contains an M-by-N orthonormal matrix Q_out, !> i.e the columns of A are orthogonal unit vectors. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[in]	T	!> T is COMPLEX array, !> dimension (LDT, N * NIRB) !> where NIRB = Number_of_input_row_blocks !> = MAX( 1, CEIL((M-N)/(MB-N)) ) !> Let NICB = Number_of_input_col_blocks !> = CEIL(N/NB) !> !> The upper-triangular block reflectors used to define the !> input matrices Q_in(k), k=(1:NIRB*NICB). The block !> reflectors are stored in compact form in NIRB block !> reflector sequences. Each of the NIRB block reflector !> sequences is stored in a larger NB-by-N column block of T !> and consists of NICB smaller NB-by-NB upper-triangular !> column blocks. See CLATSQR for more details on the format !> of T. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. !> LDT >= max(1,min(NB,N)). !>
[out]	WORK	!> (workspace) COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> The dimension of the array WORK. !> LWORK >= NBLOCAL * MAX(NBLOCAL,(N-NBLOCAL)), !> where NBLOCAL=MIN(NB,N). !> If LWORK = -1, then a workspace query is assumed. !> The routine only calculates the optimal size of the WORK !> array, returns this value as the first entry of the WORK !> array, and no error message related to LWORK is issued !> by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:

!>
!> November 2020, Igor Kozachenko,
!>                Computer Science Division,
!>                University of California, Berkeley
!>
!>

Definition at line 186 of file cungtsqr_row.f.

      IMPLICIT NONE
*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Generates Q_out in place in A by sweeping the row blocks of A
*     from bottom to top and, inside each row block, the column block
*     reflectors from right to left, calling CLARFB_GETT on each
*     block. WORK is passed to CLARFB_GETT as scratch space.
*
*     INFO = -10 is returned when LWORK is not a workspace query and
*     is smaller than MAX(1, NBLOCAL*MAX(NBLOCAL,N-NBLOCAL)), the
*     documented minimum, so that an undersized WORK is never handed
*     to CLARFB_GETT.
*
*     .. Scalar Arguments ..
      INTEGER           INFO, LDA, LDT, LWORK, M, N, MB, NB
*     ..
*     .. Array Arguments ..
      COMPLEX           A( LDA, * ), T( LDT, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CONE, CZERO
      parameter( cone = ( 1.0e+0, 0.0e+0 ),
     $                     czero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LQUERY
      INTEGER            NBLOCAL, MB2, M_PLUS_ONE, ITMP, IB_BOTTOM,
     $                   LWORKOPT, NUM_ALL_ROW_BLOCKS, JB_T, IB, IMB,
     $                   KB, KB_LAST, KNB, MB1
*     ..
*     .. Local Arrays ..
      COMPLEX            DUMMY( 1, 1 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarfb_gett, claset, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          cmplx, max, min
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters
*
      info = 0
      lquery  = lwork.EQ.-1
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 .OR. m.LT.n ) THEN
         info = -2
      ELSE IF( mb.LE.n ) THEN
         info = -3
      ELSE IF( nb.LT.1 ) THEN
         info = -4
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -6
      ELSE IF( ldt.LT.max( 1, min( nb, n ) ) ) THEN
         info = -8
      ELSE IF( lwork.LT.1 .AND. .NOT.lquery ) THEN
         info = -10
      END IF
*
*     NBLOCAL is the column block size actually used.
*
      nblocal = min( nb, n )
*
*     Determine the workspace size and, unless this is a workspace
*     query, reject an LWORK below the documented minimum.
*
      IF( info.EQ.0 ) THEN
         lworkopt = nblocal * max( nblocal, ( n - nblocal ) )
         IF( lwork.LT.max( 1, lworkopt ) .AND. .NOT.lquery ) THEN
            info = -10
         END IF
      END IF
*
*     Handle error in the input parameters and handle the workspace query.
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNGTSQR_ROW', -info )
         RETURN
      ELSE IF ( lquery ) THEN
         work( 1 ) = cmplx( lworkopt )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( min( m, n ).EQ.0 ) THEN
         work( 1 ) = cmplx( lworkopt )
         RETURN
      END IF
*
*     (0) Set the upper-triangular part of the matrix A to zero and
*     its diagonal elements to one.
*
      CALL claset('U', m, n, czero, cone, a, lda )
*
*     KB_LAST is the column index of the last column block reflector
*     in the matrices T and V.
*
      kb_last = ( ( n-1 ) / nblocal ) * nblocal + 1
*
*
*     (1) Bottom-up loop over row blocks of A, except the top row block.
*     NOTE: If MB>=M, then the loop is never executed.
*
      IF ( mb.LT.m ) THEN
*
*        MB2 is the row blocking size for the row blocks before the
*        first top row block in the matrix A. IB is the row index for
*        the row blocks in the matrix A before the first top row block.
*        IB_BOTTOM is the row index for the last bottom row block
*        in the matrix A. JB_T is the column index of the corresponding
*        column block in the matrix T.
*
*        Initialize variables.
*
*        NUM_ALL_ROW_BLOCKS is the number of row blocks in the matrix A
*        including the first row block.
*
         mb2 = mb - n
         m_plus_one = m + 1
         itmp = ( m - mb - 1 ) / mb2
         ib_bottom = itmp * mb2 + mb + 1
         num_all_row_blocks = itmp + 2
         jb_t = num_all_row_blocks * n + 1
*
         DO ib = ib_bottom, mb+1, -mb2
*
*           Determine the block size IMB for the current row block
*           in the matrix A.
*
            imb = min( m_plus_one - ib, mb2 )
*
*           Determine the column index JB_T for the current column block
*           in the matrix T.
*
            jb_t = jb_t - n
*
*           Apply column blocks of H in the row block from right to left.
*
*           KB is the column index of the current column block reflector
*           in the matrices T and V.
*
            DO kb = kb_last, 1, -nblocal
*
*              Determine the size of the current column block KNB in
*              the matrices T and V.
*
               knb = min( nblocal, n - kb + 1 )
*
               CALL clarfb_gett( 'I', imb, n-kb+1, knb,
     $                     t( 1, jb_t+kb-1 ), ldt, a( kb, kb ), lda,
     $                     a( ib, kb ), lda, work, knb )
*
            END DO
*
         END DO
*
      END IF
*
*     (2) Top row block of A.
*     NOTE: If MB>=M, then we have only one row block of A of size M
*     and we work on the entire matrix A.
*
      mb1 = min( mb, m )
*
*     Apply column blocks of H in the top row block from right to left.
*
*     KB is the column index of the current block reflector in
*     the matrices T and V.
*
      DO kb = kb_last, 1, -nblocal
*
*        Determine the size of the current column block KNB in
*        the matrices T and V.
*
         knb = min( nblocal, n - kb + 1 )
*
         IF( mb1-kb-knb+1.EQ.0 ) THEN
*
*           In CLARFB_GETT parameters, when M=0, then the matrix B
*           does not exist, hence we need to pass a dummy array
*           reference DUMMY(1,1) to B with LDDUMMY=1.
*
            CALL clarfb_gett( 'N', 0, n-kb+1, knb,
     $                        t( 1, kb ), ldt, a( kb, kb ), lda,
     $                        dummy( 1, 1 ), 1, work, knb )
         ELSE
            CALL clarfb_gett( 'N', mb1-kb-knb+1, n-kb+1, knb,
     $                        t( 1, kb ), ldt, a( kb, kb ), lda,
     $                        a( kb+knb, kb), lda, work, knb )
*
         END IF
*
      END DO
*
      work( 1 ) = cmplx( lworkopt )
      RETURN
*
*     End of CUNGTSQR_ROW
*

◆ cunhr_col()

subroutine cunhr_col	(	integer	m,
		integer	n,
		integer	nb,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( ldt, * )	t,
		integer	ldt,
		complex, dimension( * )	d,
		integer	info )

CUNHR_COL

Download CUNHR_COL + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!>  CUNHR_COL takes an M-by-N complex matrix Q_in with orthonormal columns
!>  as input, stored in A, and performs Householder Reconstruction (HR),
!>  i.e. reconstructs Householder vectors V(i) implicitly representing
!>  another M-by-N matrix Q_out, with the property that Q_in = Q_out*S,
!>  where S is an N-by-N diagonal matrix with diagonal entries
!>  equal to +1 or -1. The Householder vectors (columns V(i) of V) are
!>  stored in A on output, and the diagonal entries of S are stored in D.
!>  Block reflectors are also returned in T
!>  (same output format as CGEQRT).
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. M >= N >= 0. !>
[in]	NB	!> NB is INTEGER !> The column block size to be used in the reconstruction !> of Householder column vector blocks in the array A and !> corresponding block reflectors in the array T. NB >= 1. !> (Note that if NB > N, then N is used instead of NB !> as the column block size.) !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> !> On entry: !> !> The array A contains an M-by-N orthonormal matrix Q_in, !> i.e. the columns of A are orthogonal unit vectors. !> !> On exit: !> !> The elements below the diagonal of A represent the unit !> lower-trapezoidal matrix V of Householder column vectors !> V(i). The unit diagonal entries of V are not stored !> (same format as the output below the diagonal in A from !> CGEQRT). The matrix T and the matrix V stored on output !> in A implicitly define Q_out. !> !> The elements above the diagonal contain the factor U !> of the LU-decomposition: !> Q_in - ( S ) = V * U !> ( 0 ) !> where 0 is a (M-N)-by-N zero matrix. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	T	!> T is COMPLEX array, !> dimension (LDT, N) !> !> Let NOCB = Number_of_output_col_blocks !> = CEIL(N/NB) !> !> On exit, T(1:NB, 1:N) contains NOCB upper-triangular !> block reflectors used to define Q_out stored in compact !> form as a sequence of upper-triangular NB-by-NB column !> blocks (same format as the output T in CGEQRT). !> The matrix T and the matrix V stored on output in A !> implicitly define Q_out. NOTE: The lower triangles !> below the upper-triangular blocks will be filled with !> zeros. See Further Details. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. !> LDT >= max(1,min(NB,N)). !>
[out]	D	!> D is COMPLEX array, dimension min(M,N). !> The elements can be only plus or minus one. !> !> D(i) is constructed as D(i) = -SIGN(Q_in_i(i,i)), where !> 1 <= i <= min(M,N), and Q_in_i is Q_in after performing !> i-1 steps of “modified” Gaussian elimination. !> See Further Details. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Further Details:

!>
!> The computed M-by-M unitary factor Q_out is defined implicitly as
!> a product of unitary matrices Q_out(i). Each Q_out(i) is stored in
!> the compact WY-representation format in the corresponding blocks of
!> matrices V (stored in A) and T.
!>
!> The M-by-N unit lower-trapezoidal matrix V stored in the M-by-N
!> matrix A contains the column vectors V(i) in NB-size column
!> blocks VB(j). For example, VB(1) contains the columns
!> V(1), V(2), ... V(NB). NOTE: The unit entries on
!> the diagonal of V are not stored in A.
!>
!> The number of column blocks is
!>
!>     NOCB = Number_of_output_col_blocks = CEIL(N/NB)
!>
!> where each block is of order NB except for the last block, which
!> is of order LAST_NB = N - (NOCB-1)*NB.
!>
!> For example, if M=6,  N=5 and NB=2, the matrix V is
!>
!>
!>     V = (    VB(1),   VB(2), VB(3) ) =
!>
!>       = (   1                      )
!>         ( v21    1                 )
!>         ( v31  v32    1            )
!>         ( v41  v42  v43   1        )
!>         ( v51  v52  v53  v54    1  )
!>         ( v61  v62  v63  v64   v65 )
!>
!>
!> For each of the column blocks VB(i), an upper-triangular block
!> reflector TB(i) is computed. These blocks are stored as
!> a sequence of upper-triangular column blocks in the NB-by-N
!> matrix T. The size of each TB(i) block is NB-by-NB, except
!> for the last block, whose size is LAST_NB-by-LAST_NB.
!>
!> For example, if M=6,  N=5 and NB=2, the matrix T is
!>
!>     T  = (    TB(1),    TB(2), TB(3) ) =
!>
!>        = ( t11  t12  t13  t14   t15  )
!>          (      t22       t24        )
!>
!>
!> The M-by-M factor Q_out is given as a product of NOCB
!> unitary M-by-M matrices Q_out(i).
!>
!>     Q_out = Q_out(1) * Q_out(2) * ... * Q_out(NOCB),
!>
!> where each matrix Q_out(i) is given by the WY-representation
!> using corresponding blocks from the matrices V and T:
!>
!>     Q_out(i) = I - VB(i) * TB(i) * (VB(i))**H,
!>
!> where I is the identity matrix. Here is the formula with matrix
!> dimensions:
!>
!>  Q(i){M-by-M} = I{M-by-M} -
!>    VB(i){M-by-INB} * TB(i){INB-by-INB} * (VB(i))**H {INB-by-M},
!>
!> where INB = NB, except for the last block NOCB
!> for which INB=LAST_NB.
!>
!> =====
!> NOTE:
!> =====
!>
!> If Q_in is the result of doing a QR factorization
!> B = Q_in * R_in, then:
!>
!> B = (Q_out*S) * R_in = Q_out * (S * R_in) = Q_out * R_out.
!>
!> So if one wants to interpret Q_out as the result
!> of the QR factorization of B, then the corresponding R_out
!> should be equal to R_out = S * R_in, i.e. some rows of R_in
!> should be multiplied by -1.
!>
!> For the details of the algorithm, see [1].
!>
!> [1] "Reconstructing Householder vectors from tall-skinny QR",
!>     G. Ballard, J. Demmel, L. Grigori, M. Jacquelin, H.D. Nguyen,
!>     E. Solomonik, J. Parallel Distrib. Comput.,
!>     vol. 85, pp. 3-31, 2015.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:

!>
!> November   2019, Igor Kozachenko,
!>            Computer Science Division,
!>            University of California, Berkeley
!>
!>

Definition at line 258 of file cunhr_col.f.

      IMPLICIT NONE
*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Householder reconstruction for an M-by-N matrix with orthonormal
*     columns held in A.  The routine
*       (1) factors A in place with CLAUNHR_COL_GETRFNP (which also
*           fills D) and solves for the rows N+1:M with CTRSM;
*       (2) builds, NB columns at a time, the upper-triangular blocks
*           of T from the diagonal blocks of the factor stored in A
*           and the entries of D.
*
*     Arguments:
*       M, N   (in)     row / column counts, M >= N >= 0.
*       NB     (in)     column block size, NB >= 1.
*       A      (in/out) LDA-by-N array, overwritten by the factors.
*       LDA    (in)     leading dimension of A, LDA >= max(1,M).
*       T      (out)    LDT-by-N array receiving the block reflectors.
*       LDT    (in)     leading dimension of T,
*                       LDT >= max(1,min(NB,N)).
*       D      (out)    diagonal of the sign matrix S.
*       INFO   (out)    0 on success, -i if argument i is illegal.
*
*     .. Scalar Arguments ..
      INTEGER           INFO, LDA, LDT, M, N, NB
*     ..
*     .. Array Arguments ..
      COMPLEX           A( LDA, * ), D( * ), T( LDT, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CONE, CZERO
      parameter( cone = ( 1.0e+0, 0.0e+0 ),
     $                     czero = ( 0.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      INTEGER            I, IINFO, J, JB, JBTEMP1, JBTEMP2, JNB,
     $                   NPLUSONE
*     ..
*     .. External Subroutines ..
      EXTERNAL           ccopy, claunhr_col_getrfnp, cscal, ctrsm,
     $                   xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.  The first failing test decides INFO.
*
      info = 0
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 .OR. n.GT.m ) THEN
         info = -2
      ELSE IF( nb.LT.1 ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -5
      ELSE IF( ldt.LT.max( 1, min( nb, n ) ) ) THEN
         info = -7
      END IF
*
*     Handle error in the input parameters.
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNHR_COL', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( min( m, n ).EQ.0 ) THEN
         RETURN
      END IF
*
*     On input, the M-by-N matrix A contains the unitary
*     M-by-N matrix Q_in.
*
*     (1) Compute the unit lower-trapezoidal V (ones on the diagonal
*     are not stored) by performing the "modified" LU-decomposition.
*
*     Q_in - ( S ) = V * U = ( V1 ) * U,
*            ( 0 )           ( V2 )
*
*     where 0 is an (M-N)-by-N zero matrix.
*
*     (1-1) Factor V1 and U.
*
      CALL claunhr_col_getrfnp( n, n, a, lda, d, iinfo )
*
*     (1-2) Solve for V2:  V2 * U = A(N+1:M,1:N), U upper triangular
*     and non-unit, stored in the upper triangle of A(1:N,1:N).
*
      IF( m.GT.n ) THEN
         CALL ctrsm( 'R', 'U', 'N', 'N', m-n, n, cone, a, lda,
     $               a( n+1, 1 ), lda )
      END IF
*
*     (2) Reconstruct the block reflector T stored in T(1:NB, 1:N)
*     as a sequence of upper-triangular blocks with NB-size column
*     blocking.
*
*     Loop over the column blocks of size NB of the array A(1:M,1:N)
*     and the array T(1:NB,1:N), JB is the column index of a column
*     block, JNB is the column block size at each step JB.
*
      nplusone = n + 1
      DO jb = 1, n, nb
*
*        (2-0) Determine the column block size JNB.
*
         jnb = min( nplusone-jb, nb )
*
*        (2-1) Copy the upper-triangular part of the current JNB-by-JNB
*        diagonal block U(JB) (of the N-by-N matrix U) stored
*        in A(JB:JB+JNB-1,JB:JB+JNB-1) into the upper-triangular part
*        of the current JNB-by-JNB block T(1:JNB,JB:JB+JNB-1)
*        column-by-column, total JNB*(JNB+1)/2 elements.
*
         jbtemp1 = jb - 1
         DO j = jb, jb+jnb-1
            CALL ccopy( j-jbtemp1, a( jb, j ), 1, t( 1, j ), 1 )
         END DO
*
*        (2-2) Perform on the upper-triangular part of the current
*        JNB-by-JNB diagonal block U(JB) stored in T(1:JNB,JB:JB+JNB-1)
*        the operation (-1)*U(JB)*S(JB) in place.  S is diagonal, so
*        this only flips the sign of a column: column J is negated
*        when D(J) equals +1 and left untouched otherwise.
*
         DO j = jb, jb+jnb-1
            IF( d( j ).EQ.cone ) THEN
               CALL cscal( j-jbtemp1, -cone, t( 1, j ), 1 )
            END IF
         END DO
*
*        (2-3) Perform the triangular solve for the current block
*        matrix X(JB):
*
*               X(JB) * (A(JB)**H) = B(JB), where:
*
*               A(JB)**H  is a JNB-by-JNB unit upper-triangular
*                         coefficient block, and A(JB)=V1(JB), which
*                         is a JNB-by-JNB unit lower-triangular block
*                         stored in A(JB:JB+JNB-1,JB:JB+JNB-1).
*                         The N-by-N matrix V1 is the upper part
*                         of the M-by-N lower-trapezoidal matrix V
*                         stored in A(1:M,1:N);
*
*               B(JB)     is a JNB-by-JNB  upper-triangular right-hand
*                         side block, B(JB) = (-1)*U(JB)*S(JB), and
*                         B(JB) is stored in T(1:JNB,JB:JB+JNB-1);
*
*               X(JB)     is a JNB-by-JNB upper-triangular solution
*                         block, X(JB) is the upper-triangular block
*                         reflector T(JB), and X(JB) is stored
*                         in T(1:JNB,JB:JB+JNB-1).
*
*             In other words, we perform the triangular solve for the
*             upper-triangular block T(JB):
*
*               T(JB) * (V1(JB)**H) = (-1)*U(JB)*S(JB).
*
*             Even though the blocks X(JB) and B(JB) are upper-
*             triangular, the routine CTRSM will access all JNB**2
*             elements of the square T(1:JNB,JB:JB+JNB-1). Therefore,
*             we need to set to zero the elements of the block
*             T(1:JNB,JB:JB+JNB-1) below the diagonal before the call
*             to CTRSM.
*
*        (2-3a) Set the elements to zero.
*
*        The row loop stops at MIN(NB,N), not NB: T is only required
*        to have LDT >= MAX(1,MIN(NB,N)) rows, so with NB > N a loop
*        up to NB would write past row LDT, clobbering the entries of
*        the following column copied in step (2-1) and possibly memory
*        beyond T.  For NB <= N the bound is NB as before.
*
         jbtemp2 = jb - 2
         DO j = jb, jb+jnb-2
            DO i = j-jbtemp2, min( nb, n )
               t( i, j ) = czero
            END DO
         END DO
*
*        (2-3b) Perform the triangular solve.
*
         CALL ctrsm( 'R', 'L', 'C', 'U', jnb, jnb, cone,
     $               a( jb, jb ), lda, t( 1, jb ), ldt )
*
      END DO
*
      RETURN
*
*     End of CUNHR_COL
*

◆ cunm22()

subroutine cunm22	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	n1,
		integer	n2,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNM22 multiplies a general matrix by a banded unitary matrix.

Download CUNM22 + dependencies [TGZ] [ZIP] [TXT]

Purpose

!>
!>  CUNM22 overwrites the general complex M-by-N matrix C with
!>
!>                  SIDE = 'L'     SIDE = 'R'
!>  TRANS = 'N':      Q * C          C * Q
!>  TRANS = 'C':      Q**H * C       C * Q**H
!>
!>  where Q is a complex unitary matrix of order NQ, with NQ = M if
!>  SIDE = 'L' and NQ = N if SIDE = 'R'.
!>  The unitary matrix Q possesses a 2-by-2 block structure
!>
!>         [  Q11  Q12  ]
!>     Q = [            ]
!>         [  Q21  Q22  ],
!>
!>  where Q12 is an N1-by-N1 lower triangular matrix and Q21 is an
!>  N2-by-N2 upper triangular matrix.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left; !> = 'R': apply Q or Q**H from the Right. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': apply Q (No transpose); !> = 'C': apply Q**H (Conjugate transpose). !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	N1
[in]	N2	!> N1 is INTEGER !> N2 is INTEGER !> The dimension of Q12 and Q21, respectively. N1, N2 >= 0. !> The following requirement must be satisfied: !> N1 + N2 = M if SIDE = 'L' and N1 + N2 = N if SIDE = 'R'. !>
[in]	Q	!> Q is COMPLEX array, dimension !> (LDQ,M) if SIDE = 'L' !> (LDQ,N) if SIDE = 'R' !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. !> LDQ >= max(1,M) if SIDE = 'L'; LDQ >= max(1,N) if SIDE = 'R'. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If SIDE = 'L', LWORK >= max(1,M); !> if SIDE = 'R', LWORK >= max(1,N) !> (LWORK >= 1 suffices when N1 = 0 or N2 = 0). !> For optimum performance LWORK >= M*N. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 160 of file cunm22.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Overwrite the M-by-N matrix C with Q*C, Q**H*C, C*Q or C*Q**H,
*     where Q is partitioned as
*
*            [  Q11  Q12  ]      Q11 = Q( 1:N1,    1:N2    )
*        Q = [            ]      Q12 = Q( 1:N1,    N2+1:NQ ) lower tri.
*            [  Q21  Q22  ],     Q21 = Q( N1+1:NQ, 1:N2    ) upper tri.
*                                Q22 = Q( N1+1:NQ, N2+1:NQ )
*
*     C is processed in chunks of NB columns (SIDE = 'L') or NB rows
*     (SIDE = 'R'); each chunk of the product is assembled in WORK by
*     two CTRMM and two CGEMM calls and then copied back into C.
*
*     Arguments:
*       SIDE, TRANS (in)     'L'/'R' and 'N'/'C' select the product.
*       M, N        (in)     dimensions of C.
*       N1, N2      (in)     orders of Q12 and Q21, N1 + N2 = NQ.
*       Q, LDQ      (in)     the matrix Q and its leading dimension.
*       C, LDC      (in/out) the matrix C and its leading dimension.
*       WORK        (out)    workspace; WORK(1) returns the optimal
*                            LWORK when INFO = 0.
*       LWORK       (in)     length of WORK, or -1 for a size query.
*       INFO        (out)    0 on success, -i if argument i is illegal.
*
      IMPLICIT NONE
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            M, N, N1, N2, LDQ, LDC, LWORK, INFO
*     ..
*     .. Array Arguments ..
      COMPLEX            Q( LDQ, * ), C( LDC, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE
      parameter( one = ( 1.0e+0, 0.0e+0 ) )
*
*     .. Local Scalars ..
      LOGICAL            LEFT, LQUERY, NOTRAN
      INTEGER            I, LDWORK, LEN, LWKOPT, NB, NQ, NW
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgemm, clacpy, ctrmm, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          cmplx, max, min
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      info = 0
      left = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
      lquery = ( lwork.EQ.-1 )
*
*     NQ is the order of Q;
*     NW is the minimum dimension of WORK.
*
      IF( left ) THEN
         nq = m
      ELSE
         nq = n
      END IF
      nw = nq
      IF( n1.EQ.0 .OR. n2.EQ.0 ) nw = 1
      IF( .NOT.left .AND. .NOT.lsame( side, 'R' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'C' ) ) THEN
         info = -2
      ELSE IF( m.LT.0 ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( n1.LT.0 .OR. n1+n2.NE.nq ) THEN
         info = -5
      ELSE IF( n2.LT.0 ) THEN
         info = -6
      ELSE IF( ldq.LT.max( 1, nq ) ) THEN
         info = -8
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -10
      ELSE IF( lwork.LT.nw .AND. .NOT.lquery ) THEN
         info = -12
      END IF
*
      IF( info.EQ.0 ) THEN
*
*        Never report less than the minimum NW enforced above.  When
*        C is empty, M*N is 0; a caller sizing WORK from such a query
*        result would then be rejected with INFO = -12.  For M, N > 0
*        we have M*N >= NQ >= NW, so the reported value is unchanged.
*
         lwkopt = max( nw, m*n )
         work( 1 ) = cmplx( lwkopt )
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNM22', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.EQ.0 .OR. n.EQ.0 ) THEN
         work( 1 ) = 1
         RETURN
      END IF
*
*     Degenerate cases (N1 = 0 or N2 = 0) are handled using CTRMM.
*
      IF( n1.EQ.0 ) THEN
         CALL ctrmm( side, 'Upper', trans, 'Non-Unit', m, n, one,
     $               q, ldq, c, ldc )
         work( 1 ) = one
         RETURN
      ELSE IF( n2.EQ.0 ) THEN
         CALL ctrmm( side, 'Lower', trans, 'Non-Unit', m, n, one,
     $               q, ldq, c, ldc )
         work( 1 ) = one
         RETURN
      END IF
*
*     Compute the largest chunk size available from the workspace.
*
      nb = max( 1, min( lwork, lwkopt ) / nq )
*
      IF( left ) THEN
*
*        SIDE = 'L': WORK holds an M-by-LEN panel (LDWORK = M) for
*        columns I:I+LEN-1 of C.
*
         IF( notran ) THEN
            DO i = 1, n, nb
               len = min( nb, n-i+1 )
               ldwork = m
*
*              Multiply bottom part of C by Q12.
*
               CALL clacpy( 'All', n1, len, c( n2+1, i ), ldc, work,
     $                      ldwork )
               CALL ctrmm( 'Left', 'Lower', 'No Transpose', 'Non-Unit',
     $                     n1, len, one, q( 1, n2+1 ), ldq, work,
     $                     ldwork )
*
*              Multiply top part of C by Q11.
*
               CALL cgemm( 'No Transpose', 'No Transpose', n1, len, n2,
     $                     one, q, ldq, c( 1, i ), ldc, one, work,
     $                     ldwork )
*
*              Multiply top part of C by Q21.
*
               CALL clacpy( 'All', n2, len, c( 1, i ), ldc,
     $                      work( n1+1 ), ldwork )
               CALL ctrmm( 'Left', 'Upper', 'No Transpose', 'Non-Unit',
     $                     n2, len, one, q( n1+1, 1 ), ldq,
     $                     work( n1+1 ), ldwork )
*
*              Multiply bottom part of C by Q22.
*
               CALL cgemm( 'No Transpose', 'No Transpose', n2, len, n1,
     $                     one, q( n1+1, n2+1 ), ldq, c( n2+1, i ), ldc,
     $                     one, work( n1+1 ), ldwork )
*
*              Copy everything back.
*
               CALL clacpy( 'All', m, len, work, ldwork, c( 1, i ),
     $                      ldc )
            END DO
         ELSE
            DO i = 1, n, nb
               len = min( nb, n-i+1 )
               ldwork = m
*
*              Multiply bottom part of C by Q21**H.
*
               CALL clacpy( 'All', n2, len, c( n1+1, i ), ldc, work,
     $                      ldwork )
               CALL ctrmm( 'Left', 'Upper', 'Conjugate', 'Non-Unit',
     $                     n2, len, one, q( n1+1, 1 ), ldq, work,
     $                     ldwork )
*
*              Multiply top part of C by Q11**H.
*
               CALL cgemm( 'Conjugate', 'No Transpose', n2, len, n1,
     $                     one, q, ldq, c( 1, i ), ldc, one, work,
     $                     ldwork )
*
*              Multiply top part of C by Q12**H.
*
               CALL clacpy( 'All', n1, len, c( 1, i ), ldc,
     $                      work( n2+1 ), ldwork )
               CALL ctrmm( 'Left', 'Lower', 'Conjugate', 'Non-Unit',
     $                     n1, len, one, q( 1, n2+1 ), ldq,
     $                     work( n2+1 ), ldwork )
*
*              Multiply bottom part of C by Q22**H.
*
               CALL cgemm( 'Conjugate', 'No Transpose', n1, len, n2,
     $                     one, q( n1+1, n2+1 ), ldq, c( n1+1, i ), ldc,
     $                     one, work( n2+1 ), ldwork )
*
*              Copy everything back.
*
               CALL clacpy( 'All', m, len, work, ldwork, c( 1, i ),
     $                      ldc )
            END DO
         END IF
      ELSE
*
*        SIDE = 'R': WORK holds a LEN-by-N panel (LDWORK = LEN) for
*        rows I:I+LEN-1 of C.
*
         IF( notran ) THEN
            DO i = 1, m, nb
               len = min( nb, m-i+1 )
               ldwork = len
*
*              Multiply right part of C by Q21.
*
               CALL clacpy( 'All', len, n2, c( i, n1+1 ), ldc, work,
     $                      ldwork )
               CALL ctrmm( 'Right', 'Upper', 'No Transpose', 'Non-Unit',
     $                     len, n2, one, q( n1+1, 1 ), ldq, work,
     $                     ldwork )
*
*              Multiply left part of C by Q11.
*
               CALL cgemm( 'No Transpose', 'No Transpose', len, n2, n1,
     $                     one, c( i, 1 ), ldc, q, ldq, one, work,
     $                     ldwork )
*
*              Multiply left part of C by Q12.
*
               CALL clacpy( 'All', len, n1, c( i, 1 ), ldc,
     $                      work( 1 + n2*ldwork ), ldwork )
               CALL ctrmm( 'Right', 'Lower', 'No Transpose', 'Non-Unit',
     $                     len, n1, one, q( 1, n2+1 ), ldq,
     $                     work( 1 + n2*ldwork ), ldwork )
*
*              Multiply right part of C by Q22.
*
               CALL cgemm( 'No Transpose', 'No Transpose', len, n1, n2,
     $                     one, c( i, n1+1 ), ldc, q( n1+1, n2+1 ), ldq,
     $                     one, work( 1 + n2*ldwork ), ldwork )
*
*              Copy everything back.
*
               CALL clacpy( 'All', len, n, work, ldwork, c( i, 1 ),
     $                      ldc )
            END DO
         ELSE
            DO i = 1, m, nb
               len = min( nb, m-i+1 )
               ldwork = len
*
*              Multiply right part of C by Q12**H.
*
               CALL clacpy( 'All', len, n1, c( i, n2+1 ), ldc, work,
     $                      ldwork )
               CALL ctrmm( 'Right', 'Lower', 'Conjugate', 'Non-Unit',
     $                     len, n1, one, q( 1, n2+1 ), ldq, work,
     $                     ldwork )
*
*              Multiply left part of C by Q11**H.
*
               CALL cgemm( 'No Transpose', 'Conjugate', len, n1, n2,
     $                     one, c( i, 1 ), ldc, q, ldq, one, work,
     $                     ldwork )
*
*              Multiply left part of C by Q21**H.
*
               CALL clacpy( 'All', len, n2, c( i, 1 ), ldc,
     $                      work( 1 + n1*ldwork ), ldwork )
               CALL ctrmm( 'Right', 'Upper', 'Conjugate', 'Non-Unit',
     $                     len, n2, one, q( n1+1, 1 ), ldq,
     $                     work( 1 + n1*ldwork ), ldwork )
*
*              Multiply right part of C by Q22**H.
*
               CALL cgemm( 'No Transpose', 'Conjugate', len, n2, n1,
     $                     one, c( i, n2+1 ), ldc, q( n1+1, n2+1 ), ldq,
     $                     one, work( 1 + n1*ldwork ), ldwork )
*
*              Copy everything back.
*
               CALL clacpy( 'All', len, n, work, ldwork, c( i, 1 ),
     $                      ldc )
            END DO
         END IF
      END IF
*
      work( 1 ) = cmplx( lwkopt )
      RETURN
*
*     End of CUNM22
*

◆ cunm2l()

subroutine cunm2l	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	info )

CUNM2L multiplies a general matrix by the unitary matrix from a QL factorization determined by cgeqlf (unblocked algorithm).

Download CUNM2L + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNM2L overwrites the general complex m-by-n matrix C with
!>
!>       Q * C  if SIDE = 'L' and TRANS = 'N', or
!>
!>       Q**H* C  if SIDE = 'L' and TRANS = 'C', or
!>
!>       C * Q  if SIDE = 'R' and TRANS = 'N', or
!>
!>       C * Q**H if SIDE = 'R' and TRANS = 'C',
!>
!> where Q is a complex unitary matrix defined as the product of k
!> elementary reflectors
!>
!>       Q = H(k) . . . H(2) H(1)
!>
!> as returned by CGEQLF. Q is of order m if SIDE = 'L' and of order n
!> if SIDE = 'R'.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left !> = 'R': apply Q or Q**H from the Right !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': apply Q (No transpose) !> = 'C': apply Q**H (Conjugate transpose) !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines !> the matrix Q. !> If SIDE = 'L', M >= K >= 0; !> if SIDE = 'R', N >= K >= 0. !>
[in]	A	!> A is COMPLEX array, dimension (LDA,K) !> The i-th column must contain the vector which defines the !> elementary reflector H(i), for i = 1,2,...,k, as returned by !> CGEQLF in the last k columns of its array argument A. !> A is modified by the routine but restored on exit. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. !> If SIDE = 'L', LDA >= max(1,M); !> if SIDE = 'R', LDA >= max(1,N). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGEQLF. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the m-by-n matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension !> (N) if SIDE = 'L', !> (M) if SIDE = 'R' !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 157 of file cunm2l.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Apply the K elementary reflectors stored column-wise in A, with
*     scalar factors TAU, to the M-by-N matrix C from the left or the
*     right, one reflector per CLARF call.  The pivot entry of each
*     reflector column is temporarily replaced by ONE and restored
*     after the call.
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            INFO, K, LDA, LDC, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( LDC, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE
      parameter( one = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            FORWARD, LEFT, NOTRAN
      INTEGER            IREFL, ISTART, ISTEP, ISTOP, KROW, NCOLS,
     $                   NQ, NROWS
      COMPLEX            SAVED, TAUI
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarf, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max
*     ..
*     .. Executable Statements ..
*
*     Decode the option characters.
*
      info = 0
      left = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
*
*     NQ, the order of Q, is M when applying from the left, else N.
*
      nq = n
      IF( left ) nq = m
*
*     Validate the arguments; the first violation found sets INFO.
*
      IF( .NOT.( left .OR. lsame( side, 'R' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( notran .OR. lsame( trans, 'C' ) ) ) THEN
         info = -2
      ELSE IF( m.LT.0 ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( .NOT.( k.GE.0 .AND. k.LE.nq ) ) THEN
         info = -5
      ELSE IF( lda.LT.max( 1, nq ) ) THEN
         info = -7
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -10
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNM2L', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty C or an empty set of reflectors.
*
      IF( m.EQ.0 .OR. n.EQ.0 .OR. k.EQ.0 ) RETURN
*
*     Reflectors are visited in increasing order for (left, no
*     transpose) and (right, conjugate transpose), and in decreasing
*     order for the other two combinations.
*
      forward = left .EQV. notran
      IF( forward ) THEN
         istart = 1
         istop = k
         istep = 1
      ELSE
         istart = k
         istop = 1
         istep = -1
      END IF
*
*     Start from the full size of C; one of the two extents is
*     shrunk inside the loop depending on SIDE.
*
      nrows = m
      ncols = n
*
      DO irefl = istart, istop, istep
*
*        Row of A holding the pivot entry of reflector IREFL.
*
         krow = nq - k + irefl
         IF( left ) THEN
*
*           H(i) or H(i)**H is applied to C(1:m-k+i,1:n)
*
            nrows = m - k + irefl
         ELSE
*
*           H(i) or H(i)**H is applied to C(1:m,1:n-k+i)
*
            ncols = n - k + irefl
         END IF
*
*        Use TAU(i) for Q and its conjugate for Q**H.
*
         taui = tau( irefl )
         IF( .NOT.notran ) taui = conjg( taui )
*
*        Put ONE in the pivot position, apply, then restore A.
*
         saved = a( krow, irefl )
         a( krow, irefl ) = one
         CALL clarf( side, nrows, ncols, a( 1, irefl ), 1, taui, c,
     $               ldc, work )
         a( krow, irefl ) = saved
      END DO
      RETURN
*
*     End of CUNM2L
*

◆ cunm2r()

subroutine cunm2r	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	info )

CUNM2R multiplies a general matrix by the unitary matrix from a QR factorization determined by cgeqrf (unblocked algorithm).

Download CUNM2R + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNM2R overwrites the general complex m-by-n matrix C with
!>
!>       Q * C  if SIDE = 'L' and TRANS = 'N', or
!>
!>       Q**H* C  if SIDE = 'L' and TRANS = 'C', or
!>
!>       C * Q  if SIDE = 'R' and TRANS = 'N', or
!>
!>       C * Q**H if SIDE = 'R' and TRANS = 'C',
!>
!> where Q is a complex unitary matrix defined as the product of k
!> elementary reflectors
!>
!>       Q = H(1) H(2) . . . H(k)
!>
!> as returned by CGEQRF. Q is of order m if SIDE = 'L' and of order n
!> if SIDE = 'R'.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left !> = 'R': apply Q or Q**H from the Right !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': apply Q (No transpose) !> = 'C': apply Q**H (Conjugate transpose) !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines !> the matrix Q. !> If SIDE = 'L', M >= K >= 0; !> if SIDE = 'R', N >= K >= 0. !>
[in]	A	!> A is COMPLEX array, dimension (LDA,K) !> The i-th column must contain the vector which defines the !> elementary reflector H(i), for i = 1,2,...,k, as returned by !> CGEQRF in the first k columns of its array argument A. !> A is modified by the routine but restored on exit. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. !> If SIDE = 'L', LDA >= max(1,M); !> if SIDE = 'R', LDA >= max(1,N). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGEQRF. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the m-by-n matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension !> (N) if SIDE = 'L', !> (M) if SIDE = 'R' !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 157 of file cunm2r.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Unblocked driver: the K elementary reflectors held in the
*     columns of A are applied to C one at a time through CLARF.
*     An illegal argument is reported through XERBLA and INFO is
*     set to minus the position of that argument.
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            INFO, K, LDA, LDC, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( LDC, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CONE
      parameter( cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            FORWRD, LSIDE, NOTRAN
      INTEGER            COL0, IFIRST, ILAST, ISTEP, J, NCOLS, NROWS,
     $                   ORDQ, ROW0
      COMPLEX            DIAG, TAUJ
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarf, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max
*     ..
*     .. Executable Statements ..
*
*     Decode the option characters
*
      info = 0
      lside = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
*
*     ORDQ is the order of Q: M when Q acts from the left, else N
*
      ordq = n
      IF( lside ) ordq = m
*
*     Validate the arguments.  The tests run from the last argument
*     to the first so that the final assignment, i.e. the lowest
*     numbered offending argument, is the one that is reported.
*
      IF( ldc.LT.max( 1, m ) ) info = -10
      IF( lda.LT.max( 1, ordq ) ) info = -7
      IF( k.LT.0 .OR. k.GT.ordq ) info = -5
      IF( n.LT.0 ) info = -4
      IF( m.LT.0 ) info = -3
      IF( .NOT.notran .AND. .NOT.lsame( trans, 'C' ) ) info = -2
      IF( .NOT.lside .AND. .NOT.lsame( side, 'R' ) ) info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNM2R', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty C or an empty reflector set
*
      IF( m.EQ.0 .OR. n.EQ.0 .OR. k.EQ.0 ) RETURN
*
*     The reflectors are visited in increasing order exactly when
*     one (and only one) of "left side" and "no transpose" holds.
*
      forwrd = lside .NEQV. notran
      IF( forwrd ) THEN
         ifirst = 1
         ilast = k
         istep = 1
      ELSE
         ifirst = k
         ilast = 1
         istep = -1
      END IF
*
*     Start from the full matrix C; inside the loop only the
*     extent/offset along the side being multiplied is adjusted.
*
      nrows = m
      ncols = n
      row0 = 1
      col0 = 1
*
      DO j = ifirst, ilast, istep
         IF( lside ) THEN
*
*           The reflector acts on C(j:m,1:n)
*
            nrows = m - j + 1
            row0 = j
         ELSE
*
*           The reflector acts on C(1:m,j:n)
*
            ncols = n - j + 1
            col0 = j
         END IF
*
*        TAU(j) is conjugated when TRANS = 'C'
*
         tauj = tau( j )
         IF( .NOT.notran ) tauj = conjg( tauj )
*
*        Put a temporary unit entry on the diagonal of A so that
*        column j can be handed to CLARF as the reflector vector,
*        then restore the saved entry.
*
         diag = a( j, j )
         a( j, j ) = cone
         CALL clarf( side, nrows, ncols, a( j, j ), 1, tauj,
     $               c( row0, col0 ), ldc, work )
         a( j, j ) = diag
      END DO
      RETURN
*
*     End of CUNM2R
*

◆ cunmbr()

subroutine cunmbr	(	character	vect,
		character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNMBR

Download CUNMBR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> If VECT = 'Q', CUNMBR overwrites the general complex M-by-N matrix C
!> with
!>                 SIDE = 'L'     SIDE = 'R'
!> TRANS = 'N':      Q * C          C * Q
!> TRANS = 'C':      Q**H * C       C * Q**H
!>
!> If VECT = 'P', CUNMBR overwrites the general complex M-by-N matrix C
!> with
!>                 SIDE = 'L'     SIDE = 'R'
!> TRANS = 'N':      P * C          C * P
!> TRANS = 'C':      P**H * C       C * P**H
!>
!> Here Q and P**H are the unitary matrices determined by CGEBRD when
!> reducing a complex matrix A to bidiagonal form: A = Q * B * P**H. Q
!> and P**H are defined as products of elementary reflectors H(i) and
!> G(i) respectively.
!>
!> Let nq = m if SIDE = 'L' and nq = n if SIDE = 'R'. Thus nq is the
!> order of the unitary matrix Q or P**H that is applied.
!>
!> If VECT = 'Q', A is assumed to have been an NQ-by-K matrix:
!> if nq >= k, Q = H(1) H(2) . . . H(k);
!> if nq < k, Q = H(1) H(2) . . . H(nq-1).
!>
!> If VECT = 'P', A is assumed to have been a K-by-NQ matrix:
!> if k < nq, P = G(1) G(2) . . . G(k);
!> if k >= nq, P = G(1) G(2) . . . G(nq-1).
!>

Parameters

[in]	VECT	!> VECT is CHARACTER*1 !> = 'Q': apply Q or Q**H; !> = 'P': apply P or P**H. !>
[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q, Q**H, P or P**H from the Left; !> = 'R': apply Q, Q**H, P or P**H from the Right. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': No transpose, apply Q or P; !> = 'C': Conjugate transpose, apply Q**H or P**H. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	K	!> K is INTEGER !> If VECT = 'Q', the number of columns in the original !> matrix reduced by CGEBRD. !> If VECT = 'P', the number of rows in the original !> matrix reduced by CGEBRD. !> K >= 0. !>
[in]	A	!> A is COMPLEX array, dimension !> (LDA,min(nq,K)) if VECT = 'Q' !> (LDA,nq) if VECT = 'P' !> The vectors which define the elementary reflectors H(i) and !> G(i), whose products determine the matrices Q and P, as !> returned by CGEBRD. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. !> If VECT = 'Q', LDA >= max(1,nq); !> if VECT = 'P', LDA >= max(1,min(nq,K)). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (min(nq,K)) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i) or G(i) which determines Q or P, as returned !> by CGEBRD in the array argument TAUQ or TAUP. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q !> or P*C or P**H*C or C*P or C*P**H. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If SIDE = 'L', LWORK >= max(1,N); !> if SIDE = 'R', LWORK >= max(1,M); !> if N = 0 or M = 0, LWORK >= 1. !> For optimum performance LWORK >= max(1,N*NB) if SIDE = 'L', !> and LWORK >= max(1,M*NB) if SIDE = 'R', where NB is the !> optimal blocksize. (NB = 0 if M = 0 or N = 0.) !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 195 of file cunmbr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Dispatcher: after validating its arguments and computing the
*     optimal workspace size, this routine forwards the work to
*     CUNMQR (VECT = 'Q') or CUNMLQ (VECT = 'P'), either on the whole
*     of A and C or on the submatrices that skip the first row/column.
*     On a successful exit WORK( 1 ) holds the optimal LWORK, rounded
*     so that it is never smaller than the integer value LWKOPT.
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS, VECT
      INTEGER            INFO, K, LDA, LDC, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( LDC, * ), TAU( * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      LOGICAL            APPLYQ, LEFT, LQUERY, NOTRAN
      CHARACTER          TRANST
      INTEGER            I1, I2, IINFO, LWKOPT, MI, NB, NI, NQ, NW
      REAL               RWKOPT
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      EXTERNAL           ilaenv, lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cunmlq, cunmqr, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          epsilon, int, max, min, real
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      info = 0
      applyq = lsame( vect, 'Q' )
      left = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
      lquery = ( lwork.EQ.-1 )
*
*     NQ is the order of Q or P and NW is the minimum dimension of WORK
*
      IF( left ) THEN
         nq = m
         nw = max( 1, n )
      ELSE
         nq = n
         nw = max( 1, m )
      END IF
      IF( .NOT.applyq .AND. .NOT.lsame( vect, 'P' ) ) THEN
         info = -1
      ELSE IF( .NOT.left .AND. .NOT.lsame( side, 'R' ) ) THEN
         info = -2
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'C' ) ) THEN
         info = -3
      ELSE IF( m.LT.0 ) THEN
         info = -4
      ELSE IF( n.LT.0 ) THEN
         info = -5
      ELSE IF( k.LT.0 ) THEN
         info = -6
      ELSE IF( ( applyq .AND. lda.LT.max( 1, nq ) ) .OR.
     $         ( .NOT.applyq .AND. lda.LT.max( 1, min( nq, k ) ) ) )
     $          THEN
         info = -8
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -11
      ELSE IF( lwork.LT.nw .AND. .NOT.lquery ) THEN
         info = -13
      END IF
*
*     Optimal workspace: NW times the block size suggested by ILAENV
*     for the routine that will actually be called (1 if C is empty)
*
      IF( info.EQ.0 ) THEN
         IF( m.GT.0 .AND. n.GT.0 ) THEN
            IF( applyq ) THEN
               IF( left ) THEN
                  nb = ilaenv( 1, 'CUNMQR', side // trans, m-1, n, m-1,
     $                         -1 )
               ELSE
                  nb = ilaenv( 1, 'CUNMQR', side // trans, m, n-1, n-1,
     $                         -1 )
               END IF
            ELSE
               IF( left ) THEN
                  nb = ilaenv( 1, 'CUNMLQ', side // trans, m-1, n, m-1,
     $                         -1 )
               ELSE
                  nb = ilaenv( 1, 'CUNMLQ', side // trans, m, n-1, n-1,
     $                         -1 )
               END IF
            END IF
            lwkopt = nw*nb
         ELSE
            lwkopt = 1
         END IF
*
*        WORK( 1 ) is single precision, so a plain INTEGER to REAL
*        conversion can round a large LWKOPT downward and make a
*        workspace query under-report the size.  Nudge the converted
*        value upward whenever it falls below LWKOPT.
*
         rwkopt = real( lwkopt )
         IF( int( rwkopt ).LT.lwkopt )
     $      rwkopt = rwkopt*( 1.0e+0+epsilon( 0.0e+0 ) )
         work( 1 ) = rwkopt
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNMBR', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.EQ.0 .OR. n.EQ.0 )
     $   RETURN
*
      IF( applyq ) THEN
*
*        Apply Q
*
         IF( nq.GE.k ) THEN
*
*           Q was determined by a call to CGEBRD with nq >= k
*
            CALL cunmqr( side, trans, m, n, k, a, lda, tau, c, ldc,
     $                   work, lwork, iinfo )
         ELSE IF( nq.GT.1 ) THEN
*
*           Q was determined by a call to CGEBRD with nq < k.
*           Only nq-1 reflectors are applied, starting at A(2,1),
*           to C without its first row (left) or column (right).
*
            IF( left ) THEN
               mi = m - 1
               ni = n
               i1 = 2
               i2 = 1
            ELSE
               mi = m
               ni = n - 1
               i1 = 1
               i2 = 2
            END IF
            CALL cunmqr( side, trans, mi, ni, nq-1, a( 2, 1 ), lda, tau,
     $                   c( i1, i2 ), ldc, work, lwork, iinfo )
         END IF
      ELSE
*
*        Apply P.  CUNMLQ is called with TRANST, the opposite of
*        the TRANS option that was requested.
*
         IF( notran ) THEN
            transt = 'C'
         ELSE
            transt = 'N'
         END IF
         IF( nq.GT.k ) THEN
*
*           P was determined by a call to CGEBRD with nq > k
*
            CALL cunmlq( side, transt, m, n, k, a, lda, tau, c, ldc,
     $                   work, lwork, iinfo )
         ELSE IF( nq.GT.1 ) THEN
*
*           P was determined by a call to CGEBRD with nq <= k.
*           Only nq-1 reflectors are applied, starting at A(1,2),
*           to C without its first row (left) or column (right).
*
            IF( left ) THEN
               mi = m - 1
               ni = n
               i1 = 2
               i2 = 1
            ELSE
               mi = m
               ni = n - 1
               i1 = 1
               i2 = 2
            END IF
            CALL cunmlq( side, transt, mi, ni, nq-1, a( 1, 2 ), lda,
     $                   tau, c( i1, i2 ), ldc, work, lwork, iinfo )
         END IF
      END IF
*
*     The callee used WORK as scratch; restore the size report
*
      work( 1 ) = rwkopt
      RETURN
*
*     End of CUNMBR
*

◆ cunmhr()

subroutine cunmhr	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	ilo,
		integer	ihi,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNMHR

Download CUNMHR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNMHR overwrites the general complex M-by-N matrix C with
!>
!>                 SIDE = 'L'     SIDE = 'R'
!> TRANS = 'N':      Q * C          C * Q
!> TRANS = 'C':      Q**H * C       C * Q**H
!>
!> where Q is a complex unitary matrix of order nq, with nq = m if
!> SIDE = 'L' and nq = n if SIDE = 'R'. Q is defined as the product of
!> IHI-ILO elementary reflectors, as returned by CGEHRD:
!>
!> Q = H(ilo) H(ilo+1) . . . H(ihi-1).
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left; !> = 'R': apply Q or Q**H from the Right. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': apply Q (No transpose) !> = 'C': apply Q**H (Conjugate transpose) !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	ILO	!> ILO is INTEGER !>
[in]	IHI	!> IHI is INTEGER !> !> ILO and IHI must have the same values as in the previous call !> of CGEHRD. Q is equal to the unit matrix except in the !> submatrix Q(ilo+1:ihi,ilo+1:ihi). !> If SIDE = 'L', then 1 <= ILO <= IHI <= M, if M > 0, and !> ILO = 1 and IHI = 0, if M = 0; !> if SIDE = 'R', then 1 <= ILO <= IHI <= N, if N > 0, and !> ILO = 1 and IHI = 0, if N = 0. !>
[in]	A	!> A is COMPLEX array, dimension !> (LDA,M) if SIDE = 'L' !> (LDA,N) if SIDE = 'R' !> The vectors which define the elementary reflectors, as !> returned by CGEHRD. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. !> LDA >= max(1,M) if SIDE = 'L'; LDA >= max(1,N) if SIDE = 'R'. !>
[in]	TAU	!> TAU is COMPLEX array, dimension !> (M-1) if SIDE = 'L' !> (N-1) if SIDE = 'R' !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGEHRD. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If SIDE = 'L', LWORK >= max(1,N); !> if SIDE = 'R', LWORK >= max(1,M). !> For optimum performance LWORK >= N*NB if SIDE = 'L', and !> LWORK >= M*NB if SIDE = 'R', where NB is the optimal !> blocksize. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 177 of file cunmhr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Thin wrapper around CUNMQR: the NH = IHI-ILO reflectors that
*     start at A(ILO+1,ILO) / TAU(ILO) are applied to the rows
*     (SIDE = 'L') or columns (SIDE = 'R') ILO+1 onward of C.
*     On a successful exit WORK( 1 ) holds the optimal LWORK, rounded
*     so that it is never smaller than the integer value LWKOPT.
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            IHI, ILO, INFO, LDA, LDC, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( LDC, * ), TAU( * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      LOGICAL            LEFT, LQUERY
      INTEGER            I1, I2, IINFO, LWKOPT, MI, NB, NH, NI, NQ, NW
      REAL               RWKOPT
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      EXTERNAL           ilaenv, lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cunmqr, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          epsilon, int, max, min, real
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      info = 0
      nh = ihi - ilo
      left = lsame( side, 'L' )
      lquery = ( lwork.EQ.-1 )
*
*     NQ is the order of Q and NW is the minimum dimension of WORK
*
      IF( left ) THEN
         nq = m
         nw = max( 1, n )
      ELSE
         nq = n
         nw = max( 1, m )
      END IF
      IF( .NOT.left .AND. .NOT.lsame( side, 'R' ) ) THEN
         info = -1
      ELSE IF( .NOT.lsame( trans, 'N' ) .AND. .NOT.lsame( trans, 'C' ) )
     $          THEN
         info = -2
      ELSE IF( m.LT.0 ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( ilo.LT.1 .OR. ilo.GT.max( 1, nq ) ) THEN
         info = -5
      ELSE IF( ihi.LT.min( ilo, nq ) .OR. ihi.GT.nq ) THEN
         info = -6
      ELSE IF( lda.LT.max( 1, nq ) ) THEN
         info = -8
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -11
      ELSE IF( lwork.LT.nw .AND. .NOT.lquery ) THEN
         info = -13
      END IF
*
*     Optimal workspace: NW times the CUNMQR block size from ILAENV
*
      IF( info.EQ.0 ) THEN
         IF( left ) THEN
            nb = ilaenv( 1, 'CUNMQR', side // trans, nh, n, nh, -1 )
         ELSE
            nb = ilaenv( 1, 'CUNMQR', side // trans, m, nh, nh, -1 )
         END IF
         lwkopt = nw*nb
*
*        WORK( 1 ) is single precision, so a plain INTEGER to REAL
*        conversion can round a large LWKOPT downward and make a
*        workspace query under-report the size.  Nudge the converted
*        value upward whenever it falls below LWKOPT.
*
         rwkopt = real( lwkopt )
         IF( int( rwkopt ).LT.lwkopt )
     $      rwkopt = rwkopt*( 1.0e+0+epsilon( 0.0e+0 ) )
         work( 1 ) = rwkopt
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNMHR', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.EQ.0 .OR. n.EQ.0 .OR. nh.EQ.0 ) THEN
         work( 1 ) = 1
         RETURN
      END IF
*
*     Select the part of C that the NH reflectors act on
*
      IF( left ) THEN
         mi = nh
         ni = n
         i1 = ilo + 1
         i2 = 1
      ELSE
         mi = m
         ni = nh
         i1 = 1
         i2 = ilo + 1
      END IF
*
      CALL cunmqr( side, trans, mi, ni, nh, a( ilo+1, ilo ), lda,
     $             tau( ilo ), c( i1, i2 ), ldc, work, lwork, iinfo )
*
*     CUNMQR used WORK as scratch; restore the size report
*
      work( 1 ) = rwkopt
      RETURN
*
*     End of CUNMHR
*

◆ cunml2()

subroutine cunml2	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	info )

CUNML2 multiplies a general matrix by the unitary matrix from a LQ factorization determined by cgelqf (unblocked algorithm).

Download CUNML2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNML2 overwrites the general complex m-by-n matrix C with
!>
!>       Q * C  if SIDE = 'L' and TRANS = 'N', or
!>
!>       Q**H* C  if SIDE = 'L' and TRANS = 'C', or
!>
!>       C * Q  if SIDE = 'R' and TRANS = 'N', or
!>
!>       C * Q**H if SIDE = 'R' and TRANS = 'C',
!>
!> where Q is a complex unitary matrix defined as the product of k
!> elementary reflectors
!>
!>       Q = H(k)**H . . . H(2)**H H(1)**H
!>
!> as returned by CGELQF. Q is of order m if SIDE = 'L' and of order n
!> if SIDE = 'R'.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left !> = 'R': apply Q or Q**H from the Right !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': apply Q (No transpose) !> = 'C': apply Q**H (Conjugate transpose) !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines !> the matrix Q. !> If SIDE = 'L', M >= K >= 0; !> if SIDE = 'R', N >= K >= 0. !>
[in]	A	!> A is COMPLEX array, dimension !> (LDA,M) if SIDE = 'L', !> (LDA,N) if SIDE = 'R' !> The i-th row must contain the vector which defines the !> elementary reflector H(i), for i = 1,2,...,k, as returned by !> CGELQF in the first k rows of its array argument A. !> A is modified by the routine but restored on exit. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,K). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGELQF. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the m-by-n matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension !> (N) if SIDE = 'L', !> (M) if SIDE = 'R' !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 157 of file cunml2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Unblocked driver: the K elementary reflectors held in the
*     rows of A are applied to C one at a time through CLARF.
*     An illegal argument is reported through XERBLA and INFO is
*     set to minus the position of that argument.
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            INFO, K, LDA, LDC, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( LDC, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CONE
      parameter( cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            FORWRD, LSIDE, NOTRAN, TAIL
      INTEGER            COL0, IFIRST, ILAST, ISTEP, J, NCOLS, NROWS,
     $                   ORDQ, ROW0
      COMPLEX            DIAG, TAUJ
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           clacgv, clarf, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max
*     ..
*     .. Executable Statements ..
*
*     Decode the option characters
*
      info = 0
      lside = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
*
*     ORDQ is the order of Q: M when Q acts from the left, else N
*
      ordq = n
      IF( lside ) ordq = m
*
*     Validate the arguments.  The tests run from the last argument
*     to the first so that the final assignment, i.e. the lowest
*     numbered offending argument, is the one that is reported.
*
      IF( ldc.LT.max( 1, m ) ) info = -10
      IF( lda.LT.max( 1, k ) ) info = -7
      IF( k.LT.0 .OR. k.GT.ordq ) info = -5
      IF( n.LT.0 ) info = -4
      IF( m.LT.0 ) info = -3
      IF( .NOT.notran .AND. .NOT.lsame( trans, 'C' ) ) info = -2
      IF( .NOT.lside .AND. .NOT.lsame( side, 'R' ) ) info = -1
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNML2', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty C or an empty reflector set
*
      IF( m.EQ.0 .OR. n.EQ.0 .OR. k.EQ.0 ) RETURN
*
*     The reflectors are visited in increasing order exactly when
*     "left side" and "no transpose" are both true or both false.
*
      forwrd = lside .EQV. notran
      IF( forwrd ) THEN
         ifirst = 1
         ilast = k
         istep = 1
      ELSE
         ifirst = k
         ilast = 1
         istep = -1
      END IF
*
*     Start from the full matrix C; inside the loop only the
*     extent/offset along the side being multiplied is adjusted.
*
      nrows = m
      ncols = n
      row0 = 1
      col0 = 1
*
      DO j = ifirst, ilast, istep
         IF( lside ) THEN
*
*           The reflector acts on C(j:m,1:n)
*
            nrows = m - j + 1
            row0 = j
         ELSE
*
*           The reflector acts on C(1:m,j:n)
*
            ncols = n - j + 1
            col0 = j
         END IF
*
*        TAU(j) is conjugated when TRANS = 'N'
*
         tauj = tau( j )
         IF( notran ) tauj = conjg( tauj )
*
*        Row j of A right of the diagonal is passed through CLACGV
*        before the CLARF call and again afterwards, and the
*        diagonal entry is temporarily replaced by one, so A is
*        modified here and put back before the next iteration.
*
         tail = j.LT.ordq
         IF( tail ) CALL clacgv( ordq-j, a( j, j+1 ), lda )
         diag = a( j, j )
         a( j, j ) = cone
         CALL clarf( side, nrows, ncols, a( j, j ), lda, tauj,
     $               c( row0, col0 ), ldc, work )
         a( j, j ) = diag
         IF( tail ) CALL clacgv( ordq-j, a( j, j+1 ), lda )
      END DO
      RETURN
*
*     End of CUNML2
*

◆ cunmlq()

subroutine cunmlq	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNMLQ

Download CUNMLQ + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNMLQ overwrites the general complex M-by-N matrix C with
!>
!>                 SIDE = 'L'     SIDE = 'R'
!> TRANS = 'N':      Q * C          C * Q
!> TRANS = 'C':      Q**H * C       C * Q**H
!>
!> where Q is a complex unitary matrix defined as the product of k
!> elementary reflectors
!>
!>       Q = H(k)**H . . . H(2)**H H(1)**H
!>
!> as returned by CGELQF. Q is of order M if SIDE = 'L' and of order N
!> if SIDE = 'R'.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left; !> = 'R': apply Q or Q**H from the Right. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': No transpose, apply Q; !> = 'C': Conjugate transpose, apply Q**H. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines !> the matrix Q. !> If SIDE = 'L', M >= K >= 0; !> if SIDE = 'R', N >= K >= 0. !>
[in]	A	!> A is COMPLEX array, dimension !> (LDA,M) if SIDE = 'L', !> (LDA,N) if SIDE = 'R' !> The i-th row must contain the vector which defines the !> elementary reflector H(i), for i = 1,2,...,k, as returned by !> CGELQF in the first k rows of its array argument A. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,K). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGELQF. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If SIDE = 'L', LWORK >= max(1,N); !> if SIDE = 'R', LWORK >= max(1,M). !> For good performance, LWORK should generally be larger. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 166 of file cunmlq.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Blocked driver: reflectors are grouped NB at a time, the
*     triangular factor of each group is built by CLARFT in the tail
*     of WORK (from index IWT, TSIZE entries), and the group is
*     applied by CLARFB.  When the block size is too small or not
*     smaller than K the unblocked routine CUNML2 is used instead.
*     On a successful exit WORK( 1 ) holds the optimal LWORK, rounded
*     so that it is never smaller than the integer value LWKOPT.
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            INFO, K, LDA, LDC, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( LDC, * ), TAU( * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            NBMAX, LDT, TSIZE
      parameter( nbmax = 64, ldt = nbmax+1,
     $                     tsize = ldt*nbmax )
*     ..
*     .. Local Scalars ..
      LOGICAL            LEFT, LQUERY, NOTRAN
      CHARACTER          TRANST
      INTEGER            I, I1, I2, I3, IB, IC, IINFO, IWT, JC, LDWORK,
     $                   LWKOPT, MI, NB, NBMIN, NI, NQ, NW
      REAL               RWKOPT
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      EXTERNAL           lsame, ilaenv
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarfb, clarft, cunml2, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          epsilon, int, max, min, real
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      info = 0
      left = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
      lquery = ( lwork.EQ.-1 )
*
*     NQ is the order of Q and NW is the minimum dimension of WORK
*
      IF( left ) THEN
         nq = m
         nw = max( 1, n )
      ELSE
         nq = n
         nw = max( 1, m )
      END IF
      IF( .NOT.left .AND. .NOT.lsame( side, 'R' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'C' ) ) THEN
         info = -2
      ELSE IF( m.LT.0 ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( k.LT.0 .OR. k.GT.nq ) THEN
         info = -5
      ELSE IF( lda.LT.max( 1, k ) ) THEN
         info = -7
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -10
      ELSE IF( lwork.LT.nw .AND. .NOT.lquery ) THEN
         info = -12
      END IF
*
      IF( info.EQ.0 ) THEN
*
*        Compute the workspace requirements
*
         IF( m.EQ.0 .OR. n.EQ.0 .OR. k.EQ.0 ) THEN
            lwkopt = 1
         ELSE
            nb = min( nbmax, ilaenv( 1, 'CUNMLQ', side // trans, m, n,
     $                               k, -1 ) )
            lwkopt = nw*nb + tsize
         END IF
*
*        WORK( 1 ) is single precision, so a plain INTEGER to REAL
*        conversion can round a large LWKOPT downward and make a
*        workspace query under-report the size.  Nudge the converted
*        value upward whenever it falls below LWKOPT.
*
         rwkopt = real( lwkopt )
         IF( int( rwkopt ).LT.lwkopt )
     $      rwkopt = rwkopt*( 1.0e+0+epsilon( 0.0e+0 ) )
         work( 1 ) = rwkopt
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNMLQ', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.EQ.0 .OR. n.EQ.0 .OR. k.EQ.0 ) THEN
         RETURN
      END IF
*
*     Determine the block size.  If the caller supplied less than
*     the optimal workspace, shrink NB to what fits after reserving
*     TSIZE entries for the triangular factor.
*
      nbmin = 2
      ldwork = nw
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
         IF( lwork.LT.lwkopt ) THEN
            nb = (lwork-tsize) / ldwork
            nbmin = max( 2, ilaenv( 2, 'CUNMLQ', side // trans, m, n, k,
     $              -1 ) )
         END IF
      END IF
*
      IF( nb.LT.nbmin .OR. nb.GE.k ) THEN
*
*        Use unblocked code
*
         CALL cunml2( side, trans, m, n, k, a, lda, tau, c, ldc, work,
     $                iinfo )
      ELSE
*
*        Use blocked code.  WORK( 1:NW*NB ) is scratch for CLARFB
*        and WORK( IWT: ) stores the triangular factor.
*
         iwt = 1 + nw*nb
         IF( ( left .AND. notran ) .OR.
     $       ( .NOT.left .AND. .NOT.notran ) ) THEN
            i1 = 1
            i2 = k
            i3 = nb
         ELSE
            i1 = ( ( k-1 ) / nb )*nb + 1
            i2 = 1
            i3 = -nb
         END IF
*
         IF( left ) THEN
            ni = n
            jc = 1
         ELSE
            mi = m
            ic = 1
         END IF
*
*        CLARFB is called with TRANST, the opposite of TRANS
*
         IF( notran ) THEN
            transt = 'C'
         ELSE
            transt = 'N'
         END IF
*
         DO 10 i = i1, i2, i3
            ib = min( nb, k-i+1 )
*
*           Form the triangular factor of the block reflector
*           H = H(i) H(i+1) . . . H(i+ib-1)
*
            CALL clarft( 'Forward', 'Rowwise', nq-i+1, ib, a( i, i ),
     $                   lda, tau( i ), work( iwt ), ldt )
            IF( left ) THEN
*
*              H or H**H is applied to C(i:m,1:n)
*
               mi = m - i + 1
               ic = i
            ELSE
*
*              H or H**H is applied to C(1:m,i:n)
*
               ni = n - i + 1
               jc = i
            END IF
*
*           Apply H or H**H
*
            CALL clarfb( side, transt, 'Forward', 'Rowwise', mi, ni, ib,
     $                   a( i, i ), lda, work( iwt ), ldt,
     $                   c( ic, jc ), ldc, work, ldwork )
   10    CONTINUE
      END IF
*
*     WORK was used as scratch above; restore the size report
*
      work( 1 ) = rwkopt
      RETURN
*
*     End of CUNMLQ
*

◆ cunmql()

subroutine cunmql	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNMQL

Download CUNMQL + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNMQL overwrites the general complex M-by-N matrix C with
!>
!>                 SIDE = 'L'     SIDE = 'R'
!> TRANS = 'N':      Q * C          C * Q
!> TRANS = 'C':      Q**H * C       C * Q**H
!>
!> where Q is a complex unitary matrix defined as the product of k
!> elementary reflectors
!>
!>       Q = H(k) . . . H(2) H(1)
!>
!> as returned by CGEQLF. Q is of order M if SIDE = 'L' and of order N
!> if SIDE = 'R'.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left; !> = 'R': apply Q or Q**H from the Right. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': No transpose, apply Q; !> = 'C': Conjugate transpose, apply Q**H. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines !> the matrix Q. !> If SIDE = 'L', M >= K >= 0; !> if SIDE = 'R', N >= K >= 0. !>
[in]	A	!> A is COMPLEX array, dimension (LDA,K) !> The i-th column must contain the vector which defines the !> elementary reflector H(i), for i = 1,2,...,k, as returned by !> CGEQLF in the last k columns of its array argument A. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. !> If SIDE = 'L', LDA >= max(1,M); !> if SIDE = 'R', LDA >= max(1,N). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGEQLF. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If SIDE = 'L', LWORK >= max(1,N); !> if SIDE = 'R', LWORK >= max(1,M). !> For good performance, LWORK should generally be larger. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 166 of file cunmql.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            INFO, K, LDA, LDC, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( LDC, * ), TAU( * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     Outline: validate the arguments, answer a workspace query
*     (LWORK = -1) through WORK( 1 ), then apply the K reflectors to C
*     either one at a time (CUNM2L) or in blocks of NB reflectors
*     (CLARFT builds the triangular factor, CLARFB applies the block).
*
*     .. Parameters ..
*     NBMAX caps the block size.  The triangular factor of each block
*     reflector is stored at WORK( IWT ) with leading dimension LDT,
*     so TSIZE entries are reserved for it after the NW*NB entries
*     passed to CLARFB as its work array.
      INTEGER            NBMAX, LDT, TSIZE
      parameter( nbmax = 64, ldt = nbmax+1,
     $                     tsize = ldt*nbmax )
*     ..
*     .. Local Scalars ..
      LOGICAL            LEFT, LQUERY, NOTRAN
      INTEGER            I, I1, I2, I3, IB, IINFO, IWT, LDWORK, LWKOPT,
     $                   MI, NB, NBMIN, NI, NQ, NW
      REAL               RWKOPT
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      EXTERNAL           lsame, ilaenv
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarfb, clarft, cunm2l, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          epsilon, int, max, min, real
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      info = 0
      left = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
      lquery = ( lwork.EQ.-1 )
*
*     NQ is the order of Q and NW is the minimum dimension of WORK
*
      IF( left ) THEN
         nq = m
         nw = max( 1, n )
      ELSE
         nq = n
         nw = max( 1, m )
      END IF
      IF( .NOT.left .AND. .NOT.lsame( side, 'R' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'C' ) ) THEN
         info = -2
      ELSE IF( m.LT.0 ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( k.LT.0 .OR. k.GT.nq ) THEN
         info = -5
      ELSE IF( lda.LT.max( 1, nq ) ) THEN
         info = -7
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -10
      ELSE IF( lwork.LT.nw .AND. .NOT.lquery ) THEN
         info = -12
      END IF
*
      IF( info.EQ.0 ) THEN
*
*        Compute the workspace requirements
*
         IF( m.EQ.0 .OR. n.EQ.0 ) THEN
            lwkopt = 1
         ELSE
            nb = min( nbmax, ilaenv( 1, 'CUNMQL', side // trans, m, n,
     $                               k, -1 ) )
            lwkopt = nw*nb + tsize
         END IF
*
*        WORK is single precision, so a large LWKOPT (above 2**24 for
*        IEEE single) may not be exactly representable and could be
*        rounded downward.  Nudge the converted value upward so that
*        a caller truncating WORK( 1 ) never gets less than LWKOPT.
*
         rwkopt = real( lwkopt )
         IF( int( rwkopt ).LT.lwkopt )
     $      rwkopt = rwkopt*( 1.0e+0+epsilon( 0.0e+0 ) )
         work( 1 ) = rwkopt
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNMQL', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.EQ.0 .OR. n.EQ.0 ) THEN
         RETURN
      END IF
*
*     Determine the block size.  When the caller supplied less than
*     the optimal workspace, shrink NB to what fits after reserving
*     TSIZE entries for the triangular factor.
*
      nbmin = 2
      ldwork = nw
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
         IF( lwork.LT.lwkopt ) THEN
            nb = (lwork-tsize) / ldwork
            nbmin = max( 2, ilaenv( 2, 'CUNMQL', side // trans, m, n, k,
     $              -1 ) )
         END IF
      END IF
*
      IF( nb.LT.nbmin .OR. nb.GE.k ) THEN
*
*        Use unblocked code
*
         CALL cunm2l( side, trans, m, n, k, a, lda, tau, c, ldc, work,
     $                iinfo )
      ELSE
*
*        Use blocked code
*
*        IWT is where the triangular factor lives inside WORK
*
         iwt = 1 + nw*nb
*
*        Choose the direction in which the blocks are visited
*
         IF( ( left .AND. notran ) .OR.
     $       ( .NOT.left .AND. .NOT.notran ) ) THEN
            i1 = 1
            i2 = k
            i3 = nb
         ELSE
            i1 = ( ( k-1 ) / nb )*nb + 1
            i2 = 1
            i3 = -nb
         END IF
*
*        The dimension of C not touched by the block size is fixed
*
         IF( left ) THEN
            ni = n
         ELSE
            mi = m
         END IF
*
         DO 10 i = i1, i2, i3
            ib = min( nb, k-i+1 )
*
*           Form the triangular factor of the block reflector
*           H = H(i+ib-1) . . . H(i+1) H(i)
*
            CALL clarft( 'Backward', 'Columnwise', nq-k+i+ib-1, ib,
     $                   a( 1, i ), lda, tau( i ), work( iwt ), ldt )
            IF( left ) THEN
*
*              H or H**H is applied to C(1:m-k+i+ib-1,1:n)
*
               mi = m - k + i + ib - 1
            ELSE
*
*              H or H**H is applied to C(1:m,1:n-k+i+ib-1)
*
               ni = n - k + i + ib - 1
            END IF
*
*           Apply H or H**H
*
            CALL clarfb( side, trans, 'Backward', 'Columnwise', mi, ni,
     $                   ib, a( 1, i ), lda, work( iwt ), ldt, c, ldc,
     $                   work, ldwork )
   10    CONTINUE
      END IF
*
*     Report the optimal workspace size (rounded up as above)
*
      work( 1 ) = rwkopt
      RETURN
*
*     End of CUNMQL
*

◆ cunmqr()

subroutine cunmqr	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNMQR

Download CUNMQR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNMQR overwrites the general complex M-by-N matrix C with
!>
!>                 SIDE = 'L'     SIDE = 'R'
!> TRANS = 'N':      Q * C          C * Q
!> TRANS = 'C':      Q**H * C       C * Q**H
!>
!> where Q is a complex unitary matrix defined as the product of k
!> elementary reflectors
!>
!>       Q = H(1) H(2) . . . H(k)
!>
!> as returned by CGEQRF. Q is of order M if SIDE = 'L' and of order N
!> if SIDE = 'R'.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left; !> = 'R': apply Q or Q**H from the Right. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': No transpose, apply Q; !> = 'C': Conjugate transpose, apply Q**H. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines !> the matrix Q. !> If SIDE = 'L', M >= K >= 0; !> if SIDE = 'R', N >= K >= 0. !>
[in]	A	!> A is COMPLEX array, dimension (LDA,K) !> The i-th column must contain the vector which defines the !> elementary reflector H(i), for i = 1,2,...,k, as returned by !> CGEQRF in the first k columns of its array argument A. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. !> If SIDE = 'L', LDA >= max(1,M); !> if SIDE = 'R', LDA >= max(1,N). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGEQRF. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If SIDE = 'L', LWORK >= max(1,N); !> if SIDE = 'R', LWORK >= max(1,M). !> For good performance, LWORK should generally be larger. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 166 of file cunmqr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            INFO, K, LDA, LDC, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( LDC, * ), TAU( * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     Outline: validate the arguments, answer a workspace query
*     (LWORK = -1) through WORK( 1 ), then apply the K reflectors to C
*     either one at a time (CUNM2R) or in blocks of NB reflectors
*     (CLARFT builds the triangular factor, CLARFB applies the block).
*
*     .. Parameters ..
*     NBMAX caps the block size.  The triangular factor of each block
*     reflector is stored at WORK( IWT ) with leading dimension LDT,
*     so TSIZE entries are reserved for it after the NW*NB entries
*     passed to CLARFB as its work array.
      INTEGER            NBMAX, LDT, TSIZE
      parameter( nbmax = 64, ldt = nbmax+1,
     $                     tsize = ldt*nbmax )
*     ..
*     .. Local Scalars ..
      LOGICAL            LEFT, LQUERY, NOTRAN
      INTEGER            I, I1, I2, I3, IB, IC, IINFO, IWT, JC, LDWORK,
     $                   LWKOPT, MI, NB, NBMIN, NI, NQ, NW
      REAL               RWKOPT
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      EXTERNAL           lsame, ilaenv
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarfb, clarft, cunm2r, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          epsilon, int, max, min, real
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      info = 0
      left = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
      lquery = ( lwork.EQ.-1 )
*
*     NQ is the order of Q and NW is the minimum dimension of WORK
*
      IF( left ) THEN
         nq = m
         nw = max( 1, n )
      ELSE
         nq = n
         nw = max( 1, m )
      END IF
      IF( .NOT.left .AND. .NOT.lsame( side, 'R' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'C' ) ) THEN
         info = -2
      ELSE IF( m.LT.0 ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( k.LT.0 .OR. k.GT.nq ) THEN
         info = -5
      ELSE IF( lda.LT.max( 1, nq ) ) THEN
         info = -7
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -10
      ELSE IF( lwork.LT.nw .AND. .NOT.lquery ) THEN
         info = -12
      END IF
*
      IF( info.EQ.0 ) THEN
*
*        Compute the workspace requirements
*
         nb = min( nbmax, ilaenv( 1, 'CUNMQR', side // trans, m, n, k,
     $        -1 ) )
         lwkopt = nw*nb + tsize
*
*        WORK is single precision, so a large LWKOPT (above 2**24 for
*        IEEE single) may not be exactly representable and could be
*        rounded downward.  Nudge the converted value upward so that
*        a caller truncating WORK( 1 ) never gets less than LWKOPT.
*
         rwkopt = real( lwkopt )
         IF( int( rwkopt ).LT.lwkopt )
     $      rwkopt = rwkopt*( 1.0e+0+epsilon( 0.0e+0 ) )
         work( 1 ) = rwkopt
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNMQR', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.EQ.0 .OR. n.EQ.0 .OR. k.EQ.0 ) THEN
         work( 1 ) = 1
         RETURN
      END IF
*
*     Determine the block size.  When the caller supplied less than
*     the optimal workspace, shrink NB to what fits after reserving
*     TSIZE entries for the triangular factor.
*
      nbmin = 2
      ldwork = nw
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
         IF( lwork.LT.lwkopt ) THEN
            nb = (lwork-tsize) / ldwork
            nbmin = max( 2, ilaenv( 2, 'CUNMQR', side // trans, m, n, k,
     $              -1 ) )
         END IF
      END IF
*
      IF( nb.LT.nbmin .OR. nb.GE.k ) THEN
*
*        Use unblocked code
*
         CALL cunm2r( side, trans, m, n, k, a, lda, tau, c, ldc, work,
     $                iinfo )
      ELSE
*
*        Use blocked code
*
*        IWT is where the triangular factor lives inside WORK
*
         iwt = 1 + nw*nb
*
*        Choose the direction in which the blocks are visited
*
         IF( ( left .AND. .NOT.notran ) .OR.
     $       ( .NOT.left .AND. notran ) ) THEN
            i1 = 1
            i2 = k
            i3 = nb
         ELSE
            i1 = ( ( k-1 ) / nb )*nb + 1
            i2 = 1
            i3 = -nb
         END IF
*
*        The dimension of C not touched by the block offset is fixed
*
         IF( left ) THEN
            ni = n
            jc = 1
         ELSE
            mi = m
            ic = 1
         END IF
*
         DO 10 i = i1, i2, i3
            ib = min( nb, k-i+1 )
*
*           Form the triangular factor of the block reflector
*           H = H(i) H(i+1) . . . H(i+ib-1)
*
            CALL clarft( 'Forward', 'Columnwise', nq-i+1, ib, a( i, i ),
     $                   lda, tau( i ), work( iwt ), ldt )
            IF( left ) THEN
*
*              H or H**H is applied to C(i:m,1:n)
*
               mi = m - i + 1
               ic = i
            ELSE
*
*              H or H**H is applied to C(1:m,i:n)
*
               ni = n - i + 1
               jc = i
            END IF
*
*           Apply H or H**H
*
            CALL clarfb( side, trans, 'Forward', 'Columnwise', mi, ni,
     $                   ib, a( i, i ), lda, work( iwt ), ldt,
     $                   c( ic, jc ), ldc, work, ldwork )
   10    CONTINUE
      END IF
*
*     Report the optimal workspace size (rounded up as above)
*
      work( 1 ) = rwkopt
      RETURN
*
*     End of CUNMQR
*

◆ cunmr2()

subroutine cunmr2	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	info )

CUNMR2 multiplies a general matrix by the unitary matrix from a RQ factorization determined by cgerqf (unblocked algorithm).

Download CUNMR2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNMR2 overwrites the general complex m-by-n matrix C with
!>
!>       Q * C  if SIDE = 'L' and TRANS = 'N', or
!>
!>       Q**H* C  if SIDE = 'L' and TRANS = 'C', or
!>
!>       C * Q  if SIDE = 'R' and TRANS = 'N', or
!>
!>       C * Q**H if SIDE = 'R' and TRANS = 'C',
!>
!> where Q is a complex unitary matrix defined as the product of k
!> elementary reflectors
!>
!>       Q = H(1)**H H(2)**H . . . H(k)**H
!>
!> as returned by CGERQF. Q is of order m if SIDE = 'L' and of order n
!> if SIDE = 'R'.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left !> = 'R': apply Q or Q**H from the Right !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': apply Q (No transpose) !> = 'C': apply Q**H (Conjugate transpose) !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines !> the matrix Q. !> If SIDE = 'L', M >= K >= 0; !> if SIDE = 'R', N >= K >= 0. !>
[in]	A	!> A is COMPLEX array, dimension !> (LDA,M) if SIDE = 'L', !> (LDA,N) if SIDE = 'R' !> The i-th row must contain the vector which defines the !> elementary reflector H(i), for i = 1,2,...,k, as returned by !> CGERQF in the last k rows of its array argument A. !> A is modified by the routine but restored on exit. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,K). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGERQF. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the m-by-n matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension !> (N) if SIDE = 'L', !> (M) if SIDE = 'R' !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 157 of file cunmr2.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            INFO, K, LDA, LDC, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( LDC, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     Unblocked application of the K reflectors stored in the rows of
*     A to the matrix C, one reflector per CLARF call.
*
*     .. Parameters ..
      COMPLEX            CONE
      PARAMETER          ( CONE = ( 1.0E+0, 0.0E+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LSIDE, NOCONJ
      INTEGER            IFRST, ILAST, ISTEP, J, JD, NCOLS, NORD, NROWS
      COMPLEX            DSAVE, TSCAL
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           LSAME
*     ..
*     .. External Subroutines ..
      EXTERNAL           CLACGV, CLARF, XERBLA
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          CONJG, MAX
*     ..
*     .. Executable Statements ..
*
*     Decode the option characters
*
      LSIDE = LSAME( SIDE, 'L' )
      NOCONJ = LSAME( TRANS, 'N' )
*
*     NORD is the order of Q
*
      NORD = N
      IF( LSIDE ) NORD = M
*
*     Validate the arguments.  The tests run from the last argument
*     to the first, so the lowest-numbered offending argument is the
*     one left in INFO.
*
      INFO = 0
      IF( LDC.LT.MAX( 1, M ) ) INFO = -10
      IF( LDA.LT.MAX( 1, K ) ) INFO = -7
      IF( K.LT.0 .OR. K.GT.NORD ) INFO = -5
      IF( N.LT.0 ) INFO = -4
      IF( M.LT.0 ) INFO = -3
      IF( .NOT.( NOCONJ .OR. LSAME( TRANS, 'C' ) ) ) INFO = -2
      IF( .NOT.( LSIDE .OR. LSAME( SIDE, 'R' ) ) ) INFO = -1
      IF( INFO.NE.0 ) THEN
         CALL XERBLA( 'CUNMR2', -INFO )
         RETURN
      END IF
*
*     Nothing to do for an empty C or an empty set of reflectors
*
      IF( M.EQ.0 .OR. N.EQ.0 .OR. K.EQ.0 ) RETURN
*
*     Reflectors are visited in increasing order when exactly one of
*     "apply from the left" and "no transpose" holds, otherwise in
*     decreasing order.
*
      IF( LSIDE .NEQV. NOCONJ ) THEN
         IFRST = 1
         ILAST = K
         ISTEP = 1
      ELSE
         IFRST = K
         ILAST = 1
         ISTEP = -1
      END IF
*
*     Start from the full size of C; the dimension on the side being
*     multiplied is narrowed for every reflector below.
*
      NROWS = M
      NCOLS = N
*
      DO J = IFRST, ILAST, ISTEP
*
*        Reflector J acts on the leading JD rows (SIDE = 'L') or
*        columns (SIDE = 'R') of C; JD is also the column of A that
*        holds its diagonal entry.
*
         JD = NORD - K + J
         IF( LSIDE ) THEN
            NROWS = JD
         ELSE
            NCOLS = JD
         END IF
*
*        Scalar factor: conjugated when Q itself is applied
*
         TSCAL = TAU( J )
         IF( NOCONJ ) TSCAL = CONJG( TSCAL )
*
*        Conjugate row J of A in place, put a one on its diagonal
*        entry for the call, apply the reflector, then undo both
*        changes so that A is restored.
*
         CALL CLACGV( JD-1, A( J, 1 ), LDA )
         DSAVE = A( J, JD )
         A( J, JD ) = CONE
         CALL CLARF( SIDE, NROWS, NCOLS, A( J, 1 ), LDA, TSCAL, C,
     $               LDC, WORK )
         A( J, JD ) = DSAVE
         CALL CLACGV( JD-1, A( J, 1 ), LDA )
      END DO
      RETURN
*
*     End of CUNMR2
*

◆ cunmr3()

subroutine cunmr3	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	k,
		integer	l,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	info )

CUNMR3 multiplies a general matrix by the unitary matrix from a RZ factorization determined by ctzrzf (unblocked algorithm).

Download CUNMR3 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNMR3 overwrites the general complex m by n matrix C with
!>
!>       Q * C  if SIDE = 'L' and TRANS = 'N', or
!>
!>       Q**H* C  if SIDE = 'L' and TRANS = 'C', or
!>
!>       C * Q  if SIDE = 'R' and TRANS = 'N', or
!>
!>       C * Q**H if SIDE = 'R' and TRANS = 'C',
!>
!> where Q is a complex unitary matrix defined as the product of k
!> elementary reflectors
!>
!>       Q = H(1) H(2) . . . H(k)
!>
!> as returned by CTZRZF. Q is of order m if SIDE = 'L' and of order n
!> if SIDE = 'R'.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left !> = 'R': apply Q or Q**H from the Right !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': apply Q (No transpose) !> = 'C': apply Q**H (Conjugate transpose) !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines !> the matrix Q. !> If SIDE = 'L', M >= K >= 0; !> if SIDE = 'R', N >= K >= 0. !>
[in]	L	!> L is INTEGER !> The number of columns of the matrix A containing !> the meaningful part of the Householder reflectors. !> If SIDE = 'L', M >= L >= 0, if SIDE = 'R', N >= L >= 0. !>
[in]	A	!> A is COMPLEX array, dimension !> (LDA,M) if SIDE = 'L', !> (LDA,N) if SIDE = 'R' !> The i-th row must contain the vector which defines the !> elementary reflector H(i), for i = 1,2,...,k, as returned by !> CTZRZF in the last k rows of its array argument A. !> A is modified by the routine but restored on exit. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,K). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CTZRZF. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the m-by-n matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension !> (N) if SIDE = 'L', !> (M) if SIDE = 'R' !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: A. Petitet, Computer Science Dept., Univ. of Tenn., Knoxville, USA

Further Details:

!>

Definition at line 176 of file cunmr3.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            INFO, K, L, LDA, LDC, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( LDC, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     Unblocked application of the K reflectors stored in the rows of
*     A to the matrix C, one reflector per CLARZ call.
*
*     .. Local Scalars ..
      LOGICAL            LSIDE, NOCONJ
      INTEGER            CCOL, CROW, IFRST, ILAST, ISTEP, J, NCOLS,
     $                   NORD, NROWS, VCOL
      COMPLEX            TSCAL
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           LSAME
*     ..
*     .. External Subroutines ..
      EXTERNAL           CLARZ, XERBLA
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          CONJG, MAX
*     ..
*     .. Executable Statements ..
*
*     Decode the option characters
*
      LSIDE = LSAME( SIDE, 'L' )
      NOCONJ = LSAME( TRANS, 'N' )
*
*     NORD is the order of Q
*
      NORD = N
      IF( LSIDE ) NORD = M
*
*     Validate the arguments.  The tests run from the last argument
*     to the first, so the lowest-numbered offending argument is the
*     one left in INFO.  L is bounded by M for SIDE = 'L' and by N
*     otherwise, i.e. by NORD.
*
      INFO = 0
      IF( LDC.LT.MAX( 1, M ) ) INFO = -11
      IF( LDA.LT.MAX( 1, K ) ) INFO = -8
      IF( L.LT.0 .OR. L.GT.NORD ) INFO = -6
      IF( K.LT.0 .OR. K.GT.NORD ) INFO = -5
      IF( N.LT.0 ) INFO = -4
      IF( M.LT.0 ) INFO = -3
      IF( .NOT.( NOCONJ .OR. LSAME( TRANS, 'C' ) ) ) INFO = -2
      IF( .NOT.( LSIDE .OR. LSAME( SIDE, 'R' ) ) ) INFO = -1
      IF( INFO.NE.0 ) THEN
         CALL XERBLA( 'CUNMR3', -INFO )
         RETURN
      END IF
*
*     Nothing to do for an empty C or an empty set of reflectors
*
      IF( M.EQ.0 .OR. N.EQ.0 .OR. K.EQ.0 ) RETURN
*
*     Reflectors are visited in increasing order when exactly one of
*     "apply from the left" and "no transpose" holds, otherwise in
*     decreasing order.
*
      IF( LSIDE .NEQV. NOCONJ ) THEN
         IFRST = 1
         ILAST = K
         ISTEP = 1
      ELSE
         IFRST = K
         ILAST = 1
         ISTEP = -1
      END IF
*
*     VCOL is the first of the last L columns of A, which is where
*     the reflector vector passed to CLARZ starts.  The sub-block of
*     C starts as the whole matrix and is narrowed per reflector on
*     the side being multiplied.
*
      VCOL = NORD - L + 1
      NROWS = M
      NCOLS = N
      CROW = 1
      CCOL = 1
*
      DO J = IFRST, ILAST, ISTEP
         IF( LSIDE ) THEN
*
*           H(j) or H(j)**H is applied to C(j:m,1:n)
*
            NROWS = M - J + 1
            CROW = J
         ELSE
*
*           H(j) or H(j)**H is applied to C(1:m,j:n)
*
            NCOLS = N - J + 1
            CCOL = J
         END IF
*
*        Scalar factor: conjugated when Q**H is applied
*
         TSCAL = TAU( J )
         IF( .NOT.NOCONJ ) TSCAL = CONJG( TSCAL )
*
         CALL CLARZ( SIDE, NROWS, NCOLS, L, A( J, VCOL ), LDA, TSCAL,
     $               C( CROW, CCOL ), LDC, WORK )
      END DO
*
      RETURN
*
*     End of CUNMR3
*

◆ cunmrq()

subroutine cunmrq	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	k,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNMRQ

Download CUNMRQ + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNMRQ overwrites the general complex M-by-N matrix C with
!>
!>                 SIDE = 'L'     SIDE = 'R'
!> TRANS = 'N':      Q * C          C * Q
!> TRANS = 'C':      Q**H * C       C * Q**H
!>
!> where Q is a complex unitary matrix defined as the product of k
!> elementary reflectors
!>
!>       Q = H(1)**H H(2)**H . . . H(k)**H
!>
!> as returned by CGERQF. Q is of order M if SIDE = 'L' and of order N
!> if SIDE = 'R'.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left; !> = 'R': apply Q or Q**H from the Right. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': No transpose, apply Q; !> = 'C': Conjugate transpose, apply Q**H. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines !> the matrix Q. !> If SIDE = 'L', M >= K >= 0; !> if SIDE = 'R', N >= K >= 0. !>
[in]	A	!> A is COMPLEX array, dimension !> (LDA,M) if SIDE = 'L', !> (LDA,N) if SIDE = 'R' !> The i-th row must contain the vector which defines the !> elementary reflector H(i), for i = 1,2,...,k, as returned by !> CGERQF in the last k rows of its array argument A. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,K). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CGERQF. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If SIDE = 'L', LWORK >= max(1,N); !> if SIDE = 'R', LWORK >= max(1,M). !> For good performance, LWORK should generally be larger. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 166 of file cunmrq.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            INFO, K, LDA, LDC, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( LDC, * ), TAU( * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     Outline: validate the arguments, answer a workspace query
*     (LWORK = -1) through WORK( 1 ), then apply the K reflectors to C
*     either one at a time (CUNMR2) or in blocks of NB reflectors
*     (CLARFT builds the triangular factor, CLARFB applies the block).
*
*     .. Parameters ..
*     NBMAX caps the block size.  The triangular factor of each block
*     reflector is stored at WORK( IWT ) with leading dimension LDT,
*     so TSIZE entries are reserved for it after the NW*NB entries
*     passed to CLARFB as its work array.
      INTEGER            NBMAX, LDT, TSIZE
      parameter( nbmax = 64, ldt = nbmax+1,
     $                     tsize = ldt*nbmax )
*     ..
*     .. Local Scalars ..
      LOGICAL            LEFT, LQUERY, NOTRAN
      CHARACTER          TRANST
      INTEGER            I, I1, I2, I3, IB, IINFO, IWT, LDWORK, LWKOPT,
     $                   MI, NB, NBMIN, NI, NQ, NW
      REAL               RWKOPT
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      EXTERNAL           lsame, ilaenv
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarfb, clarft, cunmr2, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          epsilon, int, max, min, real
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      info = 0
      left = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
      lquery = ( lwork.EQ.-1 )
*
*     NQ is the order of Q and NW is the minimum dimension of WORK
*
      IF( left ) THEN
         nq = m
         nw = max( 1, n )
      ELSE
         nq = n
         nw = max( 1, m )
      END IF
      IF( .NOT.left .AND. .NOT.lsame( side, 'R' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'C' ) ) THEN
         info = -2
      ELSE IF( m.LT.0 ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( k.LT.0 .OR. k.GT.nq ) THEN
         info = -5
      ELSE IF( lda.LT.max( 1, k ) ) THEN
         info = -7
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -10
      ELSE IF( lwork.LT.nw .AND. .NOT.lquery ) THEN
         info = -12
      END IF
*
      IF( info.EQ.0 ) THEN
*
*        Compute the workspace requirements
*
         IF( m.EQ.0 .OR. n.EQ.0 ) THEN
            lwkopt = 1
         ELSE
            nb = min( nbmax, ilaenv( 1, 'CUNMRQ', side // trans, m, n,
     $                               k, -1 ) )
            lwkopt = nw*nb + tsize
         END IF
*
*        WORK is single precision, so a large LWKOPT (above 2**24 for
*        IEEE single) may not be exactly representable and could be
*        rounded downward.  Nudge the converted value upward so that
*        a caller truncating WORK( 1 ) never gets less than LWKOPT.
*
         rwkopt = real( lwkopt )
         IF( int( rwkopt ).LT.lwkopt )
     $      rwkopt = rwkopt*( 1.0e+0+epsilon( 0.0e+0 ) )
         work( 1 ) = rwkopt
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNMRQ', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.EQ.0 .OR. n.EQ.0 ) THEN
         RETURN
      END IF
*
*     Determine the block size.  When the caller supplied less than
*     the optimal workspace, shrink NB to what fits after reserving
*     TSIZE entries for the triangular factor.
*
      nbmin = 2
      ldwork = nw
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
         IF( lwork.LT.lwkopt ) THEN
            nb = (lwork-tsize) / ldwork
            nbmin = max( 2, ilaenv( 2, 'CUNMRQ', side // trans, m, n, k,
     $              -1 ) )
         END IF
      END IF
*
      IF( nb.LT.nbmin .OR. nb.GE.k ) THEN
*
*        Use unblocked code
*
         CALL cunmr2( side, trans, m, n, k, a, lda, tau, c, ldc, work,
     $                iinfo )
      ELSE
*
*        Use blocked code
*
*        IWT is where the triangular factor lives inside WORK
*
         iwt = 1 + nw*nb
*
*        Choose the direction in which the blocks are visited
*
         IF( ( left .AND. .NOT.notran ) .OR.
     $       ( .NOT.left .AND. notran ) ) THEN
            i1 = 1
            i2 = k
            i3 = nb
         ELSE
            i1 = ( ( k-1 ) / nb )*nb + 1
            i2 = 1
            i3 = -nb
         END IF
*
*        The dimension of C not touched by the block size is fixed
*
         IF( left ) THEN
            ni = n
         ELSE
            mi = m
         END IF
*
*        CLARFB is called with the opposite of TRANS
*
         IF( notran ) THEN
            transt = 'C'
         ELSE
            transt = 'N'
         END IF
*
         DO 10 i = i1, i2, i3
            ib = min( nb, k-i+1 )
*
*           Form the triangular factor of the block reflector
*           H = H(i+ib-1) . . . H(i+1) H(i)
*
            CALL clarft( 'Backward', 'Rowwise', nq-k+i+ib-1, ib,
     $                   a( i, 1 ), lda, tau( i ), work( iwt ), ldt )
            IF( left ) THEN
*
*              H or H**H is applied to C(1:m-k+i+ib-1,1:n)
*
               mi = m - k + i + ib - 1
            ELSE
*
*              H or H**H is applied to C(1:m,1:n-k+i+ib-1)
*
               ni = n - k + i + ib - 1
            END IF
*
*           Apply H or H**H
*
            CALL clarfb( side, transt, 'Backward', 'Rowwise', mi, ni,
     $                   ib, a( i, 1 ), lda, work( iwt ), ldt, c, ldc,
     $                   work, ldwork )
   10    CONTINUE
      END IF
*
*     Report the optimal workspace size (rounded up as above)
*
      work( 1 ) = rwkopt
      RETURN
*
*     End of CUNMRQ
*

◆ cunmrz()

subroutine cunmrz	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	k,
		integer	l,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNMRZ

Download CUNMRZ + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNMRZ overwrites the general complex M-by-N matrix C with
!>
!>                 SIDE = 'L'     SIDE = 'R'
!> TRANS = 'N':      Q * C          C * Q
!> TRANS = 'C':      Q**H * C       C * Q**H
!>
!> where Q is a complex unitary matrix defined as the product of k
!> elementary reflectors
!>
!>       Q = H(1) H(2) . . . H(k)
!>
!> as returned by CTZRZF. Q is of order M if SIDE = 'L' and of order N
!> if SIDE = 'R'.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left; !> = 'R': apply Q or Q**H from the Right. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': No transpose, apply Q; !> = 'C': Conjugate transpose, apply Q**H. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	K	!> K is INTEGER !> The number of elementary reflectors whose product defines !> the matrix Q. !> If SIDE = 'L', M >= K >= 0; !> if SIDE = 'R', N >= K >= 0. !>
[in]	L	!> L is INTEGER !> The number of columns of the matrix A containing !> the meaningful part of the Householder reflectors. !> If SIDE = 'L', M >= L >= 0, if SIDE = 'R', N >= L >= 0. !>
[in]	A	!> A is COMPLEX array, dimension !> (LDA,M) if SIDE = 'L', !> (LDA,N) if SIDE = 'R' !> The i-th row must contain the vector which defines the !> elementary reflector H(i), for i = 1,2,...,k, as returned by !> CTZRZF in the last k rows of its array argument A. !> A is modified by the routine but restored on exit. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,K). !>
[in]	TAU	!> TAU is COMPLEX array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CTZRZF. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If SIDE = 'L', LWORK >= max(1,N); !> if SIDE = 'R', LWORK >= max(1,M). !> For good performance, LWORK should generally be larger. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: A. Petitet, Computer Science Dept., Univ. of Tenn., Knoxville, USA

Further Details:

!>

Definition at line 185 of file cunmrz.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CUNMRZ.  It validates the arguments, stores the optimal
*     workspace size in WORK(1), and then applies the K reflectors to
*     C either through the unblocked routine CUNMR3 or, block by
*     block, through CLARZT (build the triangular factor T) followed
*     by CLARZB (apply the block reflector).
*
*     INFO is set to -i when the i-th argument fails its check; in
*     that case XERBLA is called and C is left untouched.
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            INFO, K, L, LDA, LDC, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( LDC, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     NBMAX caps the block size NB.  LDT is the leading dimension used
*     for the triangular factor T, and TSIZE = LDT*NBMAX is the number
*     of WORK entries set aside for T (it starts at WORK(IWT)).
      INTEGER            NBMAX, LDT, TSIZE
      parameter( nbmax = 64, ldt = nbmax+1,
     $                     tsize = ldt*nbmax )
*     ..
*     .. Local Scalars ..
      LOGICAL            LEFT, LQUERY, NOTRAN
      CHARACTER          TRANST
      INTEGER            I, I1, I2, I3, IB, IC, IINFO, IWT, JA, JC,
     $                   LDWORK, LWKOPT, MI, NB, NBMIN, NI, NQ, NW
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      EXTERNAL           lsame, ilaenv
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarzb, clarzt, cunmr3, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      info = 0
      left = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
*     LWORK = -1 requests a workspace query only.
      lquery = ( lwork.EQ.-1 )
*
*     NQ is the order of Q and NW is the minimum dimension of WORK
*
      IF( left ) THEN
         nq = m
         nw = max( 1, n )
      ELSE
         nq = n
         nw = max( 1, m )
      END IF
*     The first failing check wins; the INFO values are the negated
*     positions of the offending arguments in the argument list.
      IF( .NOT.left .AND. .NOT.lsame( side, 'R' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'C' ) ) THEN
         info = -2
      ELSE IF( m.LT.0 ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( k.LT.0 .OR. k.GT.nq ) THEN
         info = -5
      ELSE IF( l.LT.0 .OR. ( left .AND. ( l.GT.m ) ) .OR.
     $         ( .NOT.left .AND. ( l.GT.n ) ) ) THEN
         info = -6
      ELSE IF( lda.LT.max( 1, k ) ) THEN
         info = -8
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -11
      ELSE IF( lwork.LT.nw .AND. .NOT.lquery ) THEN
         info = -13
      END IF
*
      IF( info.EQ.0 ) THEN
*
*        Compute the workspace requirements
*
*        The optimal size is NW*NB entries for the CLARZB work array
*        plus TSIZE entries for T.  The block size is queried under
*        the name 'CUNMRQ', not 'CUNMRZ'.
*
         IF( m.EQ.0 .OR. n.EQ.0 ) THEN
            lwkopt = 1
         ELSE
            nb = min( nbmax, ilaenv( 1, 'CUNMRQ', side // trans, m, n,
     $                               k, -1 ) )
            lwkopt = nw*nb + tsize
         END IF
         work( 1 ) = lwkopt
      END IF
*
*     Report an argument error, or stop here for a workspace query
*     (WORK(1) already holds LWKOPT in that case).
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNMRZ', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.EQ.0 .OR. n.EQ.0 ) THEN
         RETURN
      END IF
*
*     Determine the block size.
*
*     NOTE(review): NB was already computed above from the identical
*     ILAENV call whenever this point is reached (INFO = 0, M and N
*     nonzero), so this second query looks redundant - confirm.
*
      nb = min( nbmax, ilaenv( 1, 'CUNMRQ', side // trans, m, n, k,
     $                         -1 ) )
      nbmin = 2
      ldwork = nw
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
         IF( lwork.LT.lwkopt ) THEN
*
*           Less than the optimal workspace was supplied: shrink NB
*           to what fits once TSIZE entries are reserved for T.  The
*           result may drop below NBMIN (even to zero or negative),
*           which selects the unblocked path below.
*
            nb = (lwork-tsize) / ldwork
            nbmin = max( 2, ilaenv( 2, 'CUNMRQ', side // trans, m, n, k,
     $                              -1 ) )
         END IF
      END IF
*
      IF( nb.LT.nbmin .OR. nb.GE.k ) THEN
*
*        Use unblocked code
*
         CALL cunmr3( side, trans, m, n, k, l, a, lda, tau, c, ldc,
     $                work, iinfo )
      ELSE
*
*        Use blocked code
*
*        WORK(1:NW*NB) is the CLARZB work array; T starts right after
*        it at WORK(IWT).
*
         iwt = 1 + nw*nb
*
*        Choose the order in which the blocks are visited: ascending
*        from row 1, or descending from the first row of the last
*        (possibly short) block.
*
         IF( ( left .AND. .NOT.notran ) .OR.
     $       ( .NOT.left .AND. notran ) ) THEN
            i1 = 1
            i2 = k
            i3 = nb
         ELSE
            i1 = ( ( k-1 ) / nb )*nb + 1
            i2 = 1
            i3 = -nb
         END IF
*
*        Set the extent and offset that stay fixed across blocks; the
*        other pair (MI/IC or NI/JC) is updated inside the loop.
*        JA = NQ-L+1 is the first of the last L columns of A, where
*        the reflector vectors passed to CLARZT/CLARZB begin.
*
         IF( left ) THEN
            ni = n
            jc = 1
            ja = m - l + 1
         ELSE
            mi = m
            ic = 1
            ja = n - l + 1
         END IF
*
*        CLARZB is called with the opposite transpose flag to TRANS.
*
         IF( notran ) THEN
            transt = 'C'
         ELSE
            transt = 'N'
         END IF
*
         DO 10 i = i1, i2, i3
*
*           IB is the number of reflectors in this block (the last
*           block may hold fewer than NB).
*
            ib = min( nb, k-i+1 )
*
*           Form the triangular factor of the block reflector
*           H = H(i+ib-1) . . . H(i+1) H(i)
*
            CALL clarzt( 'Backward', 'Rowwise', l, ib, a( i, ja ), lda,
     $                   tau( i ), work( iwt ), ldt )
*
            IF( left ) THEN
*
*              H or H**H is applied to C(i:m,1:n)
*
               mi = m - i + 1
               ic = i
            ELSE
*
*              H or H**H is applied to C(1:m,i:n)
*
               ni = n - i + 1
               jc = i
            END IF
*
*           Apply H or H**H
*
            CALL clarzb( side, transt, 'Backward', 'Rowwise', mi, ni,
     $                   ib, l, a( i, ja ), lda, work( iwt ), ldt,
     $                   c( ic, jc ), ldc, work, ldwork )
   10    CONTINUE
*
      END IF
*
*     WORK(1) was used as scratch above; restore the optimal size.
*
      work( 1 ) = lwkopt
*
      RETURN
*
*     End of CUNMRZ
*

◆ cunmtr()

subroutine cunmtr	(	character	side,
		character	uplo,
		character	trans,
		integer	m,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CUNMTR

Download CUNMTR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUNMTR overwrites the general complex M-by-N matrix C with
!>
!>                 SIDE = 'L'     SIDE = 'R'
!> TRANS = 'N':      Q * C          C * Q
!> TRANS = 'C':      Q**H * C       C * Q**H
!>
!> where Q is a complex unitary matrix of order nq, with nq = m if
!> SIDE = 'L' and nq = n if SIDE = 'R'. Q is defined as the product of
!> nq-1 elementary reflectors, as returned by CHETRD:
!>
!> if UPLO = 'U', Q = H(nq-1) . . . H(2) H(1);
!>
!> if UPLO = 'L', Q = H(1) H(2) . . . H(nq-1).
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left; !> = 'R': apply Q or Q**H from the Right. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangle of A contains elementary reflectors !> from CHETRD; !> = 'L': Lower triangle of A contains elementary reflectors !> from CHETRD. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': No transpose, apply Q; !> = 'C': Conjugate transpose, apply Q**H. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	A	!> A is COMPLEX array, dimension !> (LDA,M) if SIDE = 'L' !> (LDA,N) if SIDE = 'R' !> The vectors which define the elementary reflectors, as !> returned by CHETRD. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. !> LDA >= max(1,M) if SIDE = 'L'; LDA >= max(1,N) if SIDE = 'R'. !>
[in]	TAU	!> TAU is COMPLEX array, dimension !> (M-1) if SIDE = 'L' !> (N-1) if SIDE = 'R' !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CHETRD. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If SIDE = 'L', LWORK >= max(1,N); !> if SIDE = 'R', LWORK >= max(1,M). !> For optimum performance LWORK >= N*NB if SIDE = 'L', and !> LWORK >= M*NB if SIDE = 'R', where NB is the optimal !> blocksize. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 170 of file cunmtr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CUNMTR.  The work is delegated to CUNMQL (UPLO = 'U')
*     or CUNMQR (UPLO = 'L'), which receive the NQ-1 reflectors
*     stored in A together with a sub-problem that is one row
*     (SIDE = 'L') or one column (SIDE = 'R') smaller than C.
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS, UPLO
      INTEGER            INFO, LDA, LDC, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), C( LDC, * ), TAU( * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      LOGICAL            ONLEFT, UPTRI, WSQRY
      CHARACTER*6        KERNEL
      INTEGER            BLK, COL0, MINWRK, NCOLS, NREFL, NROWS,
     $                   OPTLW, QORD, ROW0, SUBINF
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      EXTERNAL           ilaenv, lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cunmql, cunmqr, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Decode the option characters
*
      onleft = lsame( side, 'L' )
      uptri = lsame( uplo, 'U' )
      wsqry = ( lwork.EQ.-1 )
*
*     QORD is the order of Q, MINWRK the smallest legal LWORK, and
*     NROWS-by-NCOLS the shape of the sub-problem handed to the
*     kernel, which applies NREFL = QORD-1 reflectors.
*
      IF( onleft ) THEN
         qord = m
         minwrk = max( 1, n )
         nrows = m - 1
         ncols = n
      ELSE
         qord = n
         minwrk = max( 1, m )
         nrows = m
         ncols = n - 1
      END IF
      nrefl = qord - 1
*
*     Validate the arguments; the first violation determines INFO
*
      info = 0
      IF( .NOT.( onleft .OR. lsame( side, 'R' ) ) ) THEN
         info = -1
      ELSE IF( .NOT.( uptri .OR. lsame( uplo, 'L' ) ) ) THEN
         info = -2
      ELSE IF( .NOT.( lsame( trans, 'N' ) .OR.
     $         lsame( trans, 'C' ) ) ) THEN
         info = -3
      ELSE IF( m.LT.0 ) THEN
         info = -4
      ELSE IF( n.LT.0 ) THEN
         info = -5
      ELSE IF( lda.LT.max( 1, qord ) ) THEN
         info = -7
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -10
      ELSE IF( lwork.LT.minwrk .AND. .NOT.wsqry ) THEN
         info = -12
      END IF
*
*     Illegal argument: report it and leave WORK and C untouched
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUNMTR', -info )
         RETURN
      END IF
*
*     Optimal workspace: MINWRK times the block size of the kernel
*     that will actually be called
*
      IF( uptri ) THEN
         kernel = 'CUNMQL'
      ELSE
         kernel = 'CUNMQR'
      END IF
      blk = ilaenv( 1, kernel, side // trans, nrows, ncols, nrefl,
     $              -1 )
      optlw = minwrk*blk
      work( 1 ) = optlw
*
*     A workspace query ends here
*
      IF( wsqry ) THEN
         RETURN
      END IF
*
*     Nothing to do for an empty C or when Q has order 1
*
      IF( m.EQ.0 .OR. n.EQ.0 .OR. qord.EQ.1 ) THEN
         work( 1 ) = 1
         RETURN
      END IF
*
      IF( uptri ) THEN
*
*        Reflectors come from CHETRD with UPLO = 'U': they start in
*        column 2 of A and act on the leading part of C
*
         CALL cunmql( side, trans, nrows, ncols, nrefl, a( 1, 2 ),
     $                lda, tau, c, ldc, work, lwork, subinf )
      ELSE
*
*        Reflectors come from CHETRD with UPLO = 'L': they start in
*        row 2 of A and act on C with its first row (SIDE = 'L') or
*        first column (SIDE = 'R') skipped
*
         row0 = 1
         col0 = 1
         IF( onleft ) THEN
            row0 = 2
         ELSE
            col0 = 2
         END IF
         CALL cunmqr( side, trans, nrows, ncols, nrefl, a( 2, 1 ),
     $                lda, tau, c( row0, col0 ), ldc, work, lwork,
     $                subinf )
      END IF
*
*     Report the optimal workspace size for the whole routine
*
      work( 1 ) = optlw
      RETURN
*
*     End of CUNMTR
*

◆ cupgtr()

subroutine cupgtr	(	character	uplo,
		integer	n,
		complex, dimension( * )	ap,
		complex, dimension( * )	tau,
		complex, dimension( ldq, * )	q,
		integer	ldq,
		complex, dimension( * )	work,
		integer	info )

CUPGTR

Download CUPGTR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUPGTR generates a complex unitary matrix Q which is defined as the
!> product of n-1 elementary reflectors H(i) of order n, as returned by
!> CHPTRD using packed storage:
!>
!> if UPLO = 'U', Q = H(n-1) . . . H(2) H(1),
!>
!> if UPLO = 'L', Q = H(1) H(2) . . . H(n-1).
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangular packed storage used in previous !> call to CHPTRD; !> = 'L': Lower triangular packed storage used in previous !> call to CHPTRD. !>
[in]	N	!> N is INTEGER !> The order of the matrix Q. N >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension (N*(N+1)/2) !> The vectors which define the elementary reflectors, as !> returned by CHPTRD. !>
[in]	TAU	!> TAU is COMPLEX array, dimension (N-1) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CHPTRD. !>
[out]	Q	!> Q is COMPLEX array, dimension (LDQ,N) !> The N-by-N unitary matrix Q. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. LDQ >= max(1,N). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (N-1) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 113 of file cupgtr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CUPGTR.  The reflector vectors are copied out of the
*     packed array AP into Q, one border row and column of Q are set
*     to those of the identity, and CUNG2L (UPLO = 'U') or CUNG2R
*     (UPLO = 'L') then generates the remaining (N-1)-by-(N-1) block.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDQ, N
*     ..
*     .. Array Arguments ..
      COMPLEX            AP( * ), Q( LDQ, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CZERO, CONE
      parameter( czero = ( 0.0e+0, 0.0e+0 ),
     $                   cone = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPTRI
      INTEGER            COL, POS, ROW, SUBINF
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           cung2l, cung2r, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; the first violation determines INFO
*
      uptri = lsame( uplo, 'U' )
      info = 0
      IF( .NOT.( uptri .OR. lsame( uplo, 'L' ) ) ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -6
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUPGTR', -info )
         RETURN
      END IF
*
*     An empty matrix needs no work
*
      IF( n.EQ.0 ) THEN
         RETURN
      END IF
*
      IF( uptri ) THEN
*
*        Reflectors come from CHPTRD with UPLO = 'U'.
*
*        Last row and last column of Q become those of the identity
*
         DO col = 1, n - 1
            q( n, col ) = czero
            q( col, n ) = czero
         END DO
         q( n, n ) = cone
*
*        Copy the strictly upper part of columns 1..N-1 out of AP.
*        POS walks through AP; after each column it skips two
*        further entries before the next column's data begins.
*
         pos = 2
         DO col = 1, n - 1
            DO row = 1, col - 1
               q( row, col ) = ap( pos )
               pos = pos + 1
            END DO
            pos = pos + 2
         END DO
*
*        Generate Q(1:n-1,1:n-1)
*
         CALL cung2l( n-1, n-1, n-1, q, ldq, tau, work, subinf )
*
      ELSE
*
*        Reflectors come from CHPTRD with UPLO = 'L'.
*
*        First row and first column of Q become those of the identity
*
         q( 1, 1 ) = cone
         DO col = 2, n
            q( col, 1 ) = czero
            q( 1, col ) = czero
         END DO
*
*        Copy the strictly lower part of columns 2..N out of AP.
*        POS walks through AP; after each column it skips two
*        further entries before the next column's data begins.
*
         pos = 3
         DO col = 2, n
            DO row = col + 1, n
               q( row, col ) = ap( pos )
               pos = pos + 1
            END DO
            pos = pos + 2
         END DO
*
*        Generate Q(2:n,2:n); skipped when N = 1
*
         IF( n.GT.1 ) THEN
            CALL cung2r( n-1, n-1, n-1, q( 2, 2 ), ldq, tau, work,
     $                   subinf )
         END IF
      END IF
      RETURN
*
*     End of CUPGTR
*

◆ cupmtr()

subroutine cupmtr	(	character	side,
		character	uplo,
		character	trans,
		integer	m,
		integer	n,
		complex, dimension( * )	ap,
		complex, dimension( * )	tau,
		complex, dimension( ldc, * )	c,
		integer	ldc,
		complex, dimension( * )	work,
		integer	info )

CUPMTR

Download CUPMTR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> CUPMTR overwrites the general complex M-by-N matrix C with
!>
!>                 SIDE = 'L'     SIDE = 'R'
!> TRANS = 'N':      Q * C          C * Q
!> TRANS = 'C':      Q**H * C       C * Q**H
!>
!> where Q is a complex unitary matrix of order nq, with nq = m if
!> SIDE = 'L' and nq = n if SIDE = 'R'. Q is defined as the product of
!> nq-1 elementary reflectors, as returned by CHPTRD using packed
!> storage:
!>
!> if UPLO = 'U', Q = H(nq-1) . . . H(2) H(1);
!>
!> if UPLO = 'L', Q = H(1) H(2) . . . H(nq-1).
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left; !> = 'R': apply Q or Q**H from the Right. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': Upper triangular packed storage used in previous !> call to CHPTRD; !> = 'L': Lower triangular packed storage used in previous !> call to CHPTRD. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': No transpose, apply Q; !> = 'C': Conjugate transpose, apply Q**H. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	AP	!> AP is COMPLEX array, dimension !> (M*(M+1)/2) if SIDE = 'L' !> (N*(N+1)/2) if SIDE = 'R' !> The vectors which define the elementary reflectors, as !> returned by CHPTRD. AP is modified by the routine but !> restored on exit. !>
[in]	TAU	!> TAU is COMPLEX array, dimension (M-1) if SIDE = 'L' !> or (N-1) if SIDE = 'R' !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i), as returned by CHPTRD. !>
[in,out]	C	!> C is COMPLEX array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX array, dimension !> (N) if SIDE = 'L' !> (M) if SIDE = 'R' !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 148 of file cupmtr.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of CUPMTR.  After argument validation the NQ-1 reflectors
*     are applied to C one at a time with CLARF.  Each reflector
*     vector is read directly from the packed array AP: one entry,
*     AP(II), is temporarily overwritten with ONE for the call and
*     restored immediately afterwards.
*
*     INFO is set to -i when the i-th argument fails its check; in
*     that case XERBLA is called and C is left untouched.
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS, UPLO
      INTEGER            INFO, LDC, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            AP( * ), C( LDC, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE
      parameter( one = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
*     FORWRD selects ascending (1..NQ-1) or descending reflector
*     order.  II is the index into AP of the entry that is replaced
*     by ONE for the current reflector; AII holds its saved value.
*     TAUI is TAU(I) or its conjugate, depending on TRANS.
      LOGICAL            FORWRD, LEFT, NOTRAN, UPPER
      INTEGER            I, I1, I2, I3, IC, II, JC, MI, NI, NQ
      COMPLEX            AII, TAUI
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           clarf, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          conjg, max
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      info = 0
      left = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
      upper = lsame( uplo, 'U' )
*
*     NQ is the order of Q
*
      IF( left ) THEN
         nq = m
      ELSE
         nq = n
      END IF
*     The first failing check wins; the INFO values are the negated
*     positions of the offending arguments in the argument list.
      IF( .NOT.left .AND. .NOT.lsame( side, 'R' ) ) THEN
         info = -1
      ELSE IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -2
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'C' ) ) THEN
         info = -3
      ELSE IF( m.LT.0 ) THEN
         info = -4
      ELSE IF( n.LT.0 ) THEN
         info = -5
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -9
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CUPMTR', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
*     (When NQ = 1 the loops below run zero times, so C is also left
*     unchanged in that case.)
*
      IF( m.EQ.0 .OR. n.EQ.0 )
     $   RETURN
*
      IF( upper ) THEN
*
*        Q was determined by a call to CHPTRD with UPLO = 'U'
*
         forwrd = ( left .AND. notran ) .OR.
     $            ( .NOT.left .AND. .NOT.notran )
*
*        Set the loop bounds and the AP index II that belongs to the
*        first reflector visited (I = 1 going forward, I = NQ-1 going
*        backward).
*
         IF( forwrd ) THEN
            i1 = 1
            i2 = nq - 1
            i3 = 1
            ii = 2
         ELSE
            i1 = nq - 1
            i2 = 1
            i3 = -1
            ii = nq*( nq+1 ) / 2 - 1
         END IF
*
*        The extent of C along the side not touched by Q is fixed;
*        the other extent (MI or NI) is set per reflector below.
*
         IF( left ) THEN
            ni = n
         ELSE
            mi = m
         END IF
*
         DO 10 i = i1, i2, i3
            IF( left ) THEN
*
*              H(i) or H(i)**H is applied to C(1:i,1:n)
*
               mi = i
            ELSE
*
*              H(i) or H(i)**H is applied to C(1:m,1:i)
*
               ni = i
            END IF
*
*           Apply H(i) or H(i)**H
*
            IF( notran ) THEN
               taui = tau( i )
            ELSE
               taui = conjg( tau( i ) )
            END IF
*
*           The vector handed to CLARF is AP(II-I+1:II); its last
*           entry AP(II) is set to ONE for the call and restored
*           right after, so AP is unchanged on exit.
*
            aii = ap( ii )
            ap( ii ) = one
            CALL clarf( side, mi, ni, ap( ii-i+1 ), 1, taui, c, ldc,
     $                  work )
            ap( ii ) = aii
*
*           Move II to the entry for the next reflector in the
*           chosen direction (I still holds the current index).
*
            IF( forwrd ) THEN
               ii = ii + i + 2
            ELSE
               ii = ii - i - 1
            END IF
   10    CONTINUE
      ELSE
*
*        Q was determined by a call to CHPTRD with UPLO = 'L'.
*
         forwrd = ( left .AND. .NOT.notran ) .OR.
     $            ( .NOT.left .AND. notran )
*
*        Set the loop bounds and the AP index II that belongs to the
*        first reflector visited (I = 1 going forward, I = NQ-1 going
*        backward).
*
         IF( forwrd ) THEN
            i1 = 1
            i2 = nq - 1
            i3 = 1
            ii = 2
         ELSE
            i1 = nq - 1
            i2 = 1
            i3 = -1
            ii = nq*( nq+1 ) / 2 - 1
         END IF
*
*        Extent and offset of C along the side not touched by Q are
*        fixed; the other pair (MI/IC or NI/JC) is set per reflector.
*
         IF( left ) THEN
            ni = n
            jc = 1
         ELSE
            mi = m
            ic = 1
         END IF
*
         DO 20 i = i1, i2, i3
*
*           The vector handed to CLARF starts at AP(II); that first
*           entry is set to ONE for the call and restored afterwards.
*
            aii = ap( ii )
            ap( ii ) = one
            IF( left ) THEN
*
*              H(i) or H(i)**H is applied to C(i+1:m,1:n)
*
               mi = m - i
               ic = i + 1
            ELSE
*
*              H(i) or H(i)**H is applied to C(1:m,i+1:n)
*
               ni = n - i
               jc = i + 1
            END IF
*
*           Apply H(i) or H(i)**H
*
            IF( notran ) THEN
               taui = tau( i )
            ELSE
               taui = conjg( tau( i ) )
            END IF
            CALL clarf( side, mi, ni, ap( ii ), 1, taui, c( ic, jc ),
     $                  ldc, work )
            ap( ii ) = aii
*
*           Move II to the entry for the next reflector in the
*           chosen direction (I still holds the current index).
*
            IF( forwrd ) THEN
               ii = ii + nq - i + 1
            ELSE
               ii = ii - nq + i - 2
            END IF
   20    CONTINUE
      END IF
      RETURN
*
*     End of CUPMTR
*

◆ dorm22()

subroutine dorm22	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	n1,
		integer	n2,
		double precision, dimension( ldq, * )	q,
		integer	ldq,
		double precision, dimension( ldc, * )	c,
		integer	ldc,
		double precision, dimension( * )	work,
		integer	lwork,
		integer	info )

DORM22 multiplies a general matrix by a banded orthogonal matrix.

Download DORM22 + dependencies [TGZ] [ZIP] [TXT]

Purpose

!>
!>
!>  DORM22 overwrites the general real M-by-N matrix C with
!>
!>                  SIDE = 'L'     SIDE = 'R'
!>  TRANS = 'N':      Q * C          C * Q
!>  TRANS = 'T':      Q**T * C       C * Q**T
!>
!>  where Q is a real orthogonal matrix of order NQ, with NQ = M if
!>  SIDE = 'L' and NQ = N if SIDE = 'R'.
!>  The orthogonal matrix Q possesses a 2-by-2 block structure
!>
!>         [  Q11  Q12  ]
!>     Q = [            ]
!>         [  Q21  Q22  ],
!>
!>  where Q12 is an N1-by-N1 lower triangular matrix and Q21 is an
!>  N2-by-N2 upper triangular matrix.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**T from the Left; !> = 'R': apply Q or Q**T from the Right. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': apply Q (No transpose); !> = 'T': apply Q**T (Transpose). !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	N1
[in]	N2	!> N1 is INTEGER !> N2 is INTEGER !> The dimension of Q12 and Q21, respectively. N1, N2 >= 0. !> The following requirement must be satisfied: !> N1 + N2 = M if SIDE = 'L' and N1 + N2 = N if SIDE = 'R'. !>
[in]	Q	!> Q is DOUBLE PRECISION array, dimension !> (LDQ,M) if SIDE = 'L' !> (LDQ,N) if SIDE = 'R' !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. !> LDQ >= max(1,M) if SIDE = 'L'; LDQ >= max(1,N) if SIDE = 'R'. !>
[in,out]	C	!> C is DOUBLE PRECISION array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by Q*C or Q**T*C or C*Q**T or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If SIDE = 'L', LWORK >= max(1,N); !> if SIDE = 'R', LWORK >= max(1,M). !> For optimum performance LWORK >= M*N. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 161 of file dorm22.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     DORM22 overwrites the M-by-N matrix C with Q*C, Q**T*C, C*Q or
*     C*Q**T, as selected by SIDE ('L'/'R') and TRANS ('N'/'T').
*     Q (order NQ = N1+N2) is used as a 2-by-2 block matrix whose
*     (1,2) block is N1-by-N1 lower triangular and whose (2,1) block
*     is N2-by-N2 upper triangular, so every product is assembled
*     from two DTRMM and two DGEMM calls on a chunk of C that is
*     staged in WORK and then copied back.
*
*     INFO  =  0 : success.
*     INFO  = -i : the i-th argument is illegal (XERBLA is called).
*     LWORK = -1 : workspace query; only WORK(1) is set.
*     On a successful exit WORK(1) holds the recommended LWORK for
*     the general case and 1 for the quick-return/degenerate cases.
*
      IMPLICIT NONE
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            M, N, N1, N2, LDQ, LDC, LWORK, INFO
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   Q( LDQ, * ), C( LDC, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE
      parameter( one = 1.0d+0 )
*
*     .. Local Scalars ..
      LOGICAL            LEFT, LQUERY, NOTRAN
      INTEGER            I, LDWORK, LEN, LWKOPT, NB, NQ, NW
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           dgemm, dlacpy, dtrmm, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          dble, max, min
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      info = 0
      left = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
      lquery = ( lwork.EQ.-1 )
*
*     NQ is the order of Q;
*     NW is the minimum dimension of WORK (one column of length NQ
*     when SIDE = 'L', one row of length NQ when SIDE = 'R'; the
*     degenerate cases below do not use WORK as scratch space).
*
      IF( left ) THEN
         nq = m
      ELSE
         nq = n
      END IF
      nw = nq
      IF( n1.EQ.0 .OR. n2.EQ.0 ) nw = 1
      IF( .NOT.left .AND. .NOT.lsame( side, 'R' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'T' ) ) THEN
         info = -2
      ELSE IF( m.LT.0 ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( n1.LT.0 .OR. n1+n2.NE.nq ) THEN
         info = -5
      ELSE IF( n2.LT.0 ) THEN
         info = -6
      ELSE IF( ldq.LT.max( 1, nq ) ) THEN
         info = -8
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -10
      ELSE IF( lwork.LT.nw .AND. .NOT.lquery ) THEN
         info = -12
      END IF
*
*     The recommended workspace holds all of C.  It is clamped from
*     below by NW so that a workspace query never reports a size
*     (e.g. 0 when M*N = 0) that the LWORK test above would reject.
*     Whenever the blocked code below is reached M*N >= NQ = NW, so
*     the clamp does not alter the chunk size NB.
*
      IF( info.EQ.0 ) THEN
         lwkopt = max( nw, m*n )
         work( 1 ) = dble( lwkopt )
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DORM22', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.EQ.0 .OR. n.EQ.0 ) THEN
         work( 1 ) = one
         RETURN
      END IF
*
*     Degenerate cases (N1 = 0 or N2 = 0) are handled using DTRMM.
*     With one block empty, Q is applied as a single triangular
*     matrix, in place on C.
*
      IF( n1.EQ.0 ) THEN
         CALL dtrmm( side, 'Upper', trans, 'Non-Unit', m, n, one,
     $               q, ldq, c, ldc )
         work( 1 ) = one
         RETURN
      ELSE IF( n2.EQ.0 ) THEN
         CALL dtrmm( side, 'Lower', trans, 'Non-Unit', m, n, one,
     $               q, ldq, c, ldc )
         work( 1 ) = one
         RETURN
      END IF
*
*     Compute the largest chunk size available from the workspace.
*     NB counts columns of C (SIDE = 'L') or rows of C (SIDE = 'R')
*     processed per pass; each of them needs NQ entries of WORK.
*
      nb = max( 1, min( lwork, lwkopt ) / nq )
*
      IF( left ) THEN
         IF( notran ) THEN
            DO i = 1, n, nb
               len = min( nb, n-i+1 )
               ldwork = m
*
*              Multiply bottom part of C by Q12.
*
               CALL dlacpy( 'All', n1, len, c( n2+1, i ), ldc, work,
     $                      ldwork )
               CALL dtrmm( 'Left', 'Lower', 'No Transpose', 'Non-Unit',
     $                     n1, len, one, q( 1, n2+1 ), ldq, work,
     $                     ldwork )
*
*              Multiply top part of C by Q11.
*
               CALL dgemm( 'No Transpose', 'No Transpose', n1, len, n2,
     $                     one, q, ldq, c( 1, i ), ldc, one, work,
     $                     ldwork )
*
*              Multiply top part of C by Q21.
*
               CALL dlacpy( 'All', n2, len, c( 1, i ), ldc,
     $                      work( n1+1 ), ldwork )
               CALL dtrmm( 'Left', 'Upper', 'No Transpose', 'Non-Unit',
     $                     n2, len, one, q( n1+1, 1 ), ldq,
     $                     work( n1+1 ), ldwork )
*
*              Multiply bottom part of C by Q22.
*
               CALL dgemm( 'No Transpose', 'No Transpose', n2, len, n1,
     $                     one, q( n1+1, n2+1 ), ldq, c( n2+1, i ), ldc,
     $                     one, work( n1+1 ), ldwork )
*
*              Copy everything back.
*
               CALL dlacpy( 'All', m, len, work, ldwork, c( 1, i ),
     $                      ldc )
            END DO
         ELSE
            DO i = 1, n, nb
               len = min( nb, n-i+1 )
               ldwork = m
*
*              Multiply bottom part of C by Q21**T.
*
               CALL dlacpy( 'All', n2, len, c( n1+1, i ), ldc, work,
     $                      ldwork )
               CALL dtrmm( 'Left', 'Upper', 'Transpose', 'Non-Unit',
     $                     n2, len, one, q( n1+1, 1 ), ldq, work,
     $                     ldwork )
*
*              Multiply top part of C by Q11**T.
*
               CALL dgemm( 'Transpose', 'No Transpose', n2, len, n1,
     $                     one, q, ldq, c( 1, i ), ldc, one, work,
     $                     ldwork )
*
*              Multiply top part of C by Q12**T.
*
               CALL dlacpy( 'All', n1, len, c( 1, i ), ldc,
     $                      work( n2+1 ), ldwork )
               CALL dtrmm( 'Left', 'Lower', 'Transpose', 'Non-Unit',
     $                     n1, len, one, q( 1, n2+1 ), ldq,
     $                     work( n2+1 ), ldwork )
*
*              Multiply bottom part of C by Q22**T.
*
               CALL dgemm( 'Transpose', 'No Transpose', n1, len, n2,
     $                     one, q( n1+1, n2+1 ), ldq, c( n1+1, i ), ldc,
     $                     one, work( n2+1 ), ldwork )
*
*              Copy everything back.
*
               CALL dlacpy( 'All', m, len, work, ldwork, c( 1, i ),
     $                      ldc )
            END DO
         END IF
      ELSE
         IF( notran ) THEN
            DO i = 1, m, nb
               len = min( nb, m-i+1 )
*
*              WORK is a LEN-by-N panel here, so its leading dimension
*              follows the (possibly shorter) last chunk.
*
               ldwork = len
*
*              Multiply right part of C by Q21.
*
               CALL dlacpy( 'All', len, n2, c( i, n1+1 ), ldc, work,
     $                      ldwork )
               CALL dtrmm( 'Right', 'Upper', 'No Transpose', 'Non-Unit',
     $                     len, n2, one, q( n1+1, 1 ), ldq, work,
     $                     ldwork )
*
*              Multiply left part of C by Q11.
*
               CALL dgemm( 'No Transpose', 'No Transpose', len, n2, n1,
     $                     one, c( i, 1 ), ldc, q, ldq, one, work,
     $                     ldwork )
*
*              Multiply left part of C by Q12.
*
               CALL dlacpy( 'All', len, n1, c( i, 1 ), ldc,
     $                      work( 1 + n2*ldwork ), ldwork )
               CALL dtrmm( 'Right', 'Lower', 'No Transpose', 'Non-Unit',
     $                     len, n1, one, q( 1, n2+1 ), ldq,
     $                     work( 1 + n2*ldwork ), ldwork )
*
*              Multiply right part of C by Q22.
*
               CALL dgemm( 'No Transpose', 'No Transpose', len, n1, n2,
     $                     one, c( i, n1+1 ), ldc, q( n1+1, n2+1 ), ldq,
     $                     one, work( 1 + n2*ldwork ), ldwork )
*
*              Copy everything back.
*
               CALL dlacpy( 'All', len, n, work, ldwork, c( i, 1 ),
     $                      ldc )
            END DO
         ELSE
            DO i = 1, m, nb
               len = min( nb, m-i+1 )
               ldwork = len
*
*              Multiply right part of C by Q12**T.
*
               CALL dlacpy( 'All', len, n1, c( i, n2+1 ), ldc, work,
     $                      ldwork )
               CALL dtrmm( 'Right', 'Lower', 'Transpose', 'Non-Unit',
     $                     len, n1, one, q( 1, n2+1 ), ldq, work,
     $                     ldwork )
*
*              Multiply left part of C by Q11**T.
*
               CALL dgemm( 'No Transpose', 'Transpose', len, n1, n2,
     $                     one, c( i, 1 ), ldc, q, ldq, one, work,
     $                     ldwork )
*
*              Multiply left part of C by Q21**T.
*
               CALL dlacpy( 'All', len, n2, c( i, 1 ), ldc,
     $                      work( 1 + n1*ldwork ), ldwork )
               CALL dtrmm( 'Right', 'Upper', 'Transpose', 'Non-Unit',
     $                     len, n2, one, q( n1+1, 1 ), ldq,
     $                     work( 1 + n1*ldwork ), ldwork )
*
*              Multiply right part of C by Q22**T.
*
               CALL dgemm( 'No Transpose', 'Transpose', len, n2, n1,
     $                     one, c( i, n2+1 ), ldc, q( n1+1, n2+1 ), ldq,
     $                     one, work( 1 + n1*ldwork ), ldwork )
*
*              Copy everything back.
*
               CALL dlacpy( 'All', len, n, work, ldwork, c( i, 1 ),
     $                      ldc )
            END DO
         END IF
      END IF
*
*     WORK(1) was used as scratch space; restore the recommended LWORK.
*
      work( 1 ) = dble( lwkopt )
      RETURN
*
*     End of DORM22
*

◆ sorm22()

subroutine sorm22	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	n1,
		integer	n2,
		real, dimension( ldq, * )	q,
		integer	ldq,
		real, dimension( ldc, * )	c,
		integer	ldc,
		real, dimension( * )	work,
		integer	lwork,
		integer	info )

SORM22 multiplies a general matrix by a banded orthogonal matrix.

Download SORM22 + dependencies [TGZ] [ZIP] [TXT]

Purpose

!>
!>
!>  SORM22 overwrites the general real M-by-N matrix C with
!>
!>                  SIDE = 'L'     SIDE = 'R'
!>  TRANS = 'N':      Q * C          C * Q
!>  TRANS = 'T':      Q**T * C       C * Q**T
!>
!>  where Q is a real orthogonal matrix of order NQ, with NQ = M if
!>  SIDE = 'L' and NQ = N if SIDE = 'R'.
!>  The orthogonal matrix Q possesses a 2-by-2 block structure
!>
!>         [  Q11  Q12  ]
!>     Q = [            ]
!>         [  Q21  Q22  ],
!>
!>  where Q12 is an N1-by-N1 lower triangular matrix and Q21 is an
!>  N2-by-N2 upper triangular matrix.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**T from the Left; !> = 'R': apply Q or Q**T from the Right. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': apply Q (No transpose); !> = 'T': apply Q**T (Transpose). !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	N1
[in]	N2	!> N1 is INTEGER !> N2 is INTEGER !> The dimension of Q12 and Q21, respectively. N1, N2 >= 0. !> The following requirement must be satisfied: !> N1 + N2 = M if SIDE = 'L' and N1 + N2 = N if SIDE = 'R'. !>
[in]	Q	!> Q is REAL array, dimension !> (LDQ,M) if SIDE = 'L' !> (LDQ,N) if SIDE = 'R' !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. !> LDQ >= max(1,M) if SIDE = 'L'; LDQ >= max(1,N) if SIDE = 'R'. !>
[in,out]	C	!> C is REAL array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by Q*C or Q**T*C or C*Q**T or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is REAL array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If SIDE = 'L', LWORK >= max(1,M); !> if SIDE = 'R', LWORK >= max(1,N). !> If N1 = 0 or N2 = 0, LWORK >= 1 is sufficient. !> For optimum performance LWORK >= M*N. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 161 of file sorm22.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     SORM22 overwrites the M-by-N matrix C with Q*C, Q**T*C, C*Q or
*     C*Q**T, as selected by SIDE ('L'/'R') and TRANS ('N'/'T').
*     Q (order NQ = N1+N2) is used as a 2-by-2 block matrix whose
*     (1,2) block is N1-by-N1 lower triangular and whose (2,1) block
*     is N2-by-N2 upper triangular, so every product is assembled
*     from two STRMM and two SGEMM calls on a chunk of C that is
*     staged in WORK and then copied back.
*
*     INFO  =  0 : success.
*     INFO  = -i : the i-th argument is illegal (XERBLA is called).
*     LWORK = -1 : workspace query; only WORK(1) is set.
*     On a successful exit WORK(1) holds the recommended LWORK for
*     the general case and 1 for the quick-return/degenerate cases.
*
      IMPLICIT NONE
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            M, N, N1, N2, LDQ, LDC, LWORK, INFO
*     ..
*     .. Array Arguments ..
      REAL               Q( LDQ, * ), C( LDC, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE
      parameter( one = 1.0e+0 )
*
*     .. Local Scalars ..
      LOGICAL            LEFT, LQUERY, NOTRAN
      INTEGER            I, LDWORK, LEN, LWKOPT, NB, NQ, NW
      REAL               WKOPT
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           sgemm, slacpy, strmm, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          epsilon, int, max, min, real
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      info = 0
      left = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
      lquery = ( lwork.EQ.-1 )
*
*     NQ is the order of Q;
*     NW is the minimum dimension of WORK (one column of length NQ
*     when SIDE = 'L', one row of length NQ when SIDE = 'R'; the
*     degenerate cases below do not use WORK as scratch space).
*
      IF( left ) THEN
         nq = m
      ELSE
         nq = n
      END IF
      nw = nq
      IF( n1.EQ.0 .OR. n2.EQ.0 ) nw = 1
      IF( .NOT.left .AND. .NOT.lsame( side, 'R' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'T' ) ) THEN
         info = -2
      ELSE IF( m.LT.0 ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( n1.LT.0 .OR. n1+n2.NE.nq ) THEN
         info = -5
      ELSE IF( n2.LT.0 ) THEN
         info = -6
      ELSE IF( ldq.LT.max( 1, nq ) ) THEN
         info = -8
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -10
      ELSE IF( lwork.LT.nw .AND. .NOT.lquery ) THEN
         info = -12
      END IF
*
*     The recommended workspace holds all of C.  It is clamped from
*     below by NW so that a workspace query never reports a size
*     (e.g. 0 when M*N = 0) that the LWORK test above would reject.
*     Whenever the blocked code below is reached M*N >= NQ = NW, so
*     the clamp does not alter the chunk size NB.
*
      IF( info.EQ.0 ) THEN
         lwkopt = max( nw, m*n )
*
*        REAL cannot represent every INTEGER exactly.  If the
*        conversion rounded down, push the value up so that
*        INT( WORK( 1 ) ) is never smaller than LWKOPT.
*
         wkopt = real( lwkopt )
         IF( int( wkopt ).LT.lwkopt )
     $      wkopt = wkopt*( one + epsilon( one ) )
         work( 1 ) = wkopt
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SORM22', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.EQ.0 .OR. n.EQ.0 ) THEN
         work( 1 ) = one
         RETURN
      END IF
*
*     Degenerate cases (N1 = 0 or N2 = 0) are handled using STRMM.
*     With one block empty, Q is applied as a single triangular
*     matrix, in place on C.
*
      IF( n1.EQ.0 ) THEN
         CALL strmm( side, 'Upper', trans, 'Non-Unit', m, n, one,
     $               q, ldq, c, ldc )
         work( 1 ) = one
         RETURN
      ELSE IF( n2.EQ.0 ) THEN
         CALL strmm( side, 'Lower', trans, 'Non-Unit', m, n, one,
     $               q, ldq, c, ldc )
         work( 1 ) = one
         RETURN
      END IF
*
*     Compute the largest chunk size available from the workspace.
*     NB counts columns of C (SIDE = 'L') or rows of C (SIDE = 'R')
*     processed per pass; each of them needs NQ entries of WORK.
*
      nb = max( 1, min( lwork, lwkopt ) / nq )
*
      IF( left ) THEN
         IF( notran ) THEN
            DO i = 1, n, nb
               len = min( nb, n-i+1 )
               ldwork = m
*
*              Multiply bottom part of C by Q12.
*
               CALL slacpy( 'All', n1, len, c( n2+1, i ), ldc, work,
     $                      ldwork )
               CALL strmm( 'Left', 'Lower', 'No Transpose', 'Non-Unit',
     $                     n1, len, one, q( 1, n2+1 ), ldq, work,
     $                     ldwork )
*
*              Multiply top part of C by Q11.
*
               CALL sgemm( 'No Transpose', 'No Transpose', n1, len, n2,
     $                     one, q, ldq, c( 1, i ), ldc, one, work,
     $                     ldwork )
*
*              Multiply top part of C by Q21.
*
               CALL slacpy( 'All', n2, len, c( 1, i ), ldc,
     $                      work( n1+1 ), ldwork )
               CALL strmm( 'Left', 'Upper', 'No Transpose', 'Non-Unit',
     $                     n2, len, one, q( n1+1, 1 ), ldq,
     $                     work( n1+1 ), ldwork )
*
*              Multiply bottom part of C by Q22.
*
               CALL sgemm( 'No Transpose', 'No Transpose', n2, len, n1,
     $                     one, q( n1+1, n2+1 ), ldq, c( n2+1, i ), ldc,
     $                     one, work( n1+1 ), ldwork )
*
*              Copy everything back.
*
               CALL slacpy( 'All', m, len, work, ldwork, c( 1, i ),
     $                      ldc )
            END DO
         ELSE
            DO i = 1, n, nb
               len = min( nb, n-i+1 )
               ldwork = m
*
*              Multiply bottom part of C by Q21**T.
*
               CALL slacpy( 'All', n2, len, c( n1+1, i ), ldc, work,
     $                      ldwork )
               CALL strmm( 'Left', 'Upper', 'Transpose', 'Non-Unit',
     $                     n2, len, one, q( n1+1, 1 ), ldq, work,
     $                     ldwork )
*
*              Multiply top part of C by Q11**T.
*
               CALL sgemm( 'Transpose', 'No Transpose', n2, len, n1,
     $                     one, q, ldq, c( 1, i ), ldc, one, work,
     $                     ldwork )
*
*              Multiply top part of C by Q12**T.
*
               CALL slacpy( 'All', n1, len, c( 1, i ), ldc,
     $                      work( n2+1 ), ldwork )
               CALL strmm( 'Left', 'Lower', 'Transpose', 'Non-Unit',
     $                     n1, len, one, q( 1, n2+1 ), ldq,
     $                     work( n2+1 ), ldwork )
*
*              Multiply bottom part of C by Q22**T.
*
               CALL sgemm( 'Transpose', 'No Transpose', n1, len, n2,
     $                     one, q( n1+1, n2+1 ), ldq, c( n1+1, i ), ldc,
     $                     one, work( n2+1 ), ldwork )
*
*              Copy everything back.
*
               CALL slacpy( 'All', m, len, work, ldwork, c( 1, i ),
     $                      ldc )
            END DO
         END IF
      ELSE
         IF( notran ) THEN
            DO i = 1, m, nb
               len = min( nb, m-i+1 )
*
*              WORK is a LEN-by-N panel here, so its leading dimension
*              follows the (possibly shorter) last chunk.
*
               ldwork = len
*
*              Multiply right part of C by Q21.
*
               CALL slacpy( 'All', len, n2, c( i, n1+1 ), ldc, work,
     $                      ldwork )
               CALL strmm( 'Right', 'Upper', 'No Transpose', 'Non-Unit',
     $                     len, n2, one, q( n1+1, 1 ), ldq, work,
     $                     ldwork )
*
*              Multiply left part of C by Q11.
*
               CALL sgemm( 'No Transpose', 'No Transpose', len, n2, n1,
     $                     one, c( i, 1 ), ldc, q, ldq, one, work,
     $                     ldwork )
*
*              Multiply left part of C by Q12.
*
               CALL slacpy( 'All', len, n1, c( i, 1 ), ldc,
     $                      work( 1 + n2*ldwork ), ldwork )
               CALL strmm( 'Right', 'Lower', 'No Transpose', 'Non-Unit',
     $                     len, n1, one, q( 1, n2+1 ), ldq,
     $                     work( 1 + n2*ldwork ), ldwork )
*
*              Multiply right part of C by Q22.
*
               CALL sgemm( 'No Transpose', 'No Transpose', len, n1, n2,
     $                     one, c( i, n1+1 ), ldc, q( n1+1, n2+1 ), ldq,
     $                     one, work( 1 + n2*ldwork ), ldwork )
*
*              Copy everything back.
*
               CALL slacpy( 'All', len, n, work, ldwork, c( i, 1 ),
     $                      ldc )
            END DO
         ELSE
            DO i = 1, m, nb
               len = min( nb, m-i+1 )
               ldwork = len
*
*              Multiply right part of C by Q12**T.
*
               CALL slacpy( 'All', len, n1, c( i, n2+1 ), ldc, work,
     $                      ldwork )
               CALL strmm( 'Right', 'Lower', 'Transpose', 'Non-Unit',
     $                     len, n1, one, q( 1, n2+1 ), ldq, work,
     $                     ldwork )
*
*              Multiply left part of C by Q11**T.
*
               CALL sgemm( 'No Transpose', 'Transpose', len, n1, n2,
     $                     one, c( i, 1 ), ldc, q, ldq, one, work,
     $                     ldwork )
*
*              Multiply left part of C by Q21**T.
*
               CALL slacpy( 'All', len, n2, c( i, 1 ), ldc,
     $                      work( 1 + n1*ldwork ), ldwork )
               CALL strmm( 'Right', 'Upper', 'Transpose', 'Non-Unit',
     $                     len, n2, one, q( n1+1, 1 ), ldq,
     $                     work( 1 + n1*ldwork ), ldwork )
*
*              Multiply right part of C by Q22**T.
*
               CALL sgemm( 'No Transpose', 'Transpose', len, n2, n1,
     $                     one, c( i, n2+1 ), ldc, q( n1+1, n2+1 ), ldq,
     $                     one, work( 1 + n1*ldwork ), ldwork )
*
*              Copy everything back.
*
               CALL slacpy( 'All', len, n, work, ldwork, c( i, 1 ),
     $                      ldc )
            END DO
         END IF
      END IF
*
*     WORK(1) was used as scratch space; restore the recommended LWORK
*     (already rounded up for the REAL representation).
*
      work( 1 ) = wkopt
      RETURN
*
*     End of SORM22
*

◆ zunm22()

subroutine zunm22	(	character	side,
		character	trans,
		integer	m,
		integer	n,
		integer	n1,
		integer	n2,
		complex*16, dimension( ldq, * )	q,
		integer	ldq,
		complex*16, dimension( ldc, * )	c,
		integer	ldc,
		complex*16, dimension( * )	work,
		integer	lwork,
		integer	info )

ZUNM22 multiplies a general matrix by a banded unitary matrix.

Download ZUNM22 + dependencies [TGZ] [ZIP] [TXT]

Purpose

!>
!>  ZUNM22 overwrites the general complex M-by-N matrix C with
!>
!>                  SIDE = 'L'     SIDE = 'R'
!>  TRANS = 'N':      Q * C          C * Q
!>  TRANS = 'C':      Q**H * C       C * Q**H
!>
!>  where Q is a complex unitary matrix of order NQ, with NQ = M if
!>  SIDE = 'L' and NQ = N if SIDE = 'R'.
!>  The unitary matrix Q possesses a 2-by-2 block structure
!>
!>         [  Q11  Q12  ]
!>     Q = [            ]
!>         [  Q21  Q22  ],
!>
!>  where Q12 is an N1-by-N1 lower triangular matrix and Q21 is an
!>  N2-by-N2 upper triangular matrix.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply Q or Q**H from the Left; !> = 'R': apply Q or Q**H from the Right. !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': apply Q (No transpose); !> = 'C': apply Q**H (Conjugate transpose). !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. N >= 0. !>
[in]	N1
[in]	N2	!> N1 is INTEGER !> N2 is INTEGER !> The dimension of Q12 and Q21, respectively. N1, N2 >= 0. !> The following requirement must be satisfied: !> N1 + N2 = M if SIDE = 'L' and N1 + N2 = N if SIDE = 'R'. !>
[in]	Q	!> Q is COMPLEX*16 array, dimension !> (LDQ,M) if SIDE = 'L' !> (LDQ,N) if SIDE = 'R' !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. !> LDQ >= max(1,M) if SIDE = 'L'; LDQ >= max(1,N) if SIDE = 'R'. !>
[in,out]	C	!> C is COMPLEX*16 array, dimension (LDC,N) !> On entry, the M-by-N matrix C. !> On exit, C is overwritten by Q*C or Q**H*C or C*Q**H or C*Q. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is COMPLEX*16 array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. !> If SIDE = 'L', LWORK >= max(1,M); !> if SIDE = 'R', LWORK >= max(1,N). !> If N1 = 0 or N2 = 0, LWORK >= 1 is sufficient. !> For optimum performance LWORK >= M*N. !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 160 of file zunm22.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     ZUNM22 overwrites the M-by-N matrix C with Q*C, Q**H*C, C*Q or
*     C*Q**H, as selected by SIDE ('L'/'R') and TRANS ('N'/'C').
*     Q (order NQ = N1+N2) is used as a 2-by-2 block matrix whose
*     (1,2) block is N1-by-N1 lower triangular and whose (2,1) block
*     is N2-by-N2 upper triangular, so every product is assembled
*     from two ZTRMM and two ZGEMM calls on a chunk of C that is
*     staged in WORK and then copied back.
*
*     INFO  =  0 : success.
*     INFO  = -i : the i-th argument is illegal (XERBLA is called).
*     LWORK = -1 : workspace query; only WORK(1) is set.
*     On a successful exit WORK(1) holds the recommended LWORK for
*     the general case and 1 for the quick-return/degenerate cases.
*
      IMPLICIT NONE
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE, TRANS
      INTEGER            M, N, N1, N2, LDQ, LDC, LWORK, INFO
*     ..
*     .. Array Arguments ..
      COMPLEX*16         Q( LDQ, * ), C( LDC, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX*16         ONE
      parameter( one = ( 1.0d+0, 0.0d+0 ) )
*
*     .. Local Scalars ..
      LOGICAL            LEFT, LQUERY, NOTRAN
      INTEGER            I, LDWORK, LEN, LWKOPT, NB, NQ, NW
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           zgemm, zlacpy, ztrmm, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          dcmplx, max, min
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      info = 0
      left = lsame( side, 'L' )
      notran = lsame( trans, 'N' )
      lquery = ( lwork.EQ.-1 )
*
*     NQ is the order of Q;
*     NW is the minimum dimension of WORK (one column of length NQ
*     when SIDE = 'L', one row of length NQ when SIDE = 'R'; the
*     degenerate cases below do not use WORK as scratch space).
*
      IF( left ) THEN
         nq = m
      ELSE
         nq = n
      END IF
      nw = nq
      IF( n1.EQ.0 .OR. n2.EQ.0 ) nw = 1
      IF( .NOT.left .AND. .NOT.lsame( side, 'R' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'C' ) ) THEN
         info = -2
      ELSE IF( m.LT.0 ) THEN
         info = -3
      ELSE IF( n.LT.0 ) THEN
         info = -4
      ELSE IF( n1.LT.0 .OR. n1+n2.NE.nq ) THEN
         info = -5
      ELSE IF( n2.LT.0 ) THEN
         info = -6
      ELSE IF( ldq.LT.max( 1, nq ) ) THEN
         info = -8
      ELSE IF( ldc.LT.max( 1, m ) ) THEN
         info = -10
      ELSE IF( lwork.LT.nw .AND. .NOT.lquery ) THEN
         info = -12
      END IF
*
*     The recommended workspace holds all of C.  It is clamped from
*     below by NW so that a workspace query never reports a size
*     (e.g. 0 when M*N = 0) that the LWORK test above would reject.
*     Whenever the blocked code below is reached M*N >= NQ = NW, so
*     the clamp does not alter the chunk size NB.
*
      IF( info.EQ.0 ) THEN
         lwkopt = max( nw, m*n )
         work( 1 ) = dcmplx( lwkopt )
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'ZUNM22', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.EQ.0 .OR. n.EQ.0 ) THEN
         work( 1 ) = one
         RETURN
      END IF
*
*     Degenerate cases (N1 = 0 or N2 = 0) are handled using ZTRMM.
*     With one block empty, Q is applied as a single triangular
*     matrix, in place on C.
*
      IF( n1.EQ.0 ) THEN
         CALL ztrmm( side, 'Upper', trans, 'Non-Unit', m, n, one,
     $               q, ldq, c, ldc )
         work( 1 ) = one
         RETURN
      ELSE IF( n2.EQ.0 ) THEN
         CALL ztrmm( side, 'Lower', trans, 'Non-Unit', m, n, one,
     $               q, ldq, c, ldc )
         work( 1 ) = one
         RETURN
      END IF
*
*     Compute the largest chunk size available from the workspace.
*     NB counts columns of C (SIDE = 'L') or rows of C (SIDE = 'R')
*     processed per pass; each of them needs NQ entries of WORK.
*
      nb = max( 1, min( lwork, lwkopt ) / nq )
*
      IF( left ) THEN
         IF( notran ) THEN
            DO i = 1, n, nb
               len = min( nb, n-i+1 )
               ldwork = m
*
*              Multiply bottom part of C by Q12.
*
               CALL zlacpy( 'All', n1, len, c( n2+1, i ), ldc, work,
     $                      ldwork )
               CALL ztrmm( 'Left', 'Lower', 'No Transpose', 'Non-Unit',
     $                     n1, len, one, q( 1, n2+1 ), ldq, work,
     $                     ldwork )
*
*              Multiply top part of C by Q11.
*
               CALL zgemm( 'No Transpose', 'No Transpose', n1, len, n2,
     $                     one, q, ldq, c( 1, i ), ldc, one, work,
     $                     ldwork )
*
*              Multiply top part of C by Q21.
*
               CALL zlacpy( 'All', n2, len, c( 1, i ), ldc,
     $                      work( n1+1 ), ldwork )
               CALL ztrmm( 'Left', 'Upper', 'No Transpose', 'Non-Unit',
     $                     n2, len, one, q( n1+1, 1 ), ldq,
     $                     work( n1+1 ), ldwork )
*
*              Multiply bottom part of C by Q22.
*
               CALL zgemm( 'No Transpose', 'No Transpose', n2, len, n1,
     $                     one, q( n1+1, n2+1 ), ldq, c( n2+1, i ), ldc,
     $                     one, work( n1+1 ), ldwork )
*
*              Copy everything back.
*
               CALL zlacpy( 'All', m, len, work, ldwork, c( 1, i ),
     $                      ldc )
            END DO
         ELSE
            DO i = 1, n, nb
               len = min( nb, n-i+1 )
               ldwork = m
*
*              Multiply bottom part of C by Q21**H.
*
               CALL zlacpy( 'All', n2, len, c( n1+1, i ), ldc, work,
     $                      ldwork )
               CALL ztrmm( 'Left', 'Upper', 'Conjugate', 'Non-Unit',
     $                     n2, len, one, q( n1+1, 1 ), ldq, work,
     $                     ldwork )
*
*              Multiply top part of C by Q11**H.
*
               CALL zgemm( 'Conjugate', 'No Transpose', n2, len, n1,
     $                     one, q, ldq, c( 1, i ), ldc, one, work,
     $                     ldwork )
*
*              Multiply top part of C by Q12**H.
*
               CALL zlacpy( 'All', n1, len, c( 1, i ), ldc,
     $                      work( n2+1 ), ldwork )
               CALL ztrmm( 'Left', 'Lower', 'Conjugate', 'Non-Unit',
     $                     n1, len, one, q( 1, n2+1 ), ldq,
     $                     work( n2+1 ), ldwork )
*
*              Multiply bottom part of C by Q22**H.
*
               CALL zgemm( 'Conjugate', 'No Transpose', n1, len, n2,
     $                     one, q( n1+1, n2+1 ), ldq, c( n1+1, i ), ldc,
     $                     one, work( n2+1 ), ldwork )
*
*              Copy everything back.
*
               CALL zlacpy( 'All', m, len, work, ldwork, c( 1, i ),
     $                      ldc )
            END DO
         END IF
      ELSE
         IF( notran ) THEN
            DO i = 1, m, nb
               len = min( nb, m-i+1 )
*
*              WORK is a LEN-by-N panel here, so its leading dimension
*              follows the (possibly shorter) last chunk.
*
               ldwork = len
*
*              Multiply right part of C by Q21.
*
               CALL zlacpy( 'All', len, n2, c( i, n1+1 ), ldc, work,
     $                      ldwork )
               CALL ztrmm( 'Right', 'Upper', 'No Transpose', 'Non-Unit',
     $                     len, n2, one, q( n1+1, 1 ), ldq, work,
     $                     ldwork )
*
*              Multiply left part of C by Q11.
*
               CALL zgemm( 'No Transpose', 'No Transpose', len, n2, n1,
     $                     one, c( i, 1 ), ldc, q, ldq, one, work,
     $                     ldwork )
*
*              Multiply left part of C by Q12.
*
               CALL zlacpy( 'All', len, n1, c( i, 1 ), ldc,
     $                      work( 1 + n2*ldwork ), ldwork )
               CALL ztrmm( 'Right', 'Lower', 'No Transpose', 'Non-Unit',
     $                     len, n1, one, q( 1, n2+1 ), ldq,
     $                     work( 1 + n2*ldwork ), ldwork )
*
*              Multiply right part of C by Q22.
*
               CALL zgemm( 'No Transpose', 'No Transpose', len, n1, n2,
     $                     one, c( i, n1+1 ), ldc, q( n1+1, n2+1 ), ldq,
     $                     one, work( 1 + n2*ldwork ), ldwork )
*
*              Copy everything back.
*
               CALL zlacpy( 'All', len, n, work, ldwork, c( i, 1 ),
     $                      ldc )
            END DO
         ELSE
            DO i = 1, m, nb
               len = min( nb, m-i+1 )
               ldwork = len
*
*              Multiply right part of C by Q12**H.
*
               CALL zlacpy( 'All', len, n1, c( i, n2+1 ), ldc, work,
     $                      ldwork )
               CALL ztrmm( 'Right', 'Lower', 'Conjugate', 'Non-Unit',
     $                     len, n1, one, q( 1, n2+1 ), ldq, work,
     $                     ldwork )
*
*              Multiply left part of C by Q11**H.
*
               CALL zgemm( 'No Transpose', 'Conjugate', len, n1, n2,
     $                     one, c( i, 1 ), ldc, q, ldq, one, work,
     $                     ldwork )
*
*              Multiply left part of C by Q21**H.
*
               CALL zlacpy( 'All', len, n2, c( i, 1 ), ldc,
     $                      work( 1 + n1*ldwork ), ldwork )
               CALL ztrmm( 'Right', 'Upper', 'Conjugate', 'Non-Unit',
     $                     len, n2, one, q( n1+1, 1 ), ldq,
     $                     work( 1 + n1*ldwork ), ldwork )
*
*              Multiply right part of C by Q22**H.
*
               CALL zgemm( 'No Transpose', 'Conjugate', len, n2, n1,
     $                     one, c( i, n2+1 ), ldc, q( n1+1, n2+1 ), ldq,
     $                     one, work( 1 + n1*ldwork ), ldwork )
*
*              Copy everything back.
*
               CALL zlacpy( 'All', len, n, work, ldwork, c( i, 1 ),
     $                      ldc )
            END DO
         END IF
      END IF
*
*     WORK(1) was used as scratch space; restore the recommended LWORK.
*
      work( 1 ) = dcmplx( lwkopt )
      RETURN
*
*     End of ZUNM22
*

OpenRadioss 2025.1.11 OpenRadioss project