Functions
subroutine	cgetrf (m, n, a, lda, ipiv, info)
	CGETRF VARIANT: Crout Level 3 BLAS version of the algorithm.
subroutine	dgetrf (m, n, a, lda, ipiv, info)
	DGETRF VARIANT: Crout Level 3 BLAS version of the algorithm.
subroutine	sgetrf (m, n, a, lda, ipiv, info)
	SGETRF VARIANT: Crout Level 3 BLAS version of the algorithm.
subroutine	zgetrf (m, n, a, lda, ipiv, info)
	ZGETRF VARIANT: Crout Level 3 BLAS version of the algorithm.
subroutine	cgeqrf (m, n, a, lda, tau, work, lwork, info)
	CGEQRF VARIANT: left-looking Level 3 BLAS version of the algorithm.
subroutine	dgeqrf (m, n, a, lda, tau, work, lwork, info)
	DGEQRF VARIANT: left-looking Level 3 BLAS version of the algorithm.
subroutine	sgeqrf (m, n, a, lda, tau, work, lwork, info)
	SGEQRF VARIANT: left-looking Level 3 BLAS version of the algorithm.
subroutine	zgeqrf (m, n, a, lda, tau, work, lwork, info)
	ZGEQRF VARIANT: left-looking Level 3 BLAS version of the algorithm.

Detailed Description

This is the group of variant computational routines.

Function Documentation

◆ cgeqrf()

subroutine cgeqrf	(	integer	m,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		complex, dimension( * )	tau,
		complex, dimension( * )	work,
		integer	lwork,
		integer	info )

CGEQRF VARIANT: left-looking Level 3 BLAS version of the algorithm.

Purpose:

!>
!> CGEQRF computes a QR factorization of a complex M-by-N matrix A:
!> A = Q * R.
!>
!> This is the left-looking Level 3 BLAS version of the algorithm.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the M-by-N matrix A. !> On exit, the elements on and above the diagonal of the array !> contain the min(M,N)-by-N upper trapezoidal matrix R (R is !> upper triangular if m >= n); the elements below the diagonal, !> with the array TAU, represent the unitary matrix Q as a !> product of min(m,n) elementary reflectors (see Further !> Details). !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	TAU	!> TAU is COMPLEX array, dimension (min(M,N)) !> The scalar factors of the elementary reflectors (see Further !> Details). !>
[out]	WORK	!> WORK is COMPLEX array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> !> The dimension of the array WORK. The dimension can be divided into three parts. !> !> 1) The part for the triangular factor T. If the very last T is not bigger !> than any of the rest, then this part is NB x ceiling(K/NB), otherwise, !> NB x (K-NT), where K = min(M,N) and NT is the dimension of the very last T !> !> 2) The part for the very last T when T is bigger than any of the rest T. !> The size of this part is NT x NT, where NT = K - ceiling ((K-NX)/NB) x NB, !> where K = min(M,N), NX is calculated by !> NX = MAX( 0, ILAENV( 3, 'CGEQRF', ' ', M, N, -1, -1 ) ) !> !> 3) The part for clarfb is of size max((N-M)*K, (N-M)*NB, K*NB, NB*NB) !> !> So LWORK = part1 + part2 + part3 !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Further Details

!>
!>  The matrix Q is represented as a product of elementary reflectors
!>
!>     Q = H(1) H(2) . . . H(k), where k = min(m,n).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - tau * v * v**H
!>
!>  where tau is a complex scalar, and v is a complex vector with
!>  v(1:i-1) = 0 and v(i) = 1; v(i+1:m) is stored on exit in A(i+1:m,i),
!>  and tau in TAU(i).
!>
!>

Definition at line 150 of file cgeqrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of the left-looking blocked CGEQRF variant.  Columns are
*  processed in panels of width NB.  Before a panel is factored with
*  CGEQR2, the block reflectors of all earlier panels are applied to
*  it with CLARFB, using the triangular factors T that CLARFT stored
*  in WORK.
*
*  WORK layout, as used by the calls below:
*     WORK(1 : LBWORK*NB)        T factors of the regular panels; the
*                                T of the panel starting at column J
*                                begins at WORK(J), leading dim LBWORK
*     WORK(LBWORK*NB+1 : ...)    NT-by-NT last T factor (only written
*                                when NT > NB), leading dim NT
*     WORK(LBWORK*NB+NT*NT+1 : ) scratch space handed to CGEQR2/CLARFB
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      LOGICAL            LQUERY
      INTEGER            I, IB, IINFO, IWS, J, K, LWKOPT, NB,
     $                   NBMIN, NX, LBWORK, NT, LLWORK
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgeqr2, clarfb, clarft, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      REAL               SCEIL
      EXTERNAL           ilaenv, sceil
*     ..
*     .. Executable Statements ..
 
*
*     Initial values.  K is the number of elementary reflectors and
*     NB is the block size returned by ILAENV (ISPEC = 1).
*
      info = 0
      nbmin = 2
      nx = 0
      iws = n
      k = min( m, n )
      nb = ilaenv( 1, 'CGEQRF', ' ', m, n, -1, -1 )
 
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
*
*        Determine when to cross over from blocked to unblocked code.
*
         nx = max( 0, ilaenv( 3, 'CGEQRF', ' ', m, n, -1, -1 ) )
      END IF
*
*     Get NT, the size of the very last T: the number of columns left
*     over between the end of the last full NB-wide block that covers
*     K-NX and column K, e.g.:
*
*            NB=3     2NB=6       K=10
*            |        |           |
*      1--2--3--4--5--6--7--8--9--10
*                  |     \________/
*               K-NX=5      NT=4
*
*     So here 4 x 4 is the last T stored in the workspace
*
*     SCEIL is declared REAL; the result is truncated on assignment
*     to the INTEGER NT (SCEIL presumably returns the ceiling of its
*     argument -- confirm against its definition).
*
      nt = k-sceil(real(k-nx)/real(nb))*nb
 
*
*     optimal workspace = space for CLARFB + space for normal T's + space for the last T
*
*     LLWORK is first the CLARFB scratch size in elements, then it is
*     converted to a count of NB-sized chunks so that the totals below
*     can be formed as multiples of NB.
*
      llwork = max(max((n-m)*k, (n-m)*nb), max(k*nb, nb*nb))
      llwork = sceil(real(llwork)/real(nb))
 
      IF ( nt.GT.nb ) THEN
 
*
*         The last T is larger than a regular one: the regular T's
*         cover K-NT columns and NT*NT extra elements are added for
*         the last T.
*
          lbwork = k-nt
*
*         WORK(1) is set before the arguments are tested so that a
*         workspace query can return right after the tests.
*
          lwkopt = (lbwork+llwork)*nb
          work( 1 ) = (lwkopt+nt*nt)
 
      ELSE
 
*
*         The last T fits in a regular NB-wide slot: LBWORK is K
*         rounded up to a multiple of NB.
*
          lbwork = sceil(real(k)/real(nb))*nb
          lwkopt = (lbwork+llwork-nb)*nb
          work( 1 ) = lwkopt
 
      END IF
 
*
*     Test the input arguments
*
*     LWORK = -1 requests a workspace query; otherwise LWORK must be
*     at least max(1,N).
*
      lquery = ( lwork.EQ.-1 )
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -4
      ELSE IF( lwork.LT.max( 1, n ) .AND. .NOT.lquery ) THEN
         info = -7
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CGEQRF', -info )
         RETURN
      ELSE IF( lquery ) THEN
*
*        Workspace query: WORK(1) already holds the size computed above.
*
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( k.EQ.0 ) THEN
         work( 1 ) = 1
         RETURN
      END IF
*
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
 
         IF( nx.LT.k ) THEN
*
*           Determine if workspace is large enough for blocked code.
*
            IF ( nt.LE.nb ) THEN
                iws = (lbwork+llwork-nb)*nb
            ELSE
                iws = (lbwork+llwork)*nb+nt*nt
            END IF
 
            IF( lwork.LT.iws ) THEN
*
*              Not enough workspace to use optimal NB:  reduce NB and
*              determine the minimum value of NB.
*
*              NOTE(review): LBWORK, LLWORK and NT were computed from
*              the original NB and are not recomputed after NB is
*              reduced here -- confirm this is intended.
*
               IF ( nt.LE.nb ) THEN
                    nb = lwork / (llwork+(lbwork-nb))
               ELSE
                    nb = (lwork-nt*nt)/(lbwork+llwork)
               END IF
 
               nbmin = max( 2, ilaenv( 2, 'CGEQRF', ' ', m, n, -1,
     $                 -1 ) )
            END IF
         END IF
      END IF
*
      IF( nb.GE.nbmin .AND. nb.LT.k .AND. nx.LT.k ) THEN
*
*        Use blocked code initially
*
*        On exit from loop 10, I is the first column that the blocked
*        code did not factor; the unblocked code below starts there.
*
         DO 10 i = 1, k - nx, nb
            ib = min( k-i+1, nb )
*
*           Update the current column using old T's
*
            DO 20 j = 1, i - nb, nb
*
*              Apply H' to A(J:M,I:I+IB-1) from the left
*
*              NOTE(review): CLARFB documents TRANS as 'N' or 'C';
*              'Transpose' is passed here -- confirm it is treated
*              as the conjugate transpose.
*
               CALL clarfb( 'Left', 'Transpose', 'Forward',
     $                      'Columnwise', m-j+1, ib, nb,
     $                      a( j, j ), lda, work(j), lbwork,
     $                      a( j, i ), lda, work(lbwork*nb+nt*nt+1),
     $                      ib)
 
20          CONTINUE
*
*           Compute the QR factorization of the current block
*           A(I:M,I:I+IB-1)
*
            CALL cgeqr2( m-i+1, ib, a( i, i ), lda, tau( i ),
     $                        work(lbwork*nb+nt*nt+1), iinfo )
 
            IF( i+ib.LE.n ) THEN
*
*              Form the triangular factor of the block reflector
*              H = H(i) H(i+1) . . . H(i+ib-1)
*
*              T is stored at WORK(I) with leading dimension LBWORK
*              so that later panels can reuse it in loop 20.
*
               CALL clarft( 'Forward', 'Columnwise', m-i+1, ib,
     $                      a( i, i ), lda, tau( i ),
     $                      work(i), lbwork )
*
            END IF
   10    CONTINUE
      ELSE
*
*        Blocked code not used: the unblocked code starts at column 1.
*
         i = 1
      END IF
*
*     Use unblocked code to factor the last or only block.
*
      IF( i.LE.k ) THEN
 
         IF ( i .NE. 1 )   THEN
 
*
*            Blocked code ran: first bring columns I:K up to date
*            with the stored block reflectors, then factor them.
*
             DO 30 j = 1, i - nb, nb
*
*                Apply H' to A(J:M,I:K) from the left
*
                 CALL clarfb( 'Left', 'Transpose', 'Forward',
     $                       'Columnwise', m-j+1, k-i+1, nb,
     $                       a( j, j ), lda, work(j), lbwork,
     $                       a( j, i ), lda, work(lbwork*nb+nt*nt+1),
     $                       k-i+1)
30           CONTINUE
 
             CALL cgeqr2( m-i+1, k-i+1, a( i, i ), lda, tau( i ),
     $                   work(lbwork*nb+nt*nt+1),iinfo )
 
         ELSE
*
*        Use unblocked code to factor the last or only block.
*        Here I = 1, so the whole matrix is factored and WORK is
*        passed from its first element.
*
         CALL cgeqr2( m-i+1, n-i+1, a( i, i ), lda, tau( i ),
     $               work,iinfo )
 
         END IF
      END IF
 
 
*
*     Apply update to the column M+1:N when N > M
*
*     Only done when the blocked code ran (I /= 1); in the fully
*     unblocked case CGEQR2 above was called on all N columns.
*
      IF ( m.LT.n .AND. i.NE.1) THEN
*
*         Form the last triangular factor of the block reflector
*         H = H(i) H(i+1) . . . H(i+ib-1)
*
*         The last T goes into the regular T area when NT <= NB and
*         into the separate NT-by-NT area otherwise.
*
          IF ( nt .LE. nb ) THEN
               CALL clarft( 'Forward', 'Columnwise', m-i+1, k-i+1,
     $                     a( i, i ), lda, tau( i ), work(i), lbwork )
          ELSE
               CALL clarft( 'Forward', 'Columnwise', m-i+1, k-i+1,
     $                     a( i, i ), lda, tau( i ),
     $                     work(lbwork*nb+1), nt )
          END IF
 
*
*         Apply H' to A(1:M,M+1:N) from the left
*
*         Loop 40 applies the regular block reflectors; on exit J is
*         the first column past the loop range and is used by the
*         final CLARFB call that applies the last block reflector.
*
          DO 40 j = 1, k-nx, nb
 
               ib = min( k-j+1, nb )
 
               CALL clarfb( 'Left', 'Transpose', 'Forward',
     $                     'Columnwise', m-j+1, n-m, ib,
     $                     a( j, j ), lda, work(j), lbwork,
     $                     a( j, m+1 ), lda, work(lbwork*nb+nt*nt+1),
     $                     n-m)
 
40       CONTINUE
 
         IF ( nt.LE.nb ) THEN
             CALL clarfb( 'Left', 'Transpose', 'Forward',
     $                   'Columnwise', m-j+1, n-m, k-j+1,
     $                   a( j, j ), lda, work(j), lbwork,
     $                   a( j, m+1 ), lda, work(lbwork*nb+nt*nt+1),
     $                   n-m)
         ELSE
             CALL clarfb( 'Left', 'Transpose', 'Forward',
     $                   'Columnwise', m-j+1, n-m, k-j+1,
     $                   a( j, j ), lda,
     $                   work(lbwork*nb+1),
     $                   nt, a( j, m+1 ), lda, work(lbwork*nb+nt*nt+1),
     $                   n-m)
         END IF
 
      END IF
 
*
*     Report the workspace size computed for the path taken
*     (IWS = N unless the blocked-code size was computed above).
*
      work( 1 ) = iws
      RETURN
*
*     End of CGEQRF
*

◆ cgetrf()

subroutine cgetrf	(	integer	m,
		integer	n,
		complex, dimension( lda, * )	a,
		integer	lda,
		integer, dimension( * )	ipiv,
		integer	info )

CGETRF VARIANT: Crout Level 3 BLAS version of the algorithm.

CGETRF VARIANT: iterative version of Sivan Toledo's recursive LU algorithm

CGETRF VARIANT: left-looking Level 3 BLAS version of the algorithm.

Purpose:

!>
!> CGETRF computes an LU factorization of a general M-by-N matrix A
!> using partial pivoting with row interchanges.
!>
!> The factorization has the form
!>    A = P * L * U
!> where P is a permutation matrix, L is lower triangular with unit
!> diagonal elements (lower trapezoidal if m > n), and U is upper
!> triangular (upper trapezoidal if m < n).
!>
!> This is the Crout Level 3 BLAS version of the algorithm.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the M-by-N matrix to be factored. !> On exit, the factors L and U from the factorization !> A = P*L*U; the unit diagonal elements of L are not stored. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (min(M,N)) !> The pivot indices; for 1 <= i <= min(M,N), row i of the !> matrix was interchanged with row IPIV(i). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, U(i,i) is exactly zero. The factorization !> has been completed, but the factor U is exactly !> singular, and division by zero will occur if it is used !> to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Purpose:

!>
!> CGETRF computes an LU factorization of a general M-by-N matrix A
!> using partial pivoting with row interchanges.
!>
!> The factorization has the form
!>    A = P * L * U
!> where P is a permutation matrix, L is lower triangular with unit
!> diagonal elements (lower trapezoidal if m > n), and U is upper
!> triangular (upper trapezoidal if m < n).
!>
!> This is the left-looking Level 3 BLAS version of the algorithm.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the M-by-N matrix to be factored. !> On exit, the factors L and U from the factorization !> A = P*L*U; the unit diagonal elements of L are not stored. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (min(M,N)) !> The pivot indices; for 1 <= i <= min(M,N), row i of the !> matrix was interchanged with row IPIV(i). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, U(i,i) is exactly zero. The factorization !> has been completed, but the factor U is exactly !> singular, and division by zero will occur if it is used !> to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Purpose:

!>
!> CGETRF computes an LU factorization of a general M-by-N matrix A
!> using partial pivoting with row interchanges.
!>
!> The factorization has the form
!>    A = P * L * U
!> where P is a permutation matrix, L is lower triangular with unit
!> diagonal elements (lower trapezoidal if m > n), and U is upper
!> triangular (upper trapezoidal if m < n).
!>
!> This code implements an iterative version of Sivan Toledo's recursive
!> LU algorithm[1].  For square matrices, this iterative version should
!> be within a factor of two of the optimum number of memory transfers.
!>
!> The pattern is as follows, with the large blocks of U being updated
!> in one call to CTRSM, and the dotted lines denoting sections that
!> have had all pending permutations applied:
!>
!>  1 2 3 4 5 6 7 8
!> +-+-+---+-------+------
!> | |1|   |       |
!> |.+-+ 2 |       |
!> | | |   |       |
!> |.|.+-+-+   4   |
!> | | | |1|       |
!> | | |.+-+       |
!> | | | | |       |
!> |.|.|.|.+-+-+---+  8
!> | | | | | |1|   |
!> | | | | |.+-+ 2 |
!> | | | | | | |   |
!> | | | | |.|.+-+-+
!> | | | | | | | |1|
!> | | | | | | |.+-+
!> | | | | | | | | |
!> |.|.|.|.|.|.|.|.+-----
!> | | | | | | | | |
!>
!> The 1-2-1-4-1-2-1-8-... pattern is the position of the last 1 bit in
!> the binary expansion of the current column.  Each Schur update is
!> applied as soon as the necessary portion of U is available.
!>
!> [1] Toledo, S. 1997. Locality of Reference in LU Decomposition with
!> Partial Pivoting. SIAM J. Matrix Anal. Appl. 18, 4 (Oct. 1997),
!> 1065-1081. http://dx.doi.org/10.1137/S0895479896297744
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX array, dimension (LDA,N) !> On entry, the M-by-N matrix to be factored. !> On exit, the factors L and U from the factorization !> A = P*L*U; the unit diagonal elements of L are not stored. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (min(M,N)) !> The pivot indices; for 1 <= i <= min(M,N), row i of the !> matrix was interchanged with row IPIV(i). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, U(i,i) is exactly zero. The factorization !> has been completed, but the factor U is exactly !> singular, and division by zero will occur if it is used !> to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Definition at line 101 of file cgetrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of the blocked CGETRF variant listed here.  For each panel of
*  JB columns starting at column J it: updates the panel with the
*  already factored columns (CGEMM), factors it with CGETF2, applies
*  the resulting row interchanges to the columns on both sides
*  (CLASWP), and then computes the matching block row of U (CGEMM
*  followed by CTRSM).
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, M, N
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      COMPLEX            A( LDA, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            ONE
      parameter( one = ( 1.0e+0, 0.0e+0 ) )
*     ..
*     .. Local Scalars ..
      INTEGER            I, IINFO, J, JB, NB
*     ..
*     .. External Subroutines ..
      EXTERNAL           cgemm, cgetf2, claswp, ctrsm, xerbla
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
*     INFO = -1, -2 or -4 flags an illegal M, N or LDA respectively.
*
      info = 0
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -4
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CGETRF', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.EQ.0 .OR. n.EQ.0 )
     $   RETURN
*
*     Determine the block size for this environment.
*
      nb = ilaenv( 1, 'CGETRF', ' ', m, n, -1, -1 )
      IF( nb.LE.1 .OR. nb.GE.min( m, n ) ) THEN
*
*        Use unblocked code.
*
         CALL cgetf2( m, n, a, lda, ipiv, info )
      ELSE
*
*        Use blocked code.
*
*        JB is the width of the current panel (NB, or fewer columns
*        for the last panel).
*
         DO 20 j = 1, min( m, n ), nb
            jb = min( min( m, n )-j+1, nb )
*
*           Update current block.
*
*           A(J:M,J:J+JB-1) = A(J:M,J:J+JB-1)
*                             - A(J:M,1:J-1) * A(1:J-1,J:J+JB-1)
*
            CALL cgemm( 'No transpose', 'No transpose',
     $                 m-j+1, jb, j-1, -one,
     $                 a( j, 1 ), lda, a( 1, j ), lda, one,
     $                 a( j, j ), lda )
 
*
*           Factor diagonal and subdiagonal blocks and test for exact
*           singularity.
*
            CALL cgetf2( m-j+1, jb, a( j, j ), lda, ipiv( j ), iinfo )
*
*           Adjust INFO and the pivot indices.
*
*           IINFO and the pivots returned by CGETF2 are relative to
*           row J of A; adding J-1 makes them indices into the full
*           matrix.  Only the first nonzero IINFO is recorded.
*
            IF( info.EQ.0 .AND. iinfo.GT.0 )
     $         info = iinfo + j - 1
            DO 10 i = j, min( m, j+jb-1 )
               ipiv( i ) = j - 1 + ipiv( i )
   10       CONTINUE
*
*           Apply interchanges to column 1:J-1
*
            CALL claswp( j-1, a, lda, j, j+jb-1, ipiv, 1 )
*
            IF ( j+jb.LE.n ) THEN
*
*              Apply interchanges to column J+JB:N
*
               CALL claswp( n-j-jb+1, a( 1, j+jb ), lda, j, j+jb-1,
     $                     ipiv, 1 )
*
*              Update the block row to the right of the panel:
*              A(J:J+JB-1,J+JB:N) = A(J:J+JB-1,J+JB:N)
*                                   - A(J:J+JB-1,1:J-1) * A(1:J-1,J+JB:N)
*
               CALL cgemm( 'No transpose', 'No transpose',
     $                    jb, n-j-jb+1, j-1, -one,
     $                    a( j, 1 ), lda, a( 1, j+jb ), lda, one,
     $                    a( j, j+jb ), lda )
*
*              Compute block row of U.
*
*              Triangular solve with the unit lower triangular
*              diagonal block A(J:J+JB-1,J:J+JB-1).
*
               CALL ctrsm( 'Left', 'Lower', 'No transpose', 'Unit',
     $                    jb, n-j-jb+1, one, a( j, j ), lda,
     $                    a( j, j+jb ), lda )
            END IF
 
   20    CONTINUE
 
      END IF
      RETURN
*
*     End of CGETRF
*

◆ dgeqrf()

subroutine dgeqrf	(	integer	m,
		integer	n,
		double precision, dimension( lda, * )	a,
		integer	lda,
		double precision, dimension( * )	tau,
		double precision, dimension( * )	work,
		integer	lwork,
		integer	info )

DGEQRF VARIANT: left-looking Level 3 BLAS version of the algorithm.

Purpose:

!>
!> DGEQRF computes a QR factorization of a real M-by-N matrix A:
!> A = Q * R.
!>
!> This is the left-looking Level 3 BLAS version of the algorithm.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> On entry, the M-by-N matrix A. !> On exit, the elements on and above the diagonal of the array !> contain the min(M,N)-by-N upper trapezoidal matrix R (R is !> upper triangular if m >= n); the elements below the diagonal, !> with the array TAU, represent the orthogonal matrix Q as a !> product of min(m,n) elementary reflectors (see Further !> Details). !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	TAU	!> TAU is DOUBLE PRECISION array, dimension (min(M,N)) !> The scalar factors of the elementary reflectors (see Further !> Details). !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> !> The dimension of the array WORK. The dimension can be divided into three parts. !> !> 1) The part for the triangular factor T. If the very last T is not bigger !> than any of the rest, then this part is NB x ceiling(K/NB), otherwise, !> NB x (K-NT), where K = min(M,N) and NT is the dimension of the very last T !> !> 2) The part for the very last T when T is bigger than any of the rest T. !> The size of this part is NT x NT, where NT = K - ceiling ((K-NX)/NB) x NB, !> where K = min(M,N), NX is calculated by !> NX = MAX( 0, ILAENV( 3, 'DGEQRF', ' ', M, N, -1, -1 ) ) !> !> 3) The part for dlarfb is of size max((N-M)*K, (N-M)*NB, K*NB, NB*NB) !> !> So LWORK = part1 + part2 + part3 !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Further Details

!>
!>  The matrix Q is represented as a product of elementary reflectors
!>
!>     Q = H(1) H(2) . . . H(k), where k = min(m,n).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - tau * v * v'
!>
!>  where tau is a real scalar, and v is a real vector with
!>  v(1:i-1) = 0 and v(i) = 1; v(i+1:m) is stored on exit in A(i+1:m,i),
!>  and tau in TAU(i).
!>
!>

Definition at line 150 of file dgeqrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of the left-looking blocked DGEQRF variant.  Columns are
*  processed in panels of width NB.  Before a panel is factored with
*  DGEQR2, the block reflectors of all earlier panels are applied to
*  it with DLARFB, using the triangular factors T that DLARFT stored
*  in WORK.
*
*  WORK layout, as used by the calls below:
*     WORK(1 : LBWORK*NB)        T factors of the regular panels; the
*                                T of the panel starting at column J
*                                begins at WORK(J), leading dim LBWORK
*     WORK(LBWORK*NB+1 : ...)    NT-by-NT last T factor (only written
*                                when NT > NB), leading dim NT
*     WORK(LBWORK*NB+NT*NT+1 : ) scratch space handed to DGEQR2/DLARFB
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, LWORK, M, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      LOGICAL            LQUERY
      INTEGER            I, IB, IINFO, IWS, J, K, LWKOPT, NB,
     $                   NBMIN, NX, LBWORK, NT, LLWORK
*     ..
*     .. External Subroutines ..
      EXTERNAL           dgeqr2, dlarfb, dlarft, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      REAL               SCEIL
      EXTERNAL           ilaenv, sceil
*     ..
*     .. Executable Statements ..
 
*
*     Initial values.  K is the number of elementary reflectors and
*     NB is the block size returned by ILAENV (ISPEC = 1).
*
      info = 0
      nbmin = 2
      nx = 0
      iws = n
      k = min( m, n )
      nb = ilaenv( 1, 'DGEQRF', ' ', m, n, -1, -1 )
 
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
*
*        Determine when to cross over from blocked to unblocked code.
*
         nx = max( 0, ilaenv( 3, 'DGEQRF', ' ', m, n, -1, -1 ) )
      END IF
*
*     Get NT, the size of the very last T: the number of columns left
*     over between the end of the last full NB-wide block that covers
*     K-NX and column K, e.g.:
*
*            NB=3     2NB=6       K=10
*            |        |           |
*      1--2--3--4--5--6--7--8--9--10
*                  |     \________/
*               K-NX=5      NT=4
*
*     So here 4 x 4 is the last T stored in the workspace
*
*     SCEIL is declared REAL; the result is truncated on assignment
*     to the INTEGER NT (SCEIL presumably returns the ceiling of its
*     argument -- confirm against its definition).
*
      nt = k-sceil(real(k-nx)/real(nb))*nb
 
*
*     optimal workspace = space for dlarfb + space for normal T's + space for the last T
*
*     LLWORK is first the DLARFB scratch size in elements, then it is
*     converted to a count of NB-sized chunks so that the totals below
*     can be formed as multiples of NB.
*
      llwork = max(max((n-m)*k, (n-m)*nb), max(k*nb, nb*nb))
      llwork = sceil(real(llwork)/real(nb))
 
      IF ( nt.GT.nb ) THEN
 
*
*         The last T is larger than a regular one: the regular T's
*         cover K-NT columns and NT*NT extra elements are added for
*         the last T.
*
          lbwork = k-nt
*
*         WORK(1) is set before the arguments are tested so that a
*         workspace query can return right after the tests.
*
          lwkopt = (lbwork+llwork)*nb
          work( 1 ) = (lwkopt+nt*nt)
 
      ELSE
 
*
*         The last T fits in a regular NB-wide slot: LBWORK is K
*         rounded up to a multiple of NB.
*
          lbwork = sceil(real(k)/real(nb))*nb
          lwkopt = (lbwork+llwork-nb)*nb
          work( 1 ) = lwkopt
 
      END IF
 
*
*     Test the input arguments
*
*     LWORK = -1 requests a workspace query; otherwise LWORK must be
*     at least max(1,N).
*
      lquery = ( lwork.EQ.-1 )
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -4
      ELSE IF( lwork.LT.max( 1, n ) .AND. .NOT.lquery ) THEN
         info = -7
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DGEQRF', -info )
         RETURN
      ELSE IF( lquery ) THEN
*
*        Workspace query: WORK(1) already holds the size computed above.
*
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( k.EQ.0 ) THEN
         work( 1 ) = 1
         RETURN
      END IF
*
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
 
         IF( nx.LT.k ) THEN
*
*           Determine if workspace is large enough for blocked code.
*
            IF ( nt.LE.nb ) THEN
                iws = (lbwork+llwork-nb)*nb
            ELSE
                iws = (lbwork+llwork)*nb+nt*nt
            END IF
 
            IF( lwork.LT.iws ) THEN
*
*              Not enough workspace to use optimal NB:  reduce NB and
*              determine the minimum value of NB.
*
*              NOTE(review): LBWORK, LLWORK and NT were computed from
*              the original NB and are not recomputed after NB is
*              reduced here -- confirm this is intended.
*
               IF ( nt.LE.nb ) THEN
                    nb = lwork / (llwork+(lbwork-nb))
               ELSE
                    nb = (lwork-nt*nt)/(lbwork+llwork)
               END IF
 
               nbmin = max( 2, ilaenv( 2, 'DGEQRF', ' ', m, n, -1,
     $                 -1 ) )
            END IF
         END IF
      END IF
*
      IF( nb.GE.nbmin .AND. nb.LT.k .AND. nx.LT.k ) THEN
*
*        Use blocked code initially
*
*        On exit from loop 10, I is the first column that the blocked
*        code did not factor; the unblocked code below starts there.
*
         DO 10 i = 1, k - nx, nb
            ib = min( k-i+1, nb )
*
*           Update the current column using old T's
*
            DO 20 j = 1, i - nb, nb
*
*              Apply H' to A(J:M,I:I+IB-1) from the left
*
               CALL dlarfb( 'Left', 'Transpose', 'Forward',
     $                      'Columnwise', m-j+1, ib, nb,
     $                      a( j, j ), lda, work(j), lbwork,
     $                      a( j, i ), lda, work(lbwork*nb+nt*nt+1),
     $                      ib)
 
20          CONTINUE
*
*           Compute the QR factorization of the current block
*           A(I:M,I:I+IB-1)
*
            CALL dgeqr2( m-i+1, ib, a( i, i ), lda, tau( i ),
     $                        work(lbwork*nb+nt*nt+1), iinfo )
 
            IF( i+ib.LE.n ) THEN
*
*              Form the triangular factor of the block reflector
*              H = H(i) H(i+1) . . . H(i+ib-1)
*
*              T is stored at WORK(I) with leading dimension LBWORK
*              so that later panels can reuse it in loop 20.
*
               CALL dlarft( 'Forward', 'Columnwise', m-i+1, ib,
     $                      a( i, i ), lda, tau( i ),
     $                      work(i), lbwork )
*
            END IF
   10    CONTINUE
      ELSE
*
*        Blocked code not used: the unblocked code starts at column 1.
*
         i = 1
      END IF
*
*     Use unblocked code to factor the last or only block.
*
      IF( i.LE.k ) THEN
 
         IF ( i .NE. 1 )   THEN
 
*
*            Blocked code ran: first bring columns I:K up to date
*            with the stored block reflectors, then factor them.
*
             DO 30 j = 1, i - nb, nb
*
*                Apply H' to A(J:M,I:K) from the left
*
                 CALL dlarfb( 'Left', 'Transpose', 'Forward',
     $                       'Columnwise', m-j+1, k-i+1, nb,
     $                       a( j, j ), lda, work(j), lbwork,
     $                       a( j, i ), lda, work(lbwork*nb+nt*nt+1),
     $                       k-i+1)
30           CONTINUE
 
             CALL dgeqr2( m-i+1, k-i+1, a( i, i ), lda, tau( i ),
     $                   work(lbwork*nb+nt*nt+1),iinfo )
 
         ELSE
*
*        Use unblocked code to factor the last or only block.
*        Here I = 1, so the whole matrix is factored and WORK is
*        passed from its first element.
*
         CALL dgeqr2( m-i+1, n-i+1, a( i, i ), lda, tau( i ),
     $               work,iinfo )
 
         END IF
      END IF
 
 
*
*     Apply update to the column M+1:N when N > M
*
*     Only done when the blocked code ran (I /= 1); in the fully
*     unblocked case DGEQR2 above was called on all N columns.
*
      IF ( m.LT.n .AND. i.NE.1) THEN
*
*         Form the last triangular factor of the block reflector
*         H = H(i) H(i+1) . . . H(i+ib-1)
*
*         The last T goes into the regular T area when NT <= NB and
*         into the separate NT-by-NT area otherwise.
*
          IF ( nt .LE. nb ) THEN
               CALL dlarft( 'Forward', 'Columnwise', m-i+1, k-i+1,
     $                     a( i, i ), lda, tau( i ), work(i), lbwork )
          ELSE
               CALL dlarft( 'Forward', 'Columnwise', m-i+1, k-i+1,
     $                     a( i, i ), lda, tau( i ),
     $                     work(lbwork*nb+1), nt )
          END IF
 
*
*         Apply H' to A(1:M,M+1:N) from the left
*
*         Loop 40 applies the regular block reflectors; on exit J is
*         the first column past the loop range and is used by the
*         final DLARFB call that applies the last block reflector.
*
          DO 40 j = 1, k-nx, nb
 
               ib = min( k-j+1, nb )
 
               CALL dlarfb( 'Left', 'Transpose', 'Forward',
     $                     'Columnwise', m-j+1, n-m, ib,
     $                     a( j, j ), lda, work(j), lbwork,
     $                     a( j, m+1 ), lda, work(lbwork*nb+nt*nt+1),
     $                     n-m)
 
40       CONTINUE
 
         IF ( nt.LE.nb ) THEN
             CALL dlarfb( 'Left', 'Transpose', 'Forward',
     $                   'Columnwise', m-j+1, n-m, k-j+1,
     $                   a( j, j ), lda, work(j), lbwork,
     $                   a( j, m+1 ), lda, work(lbwork*nb+nt*nt+1),
     $                   n-m)
         ELSE
             CALL dlarfb( 'Left', 'Transpose', 'Forward',
     $                   'Columnwise', m-j+1, n-m, k-j+1,
     $                   a( j, j ), lda,
     $                   work(lbwork*nb+1),
     $                   nt, a( j, m+1 ), lda, work(lbwork*nb+nt*nt+1),
     $                   n-m)
         END IF
 
      END IF
 
*
*     Report the workspace size computed for the path taken
*     (IWS = N unless the blocked-code size was computed above).
*
      work( 1 ) = iws
      RETURN
*
*     End of DGEQRF
*

◆ dgetrf()

subroutine dgetrf	(	integer	m,
		integer	n,
		double precision, dimension( lda, * )	a,
		integer	lda,
		integer, dimension( * )	ipiv,
		integer	info )

DGETRF VARIANT: Crout Level 3 BLAS version of the algorithm.

DGETRF VARIANT: iterative version of Sivan Toledo's recursive LU algorithm

DGETRF VARIANT: left-looking Level 3 BLAS version of the algorithm.

Purpose:

!>
!> DGETRF computes an LU factorization of a general M-by-N matrix A
!> using partial pivoting with row interchanges.
!>
!> The factorization has the form
!>    A = P * L * U
!> where P is a permutation matrix, L is lower triangular with unit
!> diagonal elements (lower trapezoidal if m > n), and U is upper
!> triangular (upper trapezoidal if m < n).
!>
!> This is the Crout Level 3 BLAS version of the algorithm.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> On entry, the M-by-N matrix to be factored. !> On exit, the factors L and U from the factorization !> A = PLU; the unit diagonal elements of L are not stored. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (min(M,N)) !> The pivot indices; for 1 <= i <= min(M,N), row i of the !> matrix was interchanged with row IPIV(i). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, U(i,i) is exactly zero. The factorization !> has been completed, but the factor U is exactly !> singular, and division by zero will occur if it is used !> to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Purpose:

!>
!> DGETRF computes an LU factorization of a general M-by-N matrix A
!> using partial pivoting with row interchanges.
!>
!> The factorization has the form
!>    A = P * L * U
!> where P is a permutation matrix, L is lower triangular with unit
!> diagonal elements (lower trapezoidal if m > n), and U is upper
!> triangular (upper trapezoidal if m < n).
!>
!> This is the left-looking Level 3 BLAS version of the algorithm.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> On entry, the M-by-N matrix to be factored. !> On exit, the factors L and U from the factorization !> A = PLU; the unit diagonal elements of L are not stored. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (min(M,N)) !> The pivot indices; for 1 <= i <= min(M,N), row i of the !> matrix was interchanged with row IPIV(i). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, U(i,i) is exactly zero. The factorization !> has been completed, but the factor U is exactly !> singular, and division by zero will occur if it is used !> to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Purpose:

!>
!> DGETRF computes an LU factorization of a general M-by-N matrix A
!> using partial pivoting with row interchanges.
!>
!> The factorization has the form
!>    A = P * L * U
!> where P is a permutation matrix, L is lower triangular with unit
!> diagonal elements (lower trapezoidal if m > n), and U is upper
!> triangular (upper trapezoidal if m < n).
!>
!> This code implements an iterative version of Sivan Toledo's recursive
!> LU algorithm[1].  For square matrices, this iterative version should
!> be within a factor of two of the optimum number of memory transfers.
!>
!> The pattern is as follows, with the large blocks of U being updated
!> in one call to DTRSM, and the dotted lines denoting sections that
!> have had all pending permutations applied:
!>
!>  1 2 3 4 5 6 7 8
!> +-+-+---+-------+------
!> | |1|   |       |
!> |.+-+ 2 |       |
!> | | |   |       |
!> |.|.+-+-+   4   |
!> | | | |1|       |
!> | | |.+-+       |
!> | | | | |       |
!> |.|.|.|.+-+-+---+  8
!> | | | | | |1|   |
!> | | | | |.+-+ 2 |
!> | | | | | | |   |
!> | | | | |.|.+-+-+
!> | | | | | | | |1|
!> | | | | | | |.+-+
!> | | | | | | | | |
!> |.|.|.|.|.|.|.|.+-----
!> | | | | | | | | |
!>
!> The 1-2-1-4-1-2-1-8-... pattern is the position of the last 1 bit in
!> the binary expansion of the current column.  Each Schur update is
!> applied as soon as the necessary portion of U is available.
!>
!> [1] Toledo, S. 1997. Locality of Reference in LU Decomposition with
!> Partial Pivoting. SIAM J. Matrix Anal. Appl. 18, 4 (Oct. 1997),
!> 1065-1081. http://dx.doi.org/10.1137/S0895479896297744
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> On entry, the M-by-N matrix to be factored. !> On exit, the factors L and U from the factorization !> A = PLU; the unit diagonal elements of L are not stored. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (min(M,N)) !> The pivot indices; for 1 <= i <= min(M,N), row i of the !> matrix was interchanged with row IPIV(i). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, U(i,i) is exactly zero. The factorization !> has been completed, but the factor U is exactly !> singular, and division by zero will occur if it is used !> to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Definition at line 101 of file dgetrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Blocked LU factorization with partial pivoting.  Every block
*     column is first updated from the factors computed so far, then
*     factored by DGETF2; the matching block row of U is produced
*     right after the row interchanges have been applied.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, M, N
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      DOUBLE PRECISION   A( LDA, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE
      PARAMETER          ( ONE = 1.0D+0 )
*     ..
*     .. Local Scalars ..
*     BLKINF - INFO returned by DGETF2 for the current panel
*     JCOL   - first column of the current panel
*     JEND   - last column of the current panel
*     JNEXT  - first column to the right of the current panel
*     KMIN   - min(M,N)
*     NBLK   - block size returned by ILAENV
*     NPANEL - number of columns in the current panel
*     NTRAIL - number of columns to the right of the current panel
*     PIVOFF - JCOL-1, offset turning panel-local pivots into global
*     PROW   - loop index over the pivot entries of the panel
      INTEGER            BLKINF, JCOL, JEND, JNEXT, KMIN, NBLK,
     $                   NPANEL, NTRAIL, PIVOFF, PROW
*     ..
*     .. External Subroutines ..
      EXTERNAL           DGEMM, DGETF2, DLASWP, DTRSM, XERBLA
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ILAENV
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX, MIN
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  The checks run from the highest
*     argument position to the lowest, so the last assignment made
*     leaves the lowest-numbered offending argument in INFO.
*
      INFO = 0
      IF( LDA.LT.MAX( 1, M ) ) INFO = -4
      IF( N.LT.0 ) INFO = -2
      IF( M.LT.0 ) INFO = -1
      IF( INFO.NE.0 ) THEN
         CALL XERBLA( 'DGETRF', -INFO )
         RETURN
      END IF
*
*     An empty matrix needs no work (M and N are non-negative here).
*
      KMIN = MIN( M, N )
      IF( KMIN.EQ.0 ) RETURN
*
*     Ask the environment for the block size.
*
      NBLK = ILAENV( 1, 'DGETRF', ' ', M, N, -1, -1 )
*
*     A block size that is trivial or not smaller than min(M,N)
*     leaves nothing to block: hand everything to the unblocked code.
*
      IF( NBLK.LE.1 .OR. NBLK.GE.KMIN ) THEN
         CALL DGETF2( M, N, A, LDA, IPIV, INFO )
         RETURN
      END IF
*
*     Blocked code: sweep over the panels of NBLK columns.
*
      DO JCOL = 1, KMIN, NBLK
         NPANEL = MIN( KMIN-JCOL+1, NBLK )
         JEND = JCOL + NPANEL - 1
         JNEXT = JEND + 1
         NTRAIL = N - JEND
         PIVOFF = JCOL - 1
*
*        Bring the panel up to date with the columns to its left.
*
         CALL DGEMM( 'No transpose', 'No transpose',
     $               M-PIVOFF, NPANEL, PIVOFF, -ONE,
     $               A( JCOL, 1 ), LDA, A( 1, JCOL ), LDA, ONE,
     $               A( JCOL, JCOL ), LDA )
*
*        Factor the panel (diagonal and subdiagonal blocks) and
*        record the first exactly-zero pivot, if any.
*
         CALL DGETF2( M-PIVOFF, NPANEL, A( JCOL, JCOL ), LDA,
     $                IPIV( JCOL ), BLKINF )
         IF( INFO.EQ.0 .AND. BLKINF.GT.0 ) INFO = BLKINF + PIVOFF
*
*        Convert the panel-local pivot indices into row indices of A.
*
         DO PROW = JCOL, MIN( M, JEND )
            IPIV( PROW ) = IPIV( PROW ) + PIVOFF
         END DO
*
*        Row interchanges for the columns left of the panel.
*
         CALL DLASWP( PIVOFF, A, LDA, JCOL, JEND, IPIV, 1 )
*
         IF( NTRAIL.GT.0 ) THEN
*
*           Row interchanges for the columns right of the panel.
*
            CALL DLASWP( NTRAIL, A( 1, JNEXT ), LDA, JCOL, JEND,
     $                   IPIV, 1 )
*
*           Update the block row to the right of the panel ...
*
            CALL DGEMM( 'No transpose', 'No transpose',
     $                  NPANEL, NTRAIL, PIVOFF, -ONE,
     $                  A( JCOL, 1 ), LDA, A( 1, JNEXT ), LDA, ONE,
     $                  A( JCOL, JNEXT ), LDA )
*
*           ... and solve with the unit lower triangle of the panel
*           to obtain the block row of U.
*
            CALL DTRSM( 'Left', 'Lower', 'No transpose', 'Unit',
     $                  NPANEL, NTRAIL, ONE, A( JCOL, JCOL ), LDA,
     $                  A( JCOL, JNEXT ), LDA )
         END IF
      END DO
      RETURN
*
*     End of DGETRF
*

◆ sgeqrf()

subroutine sgeqrf	(	integer	m,
		integer	n,
		real, dimension( lda, * )	a,
		integer	lda,
		real, dimension( * )	tau,
		real, dimension( * )	work,
		integer	lwork,
		integer	info )

SGEQRF VARIANT: left-looking Level 3 BLAS version of the algorithm.

Purpose:

!>
!> SGEQRF computes a QR factorization of a real M-by-N matrix A:
!> A = Q * R.
!>
!> This is the left-looking Level 3 BLAS version of the algorithm.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is REAL array, dimension (LDA,N) !> On entry, the M-by-N matrix A. !> On exit, the elements on and above the diagonal of the array !> contain the min(M,N)-by-N upper trapezoidal matrix R (R is !> upper triangular if m >= n); the elements below the diagonal, !> with the array TAU, represent the orthogonal matrix Q as a !> product of min(m,n) elementary reflectors (see Further !> Details). !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	TAU	!> TAU is REAL array, dimension (min(M,N)) !> The scalar factors of the elementary reflectors (see Further !> Details). !>
[out]	WORK	!> WORK is REAL array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> !> The dimension of the array WORK. The dimension can be divided into three parts. !> !> 1) The part for the triangular factor T. If the very last T is not bigger !> than any of the rest, then this part is NB x ceiling(K/NB), otherwise, !> NB x (K-NT), where K = min(M,N) and NT is the dimension of the very last T !> !> 2) The part for the very last T when T is bigger than any of the rest T. !> The size of this part is NT x NT, where NT = K - ceiling ((K-NX)/NB) x NB, !> where K = min(M,N), NX is calculated by !> NX = MAX( 0, ILAENV( 3, 'SGEQRF', ' ', M, N, -1, -1 ) ) !> !> 3) The part for slarfb is of size max((N-M)*K, (N-M)*NB, K*NB, NB*NB) !> !> So LWORK = part1 + part2 + part3 !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Further Details

!>
!>  The matrix Q is represented as a product of elementary reflectors
!>
!>     Q = H(1) H(2) . . . H(k), where k = min(m,n).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - tau * v * v'
!>
!>  where tau is a real scalar, and v is a real vector with
!>  v(1:i-1) = 0 and v(i) = 1; v(i+1:m) is stored on exit in A(i+1:m,i),
!>  and tau in TAU(i).
!>
!>

Definition at line 150 of file sgeqrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of the SGEQRF variant.  Column blocks of width NB are
*     factored with SGEQR2 after the block reflectors of all earlier
*     blocks have been applied to them with SLARFB; the triangular
*     factors T built by SLARFT are kept in WORK so that they can be
*     reused.  Columns M+1:N (when N > M) are updated at the very end.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, LWORK, M, N
*     ..
*     .. Array Arguments ..
      REAL               A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
*     K      - min(M,N)
*     NB     - block size from ILAENV; may be reduced if LWORK is small
*     NX     - crossover point from ILAENV (blocked -> unblocked)
*     NT     - order of the very last triangular factor T
*     LBWORK - leading dimension used for the T's stored in WORK
*     LLWORK - scratch requirement, expressed in units of NB
*     IWS    - workspace size written to WORK(1) on a normal return
      LOGICAL            LQUERY
      INTEGER            I, IB, IINFO, IWS, J, K, LWKOPT, NB,
     $                   NBMIN, NX, LBWORK, NT, LLWORK
*     ..
*     .. External Subroutines ..
      EXTERNAL           sgeqr2, slarfb, slarft, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. External Functions ..
*     SCEIL is defined outside this routine; it is used below wherever
*     the LWORK documentation speaks of a ceiling.
      INTEGER            ILAENV
      REAL               SCEIL
      EXTERNAL           ilaenv, sceil
*     ..
*     .. Executable Statements ..
 
*
*     Defaults.  IWS = N is what WORK(1) reports when the blocked
*     workspace computation further down is not reached.
*
      info = 0
      nbmin = 2
      nx = 0
      iws = n
      k = min( m, n )
      nb = ilaenv( 1, 'SGEQRF', ' ', m, n, -1, -1 )
 
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
*
*        Determine when to cross over from blocked to unblocked code.
*
         nx = max( 0, ilaenv( 3, 'SGEQRF', ' ', m, n, -1, -1 ) )
      END IF
*
*     Get NT, the order of the very last T: the number of columns
*     left between the end of the last NB-wide block (blocks start at
*     columns up to K-NX) and column K, e.g.:
*
*            NB=3     2NB=6       K=10
*            |        |           |
*      1--2--3--4--5--6--7--8--9--10
*                  |     \________/
*               K-NX=5      NT=4
*
*     So here 4 x 4 is the last T stored in the workspace
*
      nt = k-sceil(real(k-nx)/real(nb))*nb
 
*
*     optimal workspace = space for SLARFB + space for normal T's + space for the last T
*
*     LLWORK is first the SLARFB scratch size in elements and is then
*     converted to a count of NB-sized units (rounded up), so that it
*     can be added to LBWORK before the multiplication by NB below.
*
      llwork = max(max((n-m)*k, (n-m)*nb), max(k*nb, nb*nb))
      llwork = sceil(real(llwork)/real(nb))
 
      IF ( nt.GT.nb ) THEN
 
*
*         The last T is larger than NB: it gets its own NT x NT area
*         and the regular T's only span K-NT columns.
*
          lbwork = k-nt
*
*         Optimal workspace for SLARFB = MAX(1,N)*NT
*         NOTE(review): this formula is inherited from the original
*         comment and does not match the expression below - confirm.
*
          lwkopt = (lbwork+llwork)*nb
          work( 1 ) = (lwkopt+nt*nt)
 
      ELSE
 
*
*         The last T fits in an NB-wide slot: round K up to a
*         multiple of NB for the T storage.
*
          lbwork = sceil(real(k)/real(nb))*nb
          lwkopt = (lbwork+llwork-nb)*nb
          work( 1 ) = lwkopt
 
      END IF
 
*
*     Test the input arguments
*     (LWORK = -1 is a workspace query and is never an error.)
*
      lquery = ( lwork.EQ.-1 )
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -4
      ELSE IF( lwork.LT.max( 1, n ) .AND. .NOT.lquery ) THEN
         info = -7
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'SGEQRF', -info )
         RETURN
      ELSE IF( lquery ) THEN
*
*        Workspace query: WORK(1) already holds the size set above.
*
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( k.EQ.0 ) THEN
         work( 1 ) = 1
         RETURN
      END IF
*
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
 
         IF( nx.LT.k ) THEN
*
*           Determine if workspace is large enough for blocked code.
*
            IF ( nt.LE.nb ) THEN
                iws = (lbwork+llwork-nb)*nb
            ELSE
                iws = (lbwork+llwork)*nb+nt*nt
            END IF
 
            IF( lwork.LT.iws ) THEN
*
*              Not enough workspace to use optimal NB:  reduce NB and
*              determine the minimum value of NB.
*
               IF ( nt.LE.nb ) THEN
                    nb = lwork / (llwork+(lbwork-nb))
               ELSE
                    nb = (lwork-nt*nt)/(lbwork+llwork)
               END IF
 
               nbmin = max( 2, ilaenv( 2, 'SGEQRF', ' ', m, n, -1,
     $                 -1 ) )
            END IF
         END IF
      END IF
*
      IF( nb.GE.nbmin .AND. nb.LT.k .AND. nx.LT.k ) THEN
*
*        Use blocked code initially
*
         DO 10 i = 1, k - nx, nb
            ib = min( k-i+1, nb )
*
*           Update the current column using old T's
*
*           WORK(J) with leading dimension LBWORK is passed in the
*           T / LDT positions of SLARFB; the scratch area handed to
*           SLARFB and SGEQR2 starts at WORK(LBWORK*NB+NT*NT+1).
*
            DO 20 j = 1, i - nb, nb
*
*              Apply H' to A(J:M,I:I+IB-1) from the left
*
               CALL slarfb( 'Left', 'Transpose', 'Forward',
     $                      'Columnwise', m-j+1, ib, nb,
     $                      a( j, j ), lda, work(j), lbwork,
     $                      a( j, i ), lda, work(lbwork*nb+nt*nt+1),
     $                      ib)
 
20          CONTINUE
*
*           Compute the QR factorization of the current block
*           A(I:M,I:I+IB-1)
*
            CALL sgeqr2( m-i+1, ib, a( i, i ), lda, tau( i ),
     $                        work(lbwork*nb+nt*nt+1), iinfo )
 
            IF( i+ib.LE.n ) THEN
*
*              Form the triangular factor of the block reflector
*              H = H(i) H(i+1) . . . H(i+ib-1)
*              and store it at WORK(I) for the later updates.
*
               CALL slarft( 'Forward', 'Columnwise', m-i+1, ib,
     $                      a( i, i ), lda, tau( i ),
     $                      work(i), lbwork )
*
            END IF
   10    CONTINUE
      ELSE
         i = 1
      END IF
*
*     Use unblocked code to factor the last or only block.
*
*     After loop 10 completes, I is the first loop value beyond K-NX,
*     i.e. the first column not factored by the blocked code; I = 1
*     means that no blocked step was taken.
*
      IF( i.LE.k ) THEN
 
         IF ( i .NE. 1 )   THEN
 
             DO 30 j = 1, i - nb, nb
*
*                Apply H' to A(J:M,I:K) from the left
*
                 CALL slarfb( 'Left', 'Transpose', 'Forward',
     $                       'Columnwise', m-j+1, k-i+1, nb,
     $                       a( j, j ), lda, work(j), lbwork,
     $                       a( j, i ), lda, work(lbwork*nb+nt*nt+1),
     $                       k-i+1)
30           CONTINUE
 
             CALL sgeqr2( m-i+1, k-i+1, a( i, i ), lda, tau( i ),
     $                   work(lbwork*nb+nt*nt+1),iinfo )
 
         ELSE
*
*        No blocked step was taken (I = 1): factor the whole matrix
*        with unblocked code, using WORK from its first element.
*
         CALL sgeqr2( m-i+1, n-i+1, a( i, i ), lda, tau( i ),
     $               work,iinfo )
 
         END IF
      END IF
 
 
*
*     Apply update to the column M+1:N when N > M
*
      IF ( m.LT.n .AND. i.NE.1) THEN
*
*         Form the last triangular factor of the block reflector
*         H = H(i) H(i+1) . . . H(i+ib-1)
*
*         It goes into the regular T storage when NT <= NB, otherwise
*         into the separate NT x NT area at WORK(LBWORK*NB+1).
*
          IF ( nt .LE. nb ) THEN
               CALL slarft( 'Forward', 'Columnwise', m-i+1, k-i+1,
     $                     a( i, i ), lda, tau( i ), work(i), lbwork )
          ELSE
               CALL slarft( 'Forward', 'Columnwise', m-i+1, k-i+1,
     $                     a( i, i ), lda, tau( i ),
     $                     work(lbwork*nb+1), nt )
          END IF
 
*
*         Apply H' to A(1:M,M+1:N) from the left
*
          DO 40 j = 1, k-nx, nb
 
               ib = min( k-j+1, nb )
 
               CALL slarfb( 'Left', 'Transpose', 'Forward',
     $                     'Columnwise', m-j+1, n-m, ib,
     $                     a( j, j ), lda, work(j), lbwork,
     $                     a( j, m+1 ), lda, work(lbwork*nb+nt*nt+1),
     $                     n-m)
 
40       CONTINUE
 
*
*        J keeps the value it had when loop 40 terminated (the first
*        loop value beyond K-NX); the calls below rely on it to
*        address the last block, whose T was formed just above.
*
         IF ( nt.LE.nb ) THEN
             CALL slarfb( 'Left', 'Transpose', 'Forward',
     $                   'Columnwise', m-j+1, n-m, k-j+1,
     $                   a( j, j ), lda, work(j), lbwork,
     $                   a( j, m+1 ), lda, work(lbwork*nb+nt*nt+1),
     $                   n-m)
         ELSE
             CALL slarfb( 'Left', 'Transpose', 'Forward',
     $                   'Columnwise', m-j+1, n-m, k-j+1,
     $                   a( j, j ), lda,
     $                   work(lbwork*nb+1),
     $                   nt, a( j, m+1 ), lda, work(lbwork*nb+nt*nt+1),
     $                   n-m)
         END IF
 
      END IF
 
*
*     Report the workspace size IWS in WORK(1).
*
      work( 1 ) = iws
      RETURN
*
*     End of SGEQRF
*

◆ sgetrf()

subroutine sgetrf	(	integer	m,
		integer	n,
		real, dimension( lda, * )	a,
		integer	lda,
		integer, dimension( * )	ipiv,
		integer	info )

SGETRF VARIANT: Crout Level 3 BLAS version of the algorithm.

SGETRF VARIANT: iterative version of Sivan Toledo's recursive LU algorithm

SGETRF VARIANT: left-looking Level 3 BLAS version of the algorithm.

Purpose:

!>
!> SGETRF computes an LU factorization of a general M-by-N matrix A
!> using partial pivoting with row interchanges.
!>
!> The factorization has the form
!>    A = P * L * U
!> where P is a permutation matrix, L is lower triangular with unit
!> diagonal elements (lower trapezoidal if m > n), and U is upper
!> triangular (upper trapezoidal if m < n).
!>
!> This is the Crout Level 3 BLAS version of the algorithm.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is REAL array, dimension (LDA,N) !> On entry, the M-by-N matrix to be factored. !> On exit, the factors L and U from the factorization !> A = PLU; the unit diagonal elements of L are not stored. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (min(M,N)) !> The pivot indices; for 1 <= i <= min(M,N), row i of the !> matrix was interchanged with row IPIV(i). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, U(i,i) is exactly zero. The factorization !> has been completed, but the factor U is exactly !> singular, and division by zero will occur if it is used !> to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Purpose:

!>
!> SGETRF computes an LU factorization of a general M-by-N matrix A
!> using partial pivoting with row interchanges.
!>
!> The factorization has the form
!>    A = P * L * U
!> where P is a permutation matrix, L is lower triangular with unit
!> diagonal elements (lower trapezoidal if m > n), and U is upper
!> triangular (upper trapezoidal if m < n).
!>
!> This is the left-looking Level 3 BLAS version of the algorithm.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is REAL array, dimension (LDA,N) !> On entry, the M-by-N matrix to be factored. !> On exit, the factors L and U from the factorization !> A = PLU; the unit diagonal elements of L are not stored. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (min(M,N)) !> The pivot indices; for 1 <= i <= min(M,N), row i of the !> matrix was interchanged with row IPIV(i). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, U(i,i) is exactly zero. The factorization !> has been completed, but the factor U is exactly !> singular, and division by zero will occur if it is used !> to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Purpose:

!>
!> SGETRF computes an LU factorization of a general M-by-N matrix A
!> using partial pivoting with row interchanges.
!>
!> The factorization has the form
!>    A = P * L * U
!> where P is a permutation matrix, L is lower triangular with unit
!> diagonal elements (lower trapezoidal if m > n), and U is upper
!> triangular (upper trapezoidal if m < n).
!>
!> This code implements an iterative version of Sivan Toledo's recursive
!> LU algorithm[1].  For square matrices, this iterative version should
!> be within a factor of two of the optimum number of memory transfers.
!>
!> The pattern is as follows, with the large blocks of U being updated
!> in one call to STRSM, and the dotted lines denoting sections that
!> have had all pending permutations applied:
!>
!>  1 2 3 4 5 6 7 8
!> +-+-+---+-------+------
!> | |1|   |       |
!> |.+-+ 2 |       |
!> | | |   |       |
!> |.|.+-+-+   4   |
!> | | | |1|       |
!> | | |.+-+       |
!> | | | | |       |
!> |.|.|.|.+-+-+---+  8
!> | | | | | |1|   |
!> | | | | |.+-+ 2 |
!> | | | | | | |   |
!> | | | | |.|.+-+-+
!> | | | | | | | |1|
!> | | | | | | |.+-+
!> | | | | | | | | |
!> |.|.|.|.|.|.|.|.+-----
!> | | | | | | | | |
!>
!> The 1-2-1-4-1-2-1-8-... pattern is the position of the last 1 bit in
!> the binary expansion of the current column.  Each Schur update is
!> applied as soon as the necessary portion of U is available.
!>
!> [1] Toledo, S. 1997. Locality of Reference in LU Decomposition with
!> Partial Pivoting. SIAM J. Matrix Anal. Appl. 18, 4 (Oct. 1997),
!> 1065-1081. http://dx.doi.org/10.1137/S0895479896297744
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is REAL array, dimension (LDA,N) !> On entry, the M-by-N matrix to be factored. !> On exit, the factors L and U from the factorization !> A = PLU; the unit diagonal elements of L are not stored. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (min(M,N)) !> The pivot indices; for 1 <= i <= min(M,N), row i of the !> matrix was interchanged with row IPIV(i). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, U(i,i) is exactly zero. The factorization !> has been completed, but the factor U is exactly !> singular, and division by zero will occur if it is used !> to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Definition at line 101 of file sgetrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Blocked LU factorization with partial pivoting.  Every block
*     column is first updated from the factors computed so far, then
*     factored by SGETF2; the matching block row of U is produced
*     right after the row interchanges have been applied.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, M, N
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      REAL               A( LDA, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE
      PARAMETER          ( ONE = 1.0E+0 )
*     ..
*     .. Local Scalars ..
*     BLKINF - INFO returned by SGETF2 for the current panel
*     JCOL   - first column of the current panel
*     JEND   - last column of the current panel
*     JNEXT  - first column to the right of the current panel
*     KMIN   - min(M,N)
*     NBLK   - block size returned by ILAENV
*     NPANEL - number of columns in the current panel
*     NTRAIL - number of columns to the right of the current panel
*     PIVOFF - JCOL-1, offset turning panel-local pivots into global
*     PROW   - loop index over the pivot entries of the panel
      INTEGER            BLKINF, JCOL, JEND, JNEXT, KMIN, NBLK,
     $                   NPANEL, NTRAIL, PIVOFF, PROW
*     ..
*     .. External Subroutines ..
      EXTERNAL           SGEMM, SGETF2, SLASWP, STRSM, XERBLA
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ILAENV
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX, MIN
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  The checks run from the highest
*     argument position to the lowest, so the last assignment made
*     leaves the lowest-numbered offending argument in INFO.
*
      INFO = 0
      IF( LDA.LT.MAX( 1, M ) ) INFO = -4
      IF( N.LT.0 ) INFO = -2
      IF( M.LT.0 ) INFO = -1
      IF( INFO.NE.0 ) THEN
         CALL XERBLA( 'SGETRF', -INFO )
         RETURN
      END IF
*
*     An empty matrix needs no work (M and N are non-negative here).
*
      KMIN = MIN( M, N )
      IF( KMIN.EQ.0 ) RETURN
*
*     Ask the environment for the block size.
*
      NBLK = ILAENV( 1, 'SGETRF', ' ', M, N, -1, -1 )
*
*     A block size that is trivial or not smaller than min(M,N)
*     leaves nothing to block: hand everything to the unblocked code.
*
      IF( NBLK.LE.1 .OR. NBLK.GE.KMIN ) THEN
         CALL SGETF2( M, N, A, LDA, IPIV, INFO )
         RETURN
      END IF
*
*     Blocked code: sweep over the panels of NBLK columns.
*
      DO JCOL = 1, KMIN, NBLK
         NPANEL = MIN( KMIN-JCOL+1, NBLK )
         JEND = JCOL + NPANEL - 1
         JNEXT = JEND + 1
         NTRAIL = N - JEND
         PIVOFF = JCOL - 1
*
*        Bring the panel up to date with the columns to its left.
*
         CALL SGEMM( 'No transpose', 'No transpose',
     $               M-PIVOFF, NPANEL, PIVOFF, -ONE,
     $               A( JCOL, 1 ), LDA, A( 1, JCOL ), LDA, ONE,
     $               A( JCOL, JCOL ), LDA )
*
*        Factor the panel (diagonal and subdiagonal blocks) and
*        record the first exactly-zero pivot, if any.
*
         CALL SGETF2( M-PIVOFF, NPANEL, A( JCOL, JCOL ), LDA,
     $                IPIV( JCOL ), BLKINF )
         IF( INFO.EQ.0 .AND. BLKINF.GT.0 ) INFO = BLKINF + PIVOFF
*
*        Convert the panel-local pivot indices into row indices of A.
*
         DO PROW = JCOL, MIN( M, JEND )
            IPIV( PROW ) = IPIV( PROW ) + PIVOFF
         END DO
*
*        Row interchanges for the columns left of the panel.
*
         CALL SLASWP( PIVOFF, A, LDA, JCOL, JEND, IPIV, 1 )
*
         IF( NTRAIL.GT.0 ) THEN
*
*           Row interchanges for the columns right of the panel.
*
            CALL SLASWP( NTRAIL, A( 1, JNEXT ), LDA, JCOL, JEND,
     $                   IPIV, 1 )
*
*           Update the block row to the right of the panel ...
*
            CALL SGEMM( 'No transpose', 'No transpose',
     $                  NPANEL, NTRAIL, PIVOFF, -ONE,
     $                  A( JCOL, 1 ), LDA, A( 1, JNEXT ), LDA, ONE,
     $                  A( JCOL, JNEXT ), LDA )
*
*           ... and solve with the unit lower triangle of the panel
*           to obtain the block row of U.
*
            CALL STRSM( 'Left', 'Lower', 'No transpose', 'Unit',
     $                  NPANEL, NTRAIL, ONE, A( JCOL, JCOL ), LDA,
     $                  A( JCOL, JNEXT ), LDA )
         END IF
      END DO
      RETURN
*
*     End of SGETRF
*

◆ zgeqrf()

subroutine zgeqrf	(	integer	m,
		integer	n,
		complex*16, dimension( lda, * )	a,
		integer	lda,
		complex*16, dimension( * )	tau,
		complex*16, dimension( * )	work,
		integer	lwork,
		integer	info )

ZGEQRF VARIANT: left-looking Level 3 BLAS version of the algorithm.

Purpose:

!>
!> ZGEQRF computes a QR factorization of a complex M-by-N matrix A:
!> A = Q * R.
!>
!> This is the left-looking Level 3 BLAS version of the algorithm.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX*16 array, dimension (LDA,N) !> On entry, the M-by-N matrix A. !> On exit, the elements on and above the diagonal of the array !> contain the min(M,N)-by-N upper trapezoidal matrix R (R is !> upper triangular if m >= n); the elements below the diagonal, !> with the array TAU, represent the unitary matrix Q as a !> product of min(m,n) elementary reflectors (see Further !> Details). !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	TAU	!> TAU is COMPLEX*16 array, dimension (min(M,N)) !> The scalar factors of the elementary reflectors (see Further !> Details). !>
[out]	WORK	!> WORK is COMPLEX*16 array, dimension (MAX(1,LWORK)) !> On exit, if INFO = 0, WORK(1) returns the optimal LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> !> The dimension of the array WORK. The dimension can be divided into three parts. !> !> 1) The part for the triangular factor T. If the very last T is not bigger !> than any of the rest, then this part is NB x ceiling(K/NB), otherwise, !> NB x (K-NT), where K = min(M,N) and NT is the dimension of the very last T !> !> 2) The part for the very last T when T is bigger than any of the rest T. !> The size of this part is NT x NT, where NT = K - ceiling ((K-NX)/NB) x NB, !> where K = min(M,N), NX is calculated by !> NX = MAX( 0, ILAENV( 3, 'ZGEQRF', ' ', M, N, -1, -1 ) ) !> !> 3) The part for zlarfb is of size max((N-M)*K, (N-M)*NB, K*NB, NB*NB) !> !> So LWORK = part1 + part2 + part3 !> !> If LWORK = -1, then a workspace query is assumed; the routine !> only calculates the optimal size of the WORK array, returns !> this value as the first entry of the WORK array, and no error !> message related to LWORK is issued by XERBLA. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Further Details

!>
!>  The matrix Q is represented as a product of elementary reflectors
!>
!>     Q = H(1) H(2) . . . H(k), where k = min(m,n).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - tau * v * v'
!>
!>  where tau is a complex scalar, and v is a complex vector with
!>  v(1:i-1) = 0 and v(i) = 1; v(i+1:m) is stored on exit in A(i+1:m,i),
!>  and tau in TAU(i).
!>
!>

Definition at line 150 of file zgeqrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of ZGEQRF, left-looking blocked variant: computes a QR
*  factorization of the M-by-N COMPLEX*16 matrix A in place, storing
*  the reflector scalars in TAU and using WORK both for the
*  triangular factors T of the block reflectors and as scratch for
*  ZLARFB / ZGEQR2.
*
*  Arguments (as used below):
*     M, N    (in)     matrix dimensions, checked to be >= 0
*     A       (in/out) array with leading dimension LDA >= max(1,M)
*     TAU     (out)    filled by ZGEQR2, read by ZLARFT
*     WORK    (out)    workspace; WORK(1) returns the workspace size
*     LWORK   (in)     length of WORK, or -1 for a workspace query
*     INFO    (out)    0 on success, -i if argument i is illegal
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, LWORK, M, N
*     ..
*     .. Array Arguments ..
      COMPLEX*16         A( LDA, * ), TAU( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
*     LBWORK is used as the leading dimension of the T storage in
*     WORK, LLWORK is the scratch size expressed in units of NB, and
*     NT is the order of the last (left-over) T.
      LOGICAL            LQUERY
      INTEGER            I, IB, IINFO, IWS, J, K, LWKOPT, NB,
     $                   NBMIN, NX, LBWORK, NT, LLWORK
*     ..
*     .. External Subroutines ..
      EXTERNAL           zgeqr2, zlarfb, zlarft, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. External Functions ..
*     SCEIL is an external REAL function; presumably a ceiling
*     helper (its definition is not shown here - confirm).
      INTEGER            ILAENV
      REAL               SCEIL
      EXTERNAL           ilaenv, sceil
*     ..
*     .. Executable Statements ..
 
*     Defaults: unblocked crossover NX = 0, minimum block size 2 and
*     a reported workspace of N; NB is the block size from ILAENV.
      info = 0
      nbmin = 2
      nx = 0
      iws = n
      k = min( m, n )
      nb = ilaenv( 1, 'ZGEQRF', ' ', m, n, -1, -1 )
 
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
*
*        Determine when to cross over from blocked to unblocked code.
*
         nx = max( 0, ilaenv( 3, 'ZGEQRF', ' ', m, n, -1, -1 ) )
      END IF
*
*     Get NT, the size of the very last T, i.e. what is left over
*     between the last multiple of NB at or after K-NX and K, e.g.:
*
*            NB=3     2NB=6       K=10
*            |        |           |
*      1--2--3--4--5--6--7--8--9--10
*                  |     \________/
*               K-NX=5      NT=4
*
*     So here 4 x 4 is the last T stored in the workspace
*
*     (The REAL result of SCEIL(...)*NB is converted back to INTEGER
*     by the assignment.)
*
      nt = k-sceil(real(k-nx)/real(nb))*nb
 
*
*     optimal workspace = space for zlarfb + space for normal T's + space for the last T
*
*     LLWORK is first the scratch size in elements, then rounded up
*     to a whole number of NB-sized units.
*
      llwork = max(max((n-m)*k, (n-m)*nb), max(k*nb, nb*nb))
      llwork = sceil(real(llwork)/real(nb))
 
      IF ( nt.GT.nb ) THEN
 
*         The last T is larger than NB x NB, so it gets its own
*         NT x NT area in addition to the regular T storage.
          lbwork = k-nt
*
*         Optimal workspace for zlarfb = MAX(1,N)*NT
*
          lwkopt = (lbwork+llwork)*nb
          work( 1 ) = (lwkopt+nt*nt)
 
      ELSE
 
*         The last T fits in the regular NB-wide T storage.
          lbwork = sceil(real(k)/real(nb))*nb
          lwkopt = (lbwork+llwork-nb)*nb
          work( 1 ) = lwkopt
 
      END IF
 
*
*     Test the input arguments
*
*     LWORK = -1 requests a workspace query: WORK(1) was set above
*     and the routine returns without factoring.
*
      lquery = ( lwork.EQ.-1 )
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -4
      ELSE IF( lwork.LT.max( 1, n ) .AND. .NOT.lquery ) THEN
         info = -7
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'ZGEQRF', -info )
         RETURN
      ELSE IF( lquery ) THEN
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( k.EQ.0 ) THEN
         work( 1 ) = 1
         RETURN
      END IF
*
      IF( nb.GT.1 .AND. nb.LT.k ) THEN
 
         IF( nx.LT.k ) THEN
*
*           Determine if workspace is large enough for blocked code.
*           IWS repeats the sizes written to WORK(1) above.
*
            IF ( nt.LE.nb ) THEN
                iws = (lbwork+llwork-nb)*nb
            ELSE
                iws = (lbwork+llwork)*nb+nt*nt
            END IF
 
            IF( lwork.LT.iws ) THEN
*
*              Not enough workspace to use optimal NB:  reduce NB and
*              determine the minimum value of NB.
*
*              NOTE(review): LBWORK, LLWORK and NT were derived from
*              the original NB and are not recomputed after NB is
*              reduced here - confirm the WORK layout stays valid.
*
               IF ( nt.LE.nb ) THEN
                    nb = lwork / (llwork+(lbwork-nb))
               ELSE
                    nb = (lwork-nt*nt)/(lbwork+llwork)
               END IF
 
               nbmin = max( 2, ilaenv( 2, 'ZGEQRF', ' ', m, n, -1,
     $                 -1 ) )
            END IF
         END IF
      END IF
*
      IF( nb.GE.nbmin .AND. nb.LT.k .AND. nx.LT.k ) THEN
*
*        Use blocked code initially
*
*        WORK layout used by the calls below:
*          WORK(J), leading dimension LBWORK : T of the panel that
*                                              starts at column J
*          WORK(LBWORK*NB+1), order NT       : the last T when NT > NB
*          WORK(LBWORK*NB+NT*NT+1)           : scratch for ZLARFB and
*                                              ZGEQR2
*
         DO 10 i = 1, k - nx, nb
            ib = min( k-i+1, nb )
*
*           Update the current column using old T's
*           (left-looking: every previously factored panel J < I is
*           applied to the current panel before it is factored)
*
            DO 20 j = 1, i - nb, nb
*
*              Apply H' to A(J:M,I:I+IB-1) from the left
*
               CALL zlarfb( 'Left', 'Transpose', 'Forward',
     $                      'Columnwise', m-j+1, ib, nb,
     $                      a( j, j ), lda, work(j), lbwork,
     $                      a( j, i ), lda, work(lbwork*nb+nt*nt+1),
     $                      ib)
 
20          CONTINUE
*
*           Compute the QR factorization of the current block
*           A(I:M,I:I+IB-1)
*
            CALL zgeqr2( m-i+1, ib, a( i, i ), lda, tau( i ),
     $                        work(lbwork*nb+nt*nt+1), iinfo )
 
            IF( i+ib.LE.n ) THEN
*
*              Form the triangular factor of the block reflector
*              H = H(i) H(i+1) . . . H(i+ib-1)
*              and keep it in WORK(I) for later panels.
*
               CALL zlarft( 'Forward', 'Columnwise', m-i+1, ib,
     $                      a( i, i ), lda, tau( i ),
     $                      work(i), lbwork )
*
            END IF
   10    CONTINUE
      ELSE
         i = 1
      END IF
*
*     Use unblocked code to factor the last or only block.
*
*     After loop 10 completes, I holds the first column index that
*     the blocked loop did not process; I = 1 means no blocked step
*     was taken.
*
      IF( i.LE.k ) THEN
 
         IF ( i .NE. 1 )   THEN
 
*            Bring the remaining columns I:K up to date with all
*            previously factored panels before factoring them.
             DO 30 j = 1, i - nb, nb
*
*                Apply H' to A(J:M,I:K) from the left
*
                 CALL zlarfb( 'Left', 'Transpose', 'Forward',
     $                       'Columnwise', m-j+1, k-i+1, nb,
     $                       a( j, j ), lda, work(j), lbwork,
     $                       a( j, i ), lda, work(lbwork*nb+nt*nt+1),
     $                       k-i+1)
30           CONTINUE
 
             CALL zgeqr2( m-i+1, k-i+1, a( i, i ), lda, tau( i ),
     $                   work(lbwork*nb+nt*nt+1),iinfo )
 
         ELSE
*
*        Use unblocked code to factor the last or only block.
*        (I = 1: the whole matrix, all N columns, is factored here
*        using the start of WORK as scratch.)
*
         CALL zgeqr2( m-i+1, n-i+1, a( i, i ), lda, tau( i ),
     $               work,iinfo )
 
         END IF
      END IF
 
 
*
*     Apply update to the column M+1:N when N > M
*     (only needed when blocked code ran, i.e. I differs from 1; the
*     pure unblocked call above already covers all N columns)
*
      IF ( m.LT.n .AND. i.NE.1) THEN
*
*         Form the last triangular factor of the block reflector
*         H = H(i) H(i+1) . . . H(i+ib-1)
*         stored with the regular T's if NT <= NB, otherwise in the
*         separate NT x NT area.
*
          IF ( nt .LE. nb ) THEN
               CALL zlarft( 'Forward', 'Columnwise', m-i+1, k-i+1,
     $                     a( i, i ), lda, tau( i ), work(i), lbwork )
          ELSE
               CALL zlarft( 'Forward', 'Columnwise', m-i+1, k-i+1,
     $                     a( i, i ), lda, tau( i ),
     $                     work(lbwork*nb+1), nt )
          END IF
 
*
*         Apply H' to A(1:M,M+1:N) from the left
*
          DO 40 j = 1, k-nx, nb
 
               ib = min( k-j+1, nb )
 
               CALL zlarfb( 'Left', 'Transpose', 'Forward',
     $                     'Columnwise', m-j+1, n-m, ib,
     $                     a( j, j ), lda, work(j), lbwork,
     $                     a( j, m+1 ), lda, work(lbwork*nb+nt*nt+1),
     $                     n-m)
 
40       CONTINUE
 
*        After loop 40, J is the first index past the blocked
*        panels; the calls below apply the last block reflector
*        (columns J:K) using the T formed just above.
         IF ( nt.LE.nb ) THEN
             CALL zlarfb( 'Left', 'Transpose', 'Forward',
     $                   'Columnwise', m-j+1, n-m, k-j+1,
     $                   a( j, j ), lda, work(j), lbwork,
     $                   a( j, m+1 ), lda, work(lbwork*nb+nt*nt+1),
     $                   n-m)
         ELSE
             CALL zlarfb( 'Left', 'Transpose', 'Forward',
     $                   'Columnwise', m-j+1, n-m, k-j+1,
     $                   a( j, j ), lda,
     $                   work(lbwork*nb+1),
     $                   nt, a( j, m+1 ), lda, work(lbwork*nb+nt*nt+1),
     $                   n-m)
         END IF
 
      END IF
 
*     Report the workspace size that was assumed (N unless the
*     blocked-code size was computed above).
      work( 1 ) = iws
      RETURN
*
*     End of ZGEQRF
*

◆ zgetrf()

subroutine zgetrf	(	integer	m,
		integer	n,
		complex*16, dimension( lda, * )	a,
		integer	lda,
		integer, dimension( * )	ipiv,
		integer	info )

ZGETRF VARIANT: Crout Level 3 BLAS version of the algorithm.

ZGETRF VARIANT: iterative version of Sivan Toledo's recursive LU algorithm

ZGETRF VARIANT: left-looking Level 3 BLAS version of the algorithm.

Purpose:

!>
!> ZGETRF computes an LU factorization of a general M-by-N matrix A
!> using partial pivoting with row interchanges.
!>
!> The factorization has the form
!>    A = P * L * U
!> where P is a permutation matrix, L is lower triangular with unit
!> diagonal elements (lower trapezoidal if m > n), and U is upper
!> triangular (upper trapezoidal if m < n).
!>
!> This is the Crout Level 3 BLAS version of the algorithm.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX*16 array, dimension (LDA,N) !> On entry, the M-by-N matrix to be factored. !> On exit, the factors L and U from the factorization !> A = P*L*U; the unit diagonal elements of L are not stored. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (min(M,N)) !> The pivot indices; for 1 <= i <= min(M,N), row i of the !> matrix was interchanged with row IPIV(i). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, U(i,i) is exactly zero. The factorization !> has been completed, but the factor U is exactly !> singular, and division by zero will occur if it is used !> to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Purpose:

!>
!> ZGETRF computes an LU factorization of a general M-by-N matrix A
!> using partial pivoting with row interchanges.
!>
!> The factorization has the form
!>    A = P * L * U
!> where P is a permutation matrix, L is lower triangular with unit
!> diagonal elements (lower trapezoidal if m > n), and U is upper
!> triangular (upper trapezoidal if m < n).
!>
!> This is the left-looking Level 3 BLAS version of the algorithm.
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX*16 array, dimension (LDA,N) !> On entry, the M-by-N matrix to be factored. !> On exit, the factors L and U from the factorization !> A = P*L*U; the unit diagonal elements of L are not stored. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (min(M,N)) !> The pivot indices; for 1 <= i <= min(M,N), row i of the !> matrix was interchanged with row IPIV(i). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, U(i,i) is exactly zero. The factorization !> has been completed, but the factor U is exactly !> singular, and division by zero will occur if it is used !> to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Purpose:

!>
!> ZGETRF computes an LU factorization of a general M-by-N matrix A
!> using partial pivoting with row interchanges.
!>
!> The factorization has the form
!>    A = P * L * U
!> where P is a permutation matrix, L is lower triangular with unit
!> diagonal elements (lower trapezoidal if m > n), and U is upper
!> triangular (upper trapezoidal if m < n).
!>
!> This code implements an iterative version of Sivan Toledo's recursive
!> LU algorithm[1].  For square matrices, this iterative version should
!> be within a factor of two of the optimum number of memory transfers.
!>
!> The pattern is as follows, with the large blocks of U being updated
!> in one call to ZTRSM, and the dotted lines denoting sections that
!> have had all pending permutations applied:
!>
!>  1 2 3 4 5 6 7 8
!> +-+-+---+-------+------
!> | |1|   |       |
!> |.+-+ 2 |       |
!> | | |   |       |
!> |.|.+-+-+   4   |
!> | | | |1|       |
!> | | |.+-+       |
!> | | | | |       |
!> |.|.|.|.+-+-+---+  8
!> | | | | | |1|   |
!> | | | | |.+-+ 2 |
!> | | | | | | |   |
!> | | | | |.|.+-+-+
!> | | | | | | | |1|
!> | | | | | | |.+-+
!> | | | | | | | | |
!> |.|.|.|.|.|.|.|.+-----
!> | | | | | | | | |
!>
!> The 1-2-1-4-1-2-1-8-... pattern is the position of the last 1 bit in
!> the binary expansion of the current column.  Each Schur update is
!> applied as soon as the necessary portion of U is available.
!>
!> [1] Toledo, S. 1997. Locality of Reference in LU Decomposition with
!> Partial Pivoting. SIAM J. Matrix Anal. Appl. 18, 4 (Oct. 1997),
!> 1065-1081. http://dx.doi.org/10.1137/S0895479896297744
!>
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in,out]	A	!> A is COMPLEX*16 array, dimension (LDA,N) !> On entry, the M-by-N matrix to be factored. !> On exit, the factors L and U from the factorization !> A = P*L*U; the unit diagonal elements of L are not stored. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	IPIV	!> IPIV is INTEGER array, dimension (min(M,N)) !> The pivot indices; for 1 <= i <= min(M,N), row i of the !> matrix was interchanged with row IPIV(i). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -i, the i-th argument had an illegal value !> > 0: if INFO = i, U(i,i) is exactly zero. The factorization !> has been completed, but the factor U is exactly !> singular, and division by zero will occur if it is used !> to solve a system of equations. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: December 2016

Definition at line 101 of file zgetrf.f.

*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of ZGETRF: LU factorization with row interchanges of the
*  M-by-N COMPLEX*16 matrix A, done in place.  For each block column
*  the code first updates it with the already computed factors,
*  then factors it with ZGETF2, and finally updates and solves for
*  the matching block row of U (a Crout-style ordering).
*
*  Arguments (as used below):
*     M, N    (in)     matrix dimensions, checked to be >= 0
*     A       (in/out) array with leading dimension LDA >= max(1,M)
*     IPIV    (out)    row interchange indices, global row numbers
*     INFO    (out)    0 on success, -i if argument i is illegal,
*                      or the global index reported by ZGETF2 for
*                      the first panel that returned IINFO > 0
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, M, N
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      COMPLEX*16         A( LDA, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX*16         ONE
      parameter( one = ( 1.0d+0, 0.0d+0 ) )
*     ..
*     .. Local Scalars ..
      INTEGER            I, IINFO, J, JB, NB
*     ..
*     .. External Subroutines ..
      EXTERNAL           zgemm, zgetf2, zlaswp, ztrsm, xerbla
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -4
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'ZGETRF', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( m.EQ.0 .OR. n.EQ.0 )
     $   RETURN
*
*     Determine the block size for this environment.
*
      nb = ilaenv( 1, 'ZGETRF', ' ', m, n, -1, -1 )
      IF( nb.LE.1 .OR. nb.GE.min( m, n ) ) THEN
*
*        Use unblocked code.
*
         CALL zgetf2( m, n, a, lda, ipiv, info )
      ELSE
*
*        Use blocked code.
*
*        J is the first column of the current panel and JB its
*        width (the last panel may be narrower than NB).
*
         DO 20 j = 1, min( m, n ), nb
            jb = min( min( m, n )-j+1, nb )
*
*           Update current block.
*           A(J:M,J:J+JB-1) -= A(J:M,1:J-1) * A(1:J-1,J:J+JB-1)
*           (for J = 1 the inner dimension J-1 is zero)
*
            CALL zgemm( 'No transpose', 'No transpose',
     $                 m-j+1, jb, j-1, -one,
     $                 a( j, 1 ), lda, a( 1, j ), lda, one,
     $                 a( j, j ), lda )
 
*
*           Factor diagonal and subdiagonal blocks and test for exact
*           singularity.
*
            CALL zgetf2( m-j+1, jb, a( j, j ), lda, ipiv( j ), iinfo )
*
*           Adjust INFO and the pivot indices.
*           ZGETF2 worked on the submatrix starting at row J, so its
*           results are shifted by J-1 to refer to rows of A.  Only
*           the first nonzero IINFO is recorded in INFO.
*
            IF( info.EQ.0 .AND. iinfo.GT.0 )
     $         info = iinfo + j - 1
            DO 10 i = j, min( m, j+jb-1 )
               ipiv( i ) = j - 1 + ipiv( i )
   10       CONTINUE
*
*           Apply interchanges to column 1:J-1
*
            CALL zlaswp( j-1, a, lda, j, j+jb-1, ipiv, 1 )
*
            IF ( j+jb.LE.n ) THEN
*
*              Apply interchanges to column J+JB:N
*
               CALL zlaswp( n-j-jb+1, a( 1, j+jb ), lda, j, j+jb-1,
     $                     ipiv, 1 )
*
*              Update the block row to the right of the panel:
*              A(J:J+JB-1,J+JB:N) -= A(J:J+JB-1,1:J-1) *
*                                    A(1:J-1,J+JB:N)
*
               CALL zgemm( 'No transpose', 'No transpose',
     $                    jb, n-j-jb+1, j-1, -one,
     $                    a( j, 1 ), lda, a( 1, j+jb ), lda, one,
     $                    a( j, j+jb ), lda )
*
*              Compute block row of U.
*              (triangular solve with the unit lower triangular
*              block stored at A(J,J))
*
               CALL ztrsm( 'Left', 'Lower', 'No transpose', 'Unit',
     $                    jb, n-j-jb+1, one, a( j, j ), lda,
     $                    a( j, j+jb ), lda )
            END IF
 
   20    CONTINUE
 
      END IF
      RETURN
*
*     End of ZGETRF
*

OpenRadioss 2025.1.11 OpenRadioss project