d5/d0a/cgelst_8f_source.html

*> \brief <b> CGELST solves overdetermined or underdetermined systems for GE matrices using QR or LQ factorization with compact WY representation of Q.</b>

*

*  =========== DOCUMENTATION ===========

*

* Online html documentation available at

*            http://www.netlib.org/lapack/explore-html/

*

*> Download CGELST + dependencies

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/cgelst.f">

*> [TGZ]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/cgelst.f">

*> [ZIP]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/cgelst.f">

*> [TXT]</a>

*

*  Definition:

*  ===========

*

*       SUBROUTINE CGELST( TRANS, M, N, NRHS, A, LDA, B, LDB, WORK, LWORK,

*                          INFO )

*

*       .. Scalar Arguments ..

*       CHARACTER          TRANS

*       INTEGER            INFO, LDA, LDB, LWORK, M, N, NRHS

*       ..

*       .. Array Arguments ..

*       COMPLEX            A( LDA, * ), B( LDB, * ), WORK( * )

*       ..

*

*

*> \par Purpose:

*  =============

*>

*> \verbatim

*>

*> CGELST solves overdetermined or underdetermined complex linear systems

*> involving an M-by-N matrix A, or its conjugate-transpose, using a QR

*> or LQ factorization of A with compact WY representation of Q.

*>

*> It is assumed that A has full rank, and only a rudimentary protection

*> against rank-deficient matrices is provided. This subroutine only detects

*> exact rank-deficiency, where a diagonal element of the triangular factor

*> of A is exactly zero.

*>

*> It is conceivable for one (or more) of the diagonal elements of the triangular

*> factor of A to be subnormally tiny numbers without this subroutine signalling

*> an error. The solutions computed for such almost-rank-deficient matrices may

*> be less accurate due to a loss of numerical precision.

*>

*> The following options are provided:

*>

*> 1. If TRANS = 'N' and m >= n:  find the least squares solution of

*>    an overdetermined system, i.e., solve the least squares problem

*>                 minimize || B - A*X ||.

*>

*> 2. If TRANS = 'N' and m < n:  find the minimum norm solution of

*>    an underdetermined system A * X = B.

*>

*> 3. If TRANS = 'C' and m >= n:  find the minimum norm solution of

*>    an underdetermined system A**H * X = B.

*>

*> 4. If TRANS = 'C' and m < n:  find the least squares solution of

*>    an overdetermined system, i.e., solve the least squares problem

*>                 minimize || B - A**H * X ||.

*>

*> Several right hand side vectors b and solution vectors x can be

*> handled in a single call; they are stored as the columns of the

*> M-by-NRHS right hand side matrix B and the N-by-NRHS solution

*> matrix X.

*> \endverbatim

*

*  Arguments:

*  ==========

*

*> \param[in] TRANS

*> \verbatim

*>          TRANS is CHARACTER*1

*>          = 'N': the linear system involves A;

*>          = 'C': the linear system involves A**H.

*> \endverbatim

*>

*> \param[in] M

*> \verbatim

*>          M is INTEGER

*>          The number of rows of the matrix A.  M >= 0.

*> \endverbatim

*>

*> \param[in] N

*> \verbatim

*>          N is INTEGER

*>          The number of columns of the matrix A.  N >= 0.

*> \endverbatim

*>

*> \param[in] NRHS

*> \verbatim

*>          NRHS is INTEGER

*>          The number of right hand sides, i.e., the number of

*>          columns of the matrices B and X. NRHS >= 0.

*> \endverbatim

*>

*> \param[in,out] A

*> \verbatim

*>          A is COMPLEX array, dimension (LDA,N)

*>          On entry, the M-by-N matrix A.

*>          On exit,

*>            if M >= N, A is overwritten by details of its QR

*>                       factorization as returned by CGEQRT;

*>            if M <  N, A is overwritten by details of its LQ

*>                       factorization as returned by CGELQT.

*> \endverbatim

*>

*> \param[in] LDA

*> \verbatim

*>          LDA is INTEGER

*>          The leading dimension of the array A.  LDA >= max(1,M).

*> \endverbatim

*>

*> \param[in,out] B

*> \verbatim

*>          B is COMPLEX array, dimension (LDB,NRHS)

*>          On entry, the matrix B of right hand side vectors, stored

*>          columnwise; B is M-by-NRHS if TRANS = 'N', or N-by-NRHS

*>          if TRANS = 'C'.

*>          On exit, if INFO = 0, B is overwritten by the solution

*>          vectors, stored columnwise:

*>          if TRANS = 'N' and m >= n, rows 1 to n of B contain the least

*>          squares solution vectors; the residual sum of squares for the

*>          solution in each column is given by the sum of squares of

*>          modulus of elements N+1 to M in that column;

*>          if TRANS = 'N' and m < n, rows 1 to N of B contain the

*>          minimum norm solution vectors;

*>          if TRANS = 'C' and m >= n, rows 1 to M of B contain the

*>          minimum norm solution vectors;

*>          if TRANS = 'C' and m < n, rows 1 to M of B contain the

*>          least squares solution vectors; the residual sum of squares

*>          for the solution in each column is given by the sum of

*>          squares of the modulus of elements M+1 to N in that column.

*> \endverbatim

*>

*> \param[in] LDB

*> \verbatim

*>          LDB is INTEGER

*>          The leading dimension of the array B. LDB >= MAX(1,M,N).

*> \endverbatim

*>

*> \param[out] WORK

*> \verbatim

*>          WORK is COMPLEX array, dimension (MAX(1,LWORK))

*>          On exit, if INFO = 0, WORK(1) returns the optimal LWORK.

*> \endverbatim

*>

*> \param[in] LWORK

*> \verbatim

*>          LWORK is INTEGER

*>          The dimension of the array WORK.

*>          LWORK >= max( 1, MN + max( MN, NRHS ) ).

*>          For optimal performance,

*>          LWORK >= max( 1, (MN + max( MN, NRHS ))*NB ).

*>          where MN = min(M,N) and NB is the optimum block size.

*>

*>          If LWORK = -1, then a workspace query is assumed; the routine

*>          only calculates the optimal size of the WORK array, returns

*>          this value as the first entry of the WORK array, and no error

*>          message related to LWORK is issued by XERBLA.

*> \endverbatim

*>

*> \param[out] INFO

*> \verbatim

*>          INFO is INTEGER

*>          = 0:  successful exit

*>          < 0:  if INFO = -i, the i-th argument had an illegal value

*>          > 0:  if INFO =  i, the i-th diagonal element of the

*>                triangular factor of A is exactly zero, so that A does not have

*>                full rank; the least squares solution could not be

*>                computed.

*> \endverbatim

*

*  Authors:

*  ========

*

*> \author Univ. of Tennessee

*> \author Univ. of California Berkeley

*> \author Univ. of Colorado Denver

*> \author NAG Ltd.

*

*> \ingroup gelst

*

*> \par Contributors:

*  ==================

*>

*> \verbatim

*>

*>  November 2022,  Igor Kozachenko,

*>                  Computer Science Division,

*>                  University of California, Berkeley

*> \endverbatim

*

*  =====================================================================


      SUBROUTINE cgelst( TRANS, M, N, NRHS, A, LDA, B, LDB, WORK,
     $                   LWORK, INFO )
*
*  -- LAPACK driver routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd.--
*
*  Solves a full-rank complex least squares / minimum norm problem
*  with the M-by-N matrix A (TRANS = 'N') or its conjugate transpose
*  (TRANS = 'C'), using a blocked QR (M >= N) or LQ (M < N)
*  factorization followed by a triangular solve.  B is overwritten
*  by the solution.  INFO < 0 flags an illegal argument, INFO > 0 is
*  passed through from CTRTRS (singular triangular factor).
*
*     .. Scalar Arguments ..
      CHARACTER          TRANS
      INTEGER            INFO, LDA, LDB, LWORK, M, N, NRHS
*     ..
*     .. Array Arguments ..
      COMPLEX            A( LDA, * ), B( LDB, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE
      PARAMETER          ( ZERO = 0.0E+0, ONE = 1.0E+0 )
      COMPLEX            CZERO
      PARAMETER          ( CZERO = ( 0.0E+0, 0.0E+0 ) )
*     ..
*     .. Local Scalars ..
*     SCALEA / SCALEB : .TRUE. when A / B was rescaled on entry
*     ATARG  / BTARG  : norm that A / B was rescaled to
*     NROWB           : number of rows of the right hand side in B
*     NROWX           : number of rows of the solution in B
*     ITW             : first entry of WORK used as scratch space
*                       (entries before it hold the T factors)
      LOGICAL            LQUERY, SCALEA, SCALEB, TPSD
      INTEGER            IR, ITW, JC, LWKOPT, MINMN, MXRHS, NB,
     $                   NBMIN, NROWB, NROWX
      REAL               ANRM, ATARG, BIGNUM, BNRM, BTARG, SMLNUM
*     ..
*     .. Local Arrays ..
      REAL               RWORK( 1 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      REAL               SLAMCH, CLANGE, SROUNDUP_LWORK
      EXTERNAL           LSAME, ILAENV, SLAMCH, CLANGE,
     $                   SROUNDUP_LWORK
*     ..
*     .. External Subroutines ..
      EXTERNAL           CGELQT, CGEQRT, CGEMLQT, CGEMQRT,
     $                   CLASCL, CLASET, CTRTRS, XERBLA
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX, MIN
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments; the first offending one determines INFO.
*
      INFO = 0
      MINMN = MIN( M, N )
      LQUERY = ( LWORK.EQ.-1 )
      IF( .NOT.LSAME( TRANS, 'N' ) .AND.
     $    .NOT.LSAME( TRANS, 'C' ) ) THEN
         INFO = -1
      ELSE IF( M.LT.0 ) THEN
         INFO = -2
      ELSE IF( N.LT.0 ) THEN
         INFO = -3
      ELSE IF( NRHS.LT.0 ) THEN
         INFO = -4
      ELSE IF( LDA.LT.MAX( 1, M ) ) THEN
         INFO = -6
      ELSE IF( LDB.LT.MAX( 1, M, N ) ) THEN
         INFO = -8
      ELSE IF( .NOT.LQUERY .AND.
     $         LWORK.LT.MAX( 1, MINMN+MAX( MINMN, NRHS ) ) ) THEN
         INFO = -10
      END IF
*
*     Block size and optimal workspace.  This is also done when only
*     LWORK is too small, so that WORK( 1 ) still reports the optimal
*     size in that case.
*
      IF( INFO.EQ.0 .OR. INFO.EQ.-10 ) THEN
         TPSD = .NOT.LSAME( TRANS, 'N' )
         NB = ILAENV( 1, 'CGELST', ' ', M, N, -1, -1 )
         MXRHS = MAX( MINMN, NRHS )
         LWKOPT = MAX( 1, ( MINMN+MXRHS )*NB )
         WORK( 1 ) = SROUNDUP_LWORK( LWKOPT )
      END IF
*
      IF( INFO.NE.0 ) THEN
         CALL XERBLA( 'CGELST ', -INFO )
         RETURN
      END IF
*
*     Workspace query: WORK( 1 ) has already been set.
*
      IF( LQUERY )
     $   RETURN
*
*     Quick return for an empty problem: the solution is zero.
*
      IF( MIN( M, N, NRHS ).EQ.0 ) THEN
         CALL CLASET( 'Full', MAX( M, N ), NRHS, CZERO, CZERO,
     $                B, LDB )
         WORK( 1 ) = SROUNDUP_LWORK( LWKOPT )
         RETURN
      END IF
*
*     *GEQRT and *GELQT routines cannot accept NB larger than
*     min(M,N).  NB is also limited by the supplied LWORK (at this
*     stage LWORK is known to be at least the minimum required
*     workspace, but it may be less than optimal).
*
      NB = MIN( NB, MINMN, LWORK / ( MINMN+MXRHS ) )
*
*     Fall back to NB = 1 when NB is below the minimum block size
*     for which blocked code is used.
*
      NBMIN = MAX( 2, ILAENV( 2, 'CGELST', ' ', M, N, -1, -1 ) )
      IF( NB.LT.NBMIN )
     $   NB = 1
*
*     WORK( 1 : MINMN*NB ) holds the T factors (leading dimension
*     NB); the remainder, starting at WORK( ITW ), is scratch space
*     for the factorization and the application of Q.
*
      ITW = MINMN*NB + 1
*
*     Get machine parameters
*
      SMLNUM = SLAMCH( 'S' ) / SLAMCH( 'P' )
      BIGNUM = ONE / SMLNUM
*
*     Scale A if max element outside range [SMLNUM,BIGNUM]
*
      ANRM = CLANGE( 'M', M, N, A, LDA, RWORK )
      IF( ANRM.EQ.ZERO ) THEN
*
*        Matrix all zero. Return zero solution.
*
         CALL CLASET( 'Full', MAX( M, N ), NRHS, CZERO, CZERO,
     $                B, LDB )
         WORK( 1 ) = SROUNDUP_LWORK( LWKOPT )
         RETURN
      END IF
*
      SCALEA = .FALSE.
      IF( ANRM.GT.ZERO .AND. ANRM.LT.SMLNUM ) THEN
*
*        Norm too small: scale up to SMLNUM
*
         SCALEA = .TRUE.
         ATARG = SMLNUM
      ELSE IF( ANRM.GT.BIGNUM ) THEN
*
*        Norm too large: scale down to BIGNUM
*
         SCALEA = .TRUE.
         ATARG = BIGNUM
      END IF
      IF( SCALEA ) THEN
         CALL CLASCL( 'G', 0, 0, ANRM, ATARG, M, N, A, LDA, INFO )
      END IF
*
*     Scale B in the same way.  The right hand side has N rows when
*     the system involves A**H and M rows otherwise.
*
      IF( TPSD ) THEN
         NROWB = N
      ELSE
         NROWB = M
      END IF
      BNRM = CLANGE( 'M', NROWB, NRHS, B, LDB, RWORK )
      SCALEB = .FALSE.
      IF( BNRM.GT.ZERO .AND. BNRM.LT.SMLNUM ) THEN
         SCALEB = .TRUE.
         BTARG = SMLNUM
      ELSE IF( BNRM.GT.BIGNUM ) THEN
         SCALEB = .TRUE.
         BTARG = BIGNUM
      END IF
      IF( SCALEB ) THEN
         CALL CLASCL( 'G', 0, 0, BNRM, BTARG, NROWB, NRHS, B, LDB,
     $                INFO )
      END IF
*
      IF( M.GE.N ) THEN
*
*        M >= N:
*        Compute the blocked QR factorization of A,
*        using the compact WY representation of Q.
*
         CALL CGEQRT( M, N, NB, A, LDA, WORK( 1 ), NB, WORK( ITW ),
     $                INFO )
*
         IF( TPSD ) THEN
*
*           M >= N, A is conjugate-transposed:
*           Underdetermined system of equations,
*           minimum norm solution of A**H * X = B.
*
*           Block 1: B(1:N,1:NRHS) := inv(R**H) * B(1:N,1:NRHS)
*
            CALL CTRTRS( 'Upper', 'Conjugate transpose', 'Non-unit',
     $                   N, NRHS, A, LDA, B, LDB, INFO )
*
*           Singular R: leave with INFO as set by CTRTRS.
*
            IF( INFO.GT.0 )
     $         RETURN
*
*           Block 2: B(N+1:M,1:NRHS) := 0
*
            DO JC = 1, NRHS
               DO IR = N + 1, M
                  B( IR, JC ) = CZERO
               END DO
            END DO
*
*           Compute B(1:M,1:NRHS) := Q * B(1:M,1:NRHS),
*           using the compact WY representation of Q.
*
            CALL CGEMQRT( 'Left', 'No transpose', M, NRHS, N, NB,
     $                    A, LDA, WORK( 1 ), NB, B, LDB,
     $                    WORK( ITW ), INFO )
*
            NROWX = M
*
         ELSE
*
*           M >= N, A is not transposed:
*           Overdetermined system of equations,
*           least-squares problem, min || A * X - B ||.
*
*           Compute B(1:M,1:NRHS) := Q**H * B(1:M,1:NRHS),
*           using the compact WY representation of Q.
*
            CALL CGEMQRT( 'Left', 'Conjugate transpose', M, NRHS, N,
     $                    NB, A, LDA, WORK( 1 ), NB, B, LDB,
     $                    WORK( ITW ), INFO )
*
*           Compute B(1:N,1:NRHS) := inv(R) * B(1:N,1:NRHS)
*
            CALL CTRTRS( 'Upper', 'No transpose', 'Non-unit', N,
     $                   NRHS, A, LDA, B, LDB, INFO )
*
*           Singular R: leave with INFO as set by CTRTRS.
*
            IF( INFO.GT.0 )
     $         RETURN
*
            NROWX = N
*
         END IF
*
      ELSE
*
*        M < N:
*        Compute the blocked LQ factorization of A,
*        using the compact WY representation of Q.
*
         CALL CGELQT( M, N, NB, A, LDA, WORK( 1 ), NB, WORK( ITW ),
     $                INFO )
*
         IF( TPSD ) THEN
*
*           M < N, A is conjugate-transposed:
*           Overdetermined system of equations,
*           least-squares problem, min || A**H * X - B ||.
*
*           Compute B(1:N,1:NRHS) := Q * B(1:N,1:NRHS),
*           using the compact WY representation of Q.
*
            CALL CGEMLQT( 'Left', 'No transpose', N, NRHS, M, NB,
     $                    A, LDA, WORK( 1 ), NB, B, LDB,
     $                    WORK( ITW ), INFO )
*
*           Compute B(1:M,1:NRHS) := inv(L**H) * B(1:M,1:NRHS)
*
            CALL CTRTRS( 'Lower', 'Conjugate transpose', 'Non-unit',
     $                   M, NRHS, A, LDA, B, LDB, INFO )
*
*           Singular L: leave with INFO as set by CTRTRS.
*
            IF( INFO.GT.0 )
     $         RETURN
*
            NROWX = M
*
         ELSE
*
*           M < N, A is not transposed:
*           Underdetermined system of equations,
*           minimum norm solution of A * X = B.
*
*           Block 1: B(1:M,1:NRHS) := inv(L) * B(1:M,1:NRHS)
*
            CALL CTRTRS( 'Lower', 'No transpose', 'Non-unit', M,
     $                   NRHS, A, LDA, B, LDB, INFO )
*
*           Singular L: leave with INFO as set by CTRTRS.
*
            IF( INFO.GT.0 )
     $         RETURN
*
*           Block 2: B(M+1:N,1:NRHS) := 0
*
            DO JC = 1, NRHS
               DO IR = M + 1, N
                  B( IR, JC ) = CZERO
               END DO
            END DO
*
*           Compute B(1:N,1:NRHS) := Q**H * B(1:N,1:NRHS),
*           using the compact WY representation of Q.
*
            CALL CGEMLQT( 'Left', 'Conjugate transpose', N, NRHS, M,
     $                    NB, A, LDA, WORK( 1 ), NB, B, LDB,
     $                    WORK( ITW ), INFO )
*
            NROWX = N
*
         END IF
*
      END IF
*
*     Undo scaling: first the factor introduced by rescaling A,
*     then the one introduced by rescaling B.
*
      IF( SCALEA ) THEN
         CALL CLASCL( 'G', 0, 0, ANRM, ATARG, NROWX, NRHS, B, LDB,
     $                INFO )
      END IF
      IF( SCALEB ) THEN
         CALL CLASCL( 'G', 0, 0, BTARG, BNRM, NROWX, NRHS, B, LDB,
     $                INFO )
      END IF
*
      WORK( 1 ) = SROUNDUP_LWORK( LWKOPT )
*
      RETURN
*
*     End of CGELST
*
      END

xerbla
subroutine xerbla(srname, info)
Definition cblat2.f:3285

cgelqt
subroutine cgelqt(m, n, mb, a, lda, t, ldt, work, info)
CGELQT
Definition cgelqt.f:124

cgelst
subroutine cgelst(trans, m, n, nrhs, a, lda, b, ldb, work, lwork, info)
CGELST solves overdetermined or underdetermined systems for GE matrices using QR or LQ factorization ...
Definition cgelst.f:202

cgemlqt
subroutine cgemlqt(side, trans, m, n, k, mb, v, ldv, t, ldt, c, ldc, work, info)
CGEMLQT
Definition cgemlqt.f:153

cgemqrt
subroutine cgemqrt(side, trans, m, n, k, nb, v, ldv, t, ldt, c, ldc, work, info)
CGEMQRT
Definition cgemqrt.f:166

cgeqrt
subroutine cgeqrt(m, n, nb, a, lda, t, ldt, work, info)
CGEQRT
Definition cgeqrt.f:139

clascl
subroutine clascl(type, kl, ku, cfrom, cto, m, n, a, lda, info)
CLASCL multiplies a general rectangular matrix by a real scalar defined as cto/cfrom.
Definition clascl.f:142

claset
subroutine claset(uplo, m, n, alpha, beta, a, lda)
CLASET initializes the off-diagonal elements and the diagonal elements of a matrix to given values.
Definition claset.f:104

ctrtrs
subroutine ctrtrs(uplo, trans, diag, n, nrhs, a, lda, b, ldb, info)
CTRTRS
Definition ctrtrs.f:144