d1/dfc/dgelst_8f_source.html

*> \brief <b> DGELST solves overdetermined or underdetermined systems for GE matrices using QR or LQ factorization with compact WY representation of Q.</b>

*

*  =========== DOCUMENTATION ===========

*

* Online html documentation available at

*            http://www.netlib.org/lapack/explore-html/

*

*> Download DGELST + dependencies

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/dgelst.f">

*> [TGZ]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/dgelst.f">

*> [ZIP]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/dgelst.f">

*> [TXT]</a>

*

*  Definition:

*  ===========

*

*       SUBROUTINE DGELST( TRANS, M, N, NRHS, A, LDA, B, LDB, WORK, LWORK,

*                          INFO )

*

*       .. Scalar Arguments ..

*       CHARACTER          TRANS

*       INTEGER            INFO, LDA, LDB, LWORK, M, N, NRHS

*       ..

*       .. Array Arguments ..

*       DOUBLE PRECISION   A( LDA, * ), B( LDB, * ), WORK( * )

*       ..

*

*

*> \par Purpose:

*  =============

*>

*> \verbatim

*>

*> DGELST solves overdetermined or underdetermined real linear systems

*> involving an M-by-N matrix A, or its transpose, using a QR or LQ

*> factorization of A with compact WY representation of Q.

*>

*> It is assumed that A has full rank, and only a rudimentary protection

*> against rank-deficient matrices is provided. This subroutine only detects

*> exact rank-deficiency, where a diagonal element of the triangular factor

*> of A is exactly zero.

*>

*> It is conceivable for one (or more) of the diagonal elements of the triangular

*> factor of A to be subnormally tiny numbers without this subroutine signalling

*> an error. The solutions computed for such almost-rank-deficient matrices may

*> be less accurate due to a loss of numerical precision.

*>

*> The following options are provided:

*>

*> 1. If TRANS = 'N' and m >= n:  find the least squares solution of

*>    an overdetermined system, i.e., solve the least squares problem

*>                 minimize || B - A*X ||.

*>

*> 2. If TRANS = 'N' and m < n:  find the minimum norm solution of

*>    an underdetermined system A * X = B.

*>

*> 3. If TRANS = 'T' and m >= n:  find the minimum norm solution of

*>    an underdetermined system A**T * X = B.

*>

*> 4. If TRANS = 'T' and m < n:  find the least squares solution of

*>    an overdetermined system, i.e., solve the least squares problem

*>                 minimize || B - A**T * X ||.

*>

*> Several right hand side vectors b and solution vectors x can be

*> handled in a single call; they are stored as the columns of the

*> M-by-NRHS right hand side matrix B and the N-by-NRHS solution

*> matrix X.

*> \endverbatim

*

*  Arguments:

*  ==========

*

*> \param[in] TRANS

*> \verbatim

*>          TRANS is CHARACTER*1

*>          = 'N': the linear system involves A;

*>          = 'T': the linear system involves A**T.

*> \endverbatim

*>

*> \param[in] M

*> \verbatim

*>          M is INTEGER

*>          The number of rows of the matrix A.  M >= 0.

*> \endverbatim

*>

*> \param[in] N

*> \verbatim

*>          N is INTEGER

*>          The number of columns of the matrix A.  N >= 0.

*> \endverbatim

*>

*> \param[in] NRHS

*> \verbatim

*>          NRHS is INTEGER

*>          The number of right hand sides, i.e., the number of

*>          columns of the matrices B and X. NRHS >= 0.

*> \endverbatim

*>

*> \param[in,out] A

*> \verbatim

*>          A is DOUBLE PRECISION array, dimension (LDA,N)

*>          On entry, the M-by-N matrix A.

*>          On exit,

*>            if M >= N, A is overwritten by details of its QR

*>                       factorization as returned by DGEQRT;

*>            if M <  N, A is overwritten by details of its LQ

*>                       factorization as returned by DGELQT.

*> \endverbatim

*>

*> \param[in] LDA

*> \verbatim

*>          LDA is INTEGER

*>          The leading dimension of the array A.  LDA >= max(1,M).

*> \endverbatim

*>

*> \param[in,out] B

*> \verbatim

*>          B is DOUBLE PRECISION array, dimension (LDB,NRHS)

*>          On entry, the matrix B of right hand side vectors, stored

*>          columnwise; B is M-by-NRHS if TRANS = 'N', or N-by-NRHS

*>          if TRANS = 'T'.

*>          On exit, if INFO = 0, B is overwritten by the solution

*>          vectors, stored columnwise:

*>          if TRANS = 'N' and m >= n, rows 1 to n of B contain the least

*>          squares solution vectors; the residual sum of squares for the

*>          solution in each column is given by the sum of squares of

*>          elements N+1 to M in that column;

*>          if TRANS = 'N' and m < n, rows 1 to N of B contain the

*>          minimum norm solution vectors;

*>          if TRANS = 'T' and m >= n, rows 1 to M of B contain the

*>          minimum norm solution vectors;

*>          if TRANS = 'T' and m < n, rows 1 to M of B contain the

*>          least squares solution vectors; the residual sum of squares

*>          for the solution in each column is given by the sum of

*>          squares of elements M+1 to N in that column.

*> \endverbatim

*>

*> \param[in] LDB

*> \verbatim

*>          LDB is INTEGER

*>          The leading dimension of the array B. LDB >= MAX(1,M,N).

*> \endverbatim

*>

*> \param[out] WORK

*> \verbatim

*>          WORK is DOUBLE PRECISION array, dimension (MAX(1,LWORK))

*>          On exit, if INFO = 0, WORK(1) returns the optimal LWORK.

*> \endverbatim

*>

*> \param[in] LWORK

*> \verbatim

*>          LWORK is INTEGER

*>          The dimension of the array WORK.

*>          LWORK >= max( 1, MN + max( MN, NRHS ) ).

*>          For optimal performance,

*>          LWORK >= max( 1, (MN + max( MN, NRHS ))*NB ).

*>          where MN = min(M,N) and NB is the optimum block size.

*>

*>          If LWORK = -1, then a workspace query is assumed; the routine

*>          only calculates the optimal size of the WORK array, returns

*>          this value as the first entry of the WORK array, and no error

*>          message related to LWORK is issued by XERBLA.

*> \endverbatim

*>

*> \param[out] INFO

*> \verbatim

*>          INFO is INTEGER

*>          = 0:  successful exit

*>          < 0:  if INFO = -i, the i-th argument had an illegal value

*>          > 0:  if INFO =  i, the i-th diagonal element of the

*>                triangular factor of A is exactly zero, so that A does not have

*>                full rank; the least squares solution could not be

*>                computed.

*> \endverbatim

*

*  Authors:

*  ========

*

*> \author Univ. of Tennessee

*> \author Univ. of California Berkeley

*> \author Univ. of Colorado Denver

*> \author NAG Ltd.

*

*> \ingroup gelst

*

*> \par Contributors:

*  ==================

*>

*> \verbatim

*>

*>  November 2022,  Igor Kozachenko,

*>                  Computer Science Division,

*>                  University of California, Berkeley

*> \endverbatim

*

*  =====================================================================


      SUBROUTINE dgelst( TRANS, M, N, NRHS, A, LDA, B, LDB, WORK,

     $                   LWORK,

     $                   INFO )

*
*  Summary of the implementation
*  -----------------------------
*  Solves a full-rank least squares / minimum norm problem with the
*  M-by-N matrix A (TRANS = 'N') or its transpose (TRANS = 'T'):
*
*    1. Check the arguments; INFO = -i flags the i-th argument.
*       The block size NB and the optimal workspace size LWOPT are
*       computed and LWOPT is stored in WORK(1).
*    2. Quick return (B set to zero) if M, N or NRHS is zero.
*    3. Clamp NB to min(M,N) and to what the supplied LWORK allows.
*    4. Scale A and B if their largest entries lie outside
*       [SMLNUM,BIGNUM].
*    5. Factor A with DGEQRT (M >= N) or DGELQT (M < N) and solve with
*       DGEMQRT / DGEMLQT and DTRTRS; B is overwritten in place.
*    6. Undo the scaling on the first SCLLEN rows of B.
*
*  Workspace layout used by the factor / multiply calls:
*    WORK( 1 : MN*NB )   is passed as the T argument with LDT = NB,
*    WORK( MN*NB+1 : )   is passed as the callee's WORK argument.
*

*  -- LAPACK driver routine --

*  -- LAPACK is a software package provided by Univ. of Tennessee,    --

*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd. --

*

*     .. Scalar Arguments ..

      CHARACTER          TRANS

      INTEGER            INFO, LDA, LDB, LWORK, M, N, NRHS

*     ..

*     .. Array Arguments ..

      DOUBLE PRECISION   A( LDA, * ), B( LDB, * ), WORK( * )

*     ..

*

*  =====================================================================

*

*     .. Parameters ..

      DOUBLE PRECISION   ZERO, ONE

      PARAMETER          ( ZERO = 0.0d+0, one = 1.0d+0 )

*     ..

*     .. Local Scalars ..
*     LQUERY : .TRUE. when LWORK = -1 (workspace query).
*     TPSD   : .TRUE. unless TRANS is 'N' (system uses A**T).
*     MN     : min( M, N ).
*     MNNRHS : max( MN, NRHS ).
*     LWOPT  : optimal workspace size, returned in WORK(1).
*     NB     : block size passed to the factor / multiply routines.
*     NBMIN  : smallest NB for which NB is kept; below it NB = 1.
*     BROW   : number of rows of B on entry (M, or N if TPSD).
*     IASCL  : 0 = A not scaled, 1 = scaled up to SMLNUM,
*              2 = scaled down to BIGNUM.
*     IBSCL  : same encoding as IASCL, for B.
*     SCLLEN : number of leading rows of B rescaled when the
*              scaling is undone.
*     ANRM, BNRM : values returned by DLANGE( 'M', ... ) for A and B.

      LOGICAL            LQUERY, TPSD

      INTEGER            BROW, I, IASCL, IBSCL, J, LWOPT, MN, MNNRHS,

     $                   nb, nbmin, scllen

      DOUBLE PRECISION   ANRM, BIGNUM, BNRM, SMLNUM

*     ..

*     .. Local Arrays ..
*     RWORK is only used as the work argument of DLANGE.

      DOUBLE PRECISION   RWORK( 1 )

*     ..

*     .. External Functions ..

      LOGICAL            LSAME

      INTEGER            ILAENV

      DOUBLE PRECISION   DLAMCH, DLANGE

      EXTERNAL           lsame, ilaenv, dlamch, dlange

*     ..

*     .. External Subroutines ..

      EXTERNAL           dgelqt, dgeqrt, dgemlqt, dgemqrt,

     $                   dlascl,

     $                   dlaset, dtrtrs, xerbla

*     ..

*     .. Intrinsic Functions ..

      INTRINSIC          dble, max, min

*     ..

*     .. Executable Statements ..

*

*     Test the input arguments.
*     INFO is set to minus the position of the first illegal argument.
*     The LWORK test is waived for a workspace query (LWORK = -1).

*

      info = 0

      mn = min( m, n )

      lquery = ( lwork.EQ.-1 )

      IF( .NOT.( lsame( trans, 'N' ) .OR.

     $    lsame( trans, 'T' ) ) ) THEN

         info = -1

      ELSE IF( m.LT.0 ) THEN

         info = -2

      ELSE IF( n.LT.0 ) THEN

         info = -3

      ELSE IF( nrhs.LT.0 ) THEN

         info = -4

      ELSE IF( lda.LT.max( 1, m ) ) THEN

         info = -6

      ELSE IF( ldb.LT.max( 1, m, n ) ) THEN

         info = -8

      ELSE IF( lwork.LT.max( 1, mn+max( mn, nrhs ) ) .AND. .NOT.lquery )

     $          THEN

         info = -10

      END IF

*

*     Figure out optimal block size and optimal workspace size
*     This is also done when only LWORK is illegal (INFO = -10), so
*     WORK(1) holds LWOPT before XERBLA is called below.

*

      IF( info.EQ.0 .OR. info.EQ.-10 ) THEN

*

         tpsd = .true.

         IF( lsame( trans, 'N' ) )

     $      tpsd = .false.

*

         nb = ilaenv( 1, 'DGELST', ' ', m, n, -1, -1 )

*

         mnnrhs = max( mn, nrhs )

         lwopt = max( 1, (mn+mnnrhs)*nb )

         work( 1 ) = dble( lwopt )

*

      END IF

*
*     Report an illegal argument, or return after a workspace query.

      IF( info.NE.0 ) THEN

         CALL xerbla( 'DGELST ', -info )

         RETURN

      ELSE IF( lquery ) THEN

         RETURN

      END IF

*

*     Quick return if possible
*     If any of M, N, NRHS is zero, the leading max(M,N)-by-NRHS part
*     of B is set to zero.

*

      IF( min( m, n, nrhs ).EQ.0 ) THEN

         CALL dlaset( 'Full', max( m, n ), nrhs, zero, zero, b, ldb )

         work( 1 ) = dble( lwopt )

         RETURN

      END IF

*

*     *GEQRT and *GELQT routines cannot accept NB larger than min(M,N)

*

      IF( nb.GT.mn ) nb = mn

*

*     Determine the block size from the supplied LWORK

*     (at this stage we know that LWORK >= minimum required workspace,

*     but it may be less than optimal).
*     The integer division keeps (MN + MNNRHS)*NB <= LWORK, i.e. the
*     MN*NB entries used as T plus the scratch area that follows it.

*

      nb = min( nb, lwork/( mn + mnnrhs ) )

*

*     The minimum value of NB, when blocked code is used

*

      nbmin = max( 2, ilaenv( 2, 'DGELST', ' ', m, n, -1, -1 ) )

*
*     If NB has fallen below NBMIN, use block size 1 instead.

      IF( nb.LT.nbmin ) THEN

         nb = 1

      END IF

*

*     Get machine parameters

*

      smlnum = dlamch( 'S' ) / dlamch( 'P' )

      bignum = one / smlnum

*

*     Scale A, B if max element outside range [SMLNUM,BIGNUM]
*     IASCL / IBSCL record which scaling was applied so that it can
*     be undone on the computed solution at the end.

*

      anrm = dlange( 'M', m, n, a, lda, rwork )

      iascl = 0

      IF( anrm.GT.zero .AND. anrm.LT.smlnum ) THEN

*

*        Scale matrix norm up to SMLNUM

*

         CALL dlascl( 'G', 0, 0, anrm, smlnum, m, n, a, lda, info )

         iascl = 1

      ELSE IF( anrm.GT.bignum ) THEN

*

*        Scale matrix norm down to BIGNUM

*

         CALL dlascl( 'G', 0, 0, anrm, bignum, m, n, a, lda, info )

         iascl = 2

      ELSE IF( anrm.EQ.zero ) THEN

*

*        Matrix all zero. Return zero solution.

*

         CALL dlaset( 'Full', max( m, n ), nrhs, zero, zero, b, ldb )

         work( 1 ) = dble( lwopt )

         RETURN

      END IF

*
*     BROW is the number of rows of the right hand side B on entry:
*     M when TRANS = 'N', N otherwise.

      brow = m

      IF( tpsd )

     $   brow = n

      bnrm = dlange( 'M', brow, nrhs, b, ldb, rwork )

      ibscl = 0

      IF( bnrm.GT.zero .AND. bnrm.LT.smlnum ) THEN

*

*        Scale matrix norm up to SMLNUM

*

         CALL dlascl( 'G', 0, 0, bnrm, smlnum, brow, nrhs, b, ldb,

     $                info )

         ibscl = 1

      ELSE IF( bnrm.GT.bignum ) THEN

*

*        Scale matrix norm down to BIGNUM

*

         CALL dlascl( 'G', 0, 0, bnrm, bignum, brow, nrhs, b, ldb,

     $                info )

         ibscl = 2

      END IF

*

      IF( m.GE.n ) THEN

*

*        M >= N:

*        Compute the blocked QR factorization of A,

*        using the compact WY representation of Q,

*        workspace at least N, optimally N*NB.
*        WORK(1:MN*NB) receives T (LDT = NB); scratch starts at
*        WORK(MN*NB+1).

*

         CALL dgeqrt( m, n, nb, a, lda, work( 1 ), nb,

     $                work( mn*nb+1 ), info )

*

         IF( .NOT.tpsd ) THEN

*

*           M >= N, A is not transposed:

*           Overdetermined system of equations,

*           least-squares problem, min || A * X - B ||.

*

*           Compute B(1:M,1:NRHS) := Q**T * B(1:M,1:NRHS),

*           using the compact WY representation of Q,

*           workspace at least NRHS, optimally NRHS*NB.

*

            CALL dgemqrt( 'Left', 'Transpose', m, nrhs, n, nb, a,

     $                    lda,

     $                    work( 1 ), nb, b, ldb, work( mn*nb+1 ),

     $                    info )

*

*           Compute B(1:N,1:NRHS) := inv(R) * B(1:N,1:NRHS)

*

            CALL dtrtrs( 'Upper', 'No transpose', 'Non-unit', n,

     $                   nrhs,

     $                   a, lda, b, ldb, info )

*
*           A positive INFO from DTRTRS is returned to the caller as
*           the rank-deficiency indicator; any scaling applied above
*           is not undone on this path.

            IF( info.GT.0 ) THEN

               RETURN

            END IF

*
*           The solution occupies rows 1:N of B.

            scllen = n

*

         ELSE

*

*           M >= N, A is transposed:

*           Underdetermined system of equations,

*           minimum norm solution of A**T * X = B.

*

*           Compute B := inv(R**T) * B in two row blocks of B.

*

*           Block 1: B(1:N,1:NRHS) := inv(R**T) * B(1:N,1:NRHS)

*

            CALL dtrtrs( 'Upper', 'Transpose', 'Non-unit', n, nrhs,

     $                   a, lda, b, ldb, info )

*
*           A positive INFO from DTRTRS is returned to the caller as
*           the rank-deficiency indicator; any scaling applied above
*           is not undone on this path.

            IF( info.GT.0 ) THEN

               RETURN

            END IF

*

*           Block 2: Zero out all rows below the N-th row in B:

*           B(N+1:M,1:NRHS) = ZERO

*

            DO  j = 1, nrhs

               DO i = n + 1, m

                  b( i, j ) = zero

               END DO

            END DO

*

*           Compute B(1:M,1:NRHS) := Q * B(1:M,1:NRHS); since rows
*           N+1:M of B were just zeroed, this equals
*           Q(:,1:N) * B(1:N,1:NRHS),

*           using the compact WY representation of Q,

*           workspace at least NRHS, optimally NRHS*NB.

*

            CALL dgemqrt( 'Left', 'No transpose', m, nrhs, n, nb,

     $                    a, lda, work( 1 ), nb, b, ldb,

     $                    work( mn*nb+1 ), info )

*
*           The solution occupies rows 1:M of B.

            scllen = m

*

         END IF

*

      ELSE

*

*        M < N:

*        Compute the blocked LQ factorization of A,

*        using the compact WY representation of Q,

*        workspace at least M, optimally M*NB.
*        WORK(1:MN*NB) receives T (LDT = NB); scratch starts at
*        WORK(MN*NB+1).

*

         CALL dgelqt( m, n, nb, a, lda, work( 1 ), nb,

     $                work( mn*nb+1 ), info )

*

         IF( .NOT.tpsd ) THEN

*

*           M < N, A is not transposed:

*           Underdetermined system of equations,

*           minimum norm solution of A * X = B.

*

*           Compute B := inv(L) * B in two row blocks of B.

*

*           Block 1: B(1:M,1:NRHS) := inv(L) * B(1:M,1:NRHS)

*

            CALL dtrtrs( 'Lower', 'No transpose', 'Non-unit', m,

     $                   nrhs,

     $                   a, lda, b, ldb, info )

*
*           A positive INFO from DTRTRS is returned to the caller as
*           the rank-deficiency indicator; any scaling applied above
*           is not undone on this path.

            IF( info.GT.0 ) THEN

               RETURN

            END IF

*

*           Block 2: Zero out all rows below the M-th row in B:

*           B(M+1:N,1:NRHS) = ZERO

*

            DO j = 1, nrhs

               DO i = m + 1, n

                  b( i, j ) = zero

               END DO

            END DO

*

*           Compute B(1:N,1:NRHS) := Q**T * B(1:N,1:NRHS); since rows
*           M+1:N of B were just zeroed, this equals
*           Q(1:M,:)**T * B(1:M,1:NRHS),

*           using the compact WY representation of Q,

*           workspace at least NRHS, optimally NRHS*NB.

*

            CALL dgemlqt( 'Left', 'Transpose', n, nrhs, m, nb, a,

     $                    lda,

     $                   work( 1 ), nb, b, ldb,

     $                   work( mn*nb+1 ), info )

*
*           The solution occupies rows 1:N of B.

            scllen = n

*

         ELSE

*

*           M < N, A is transposed:

*           Overdetermined system of equations,

*           least-squares problem, min || A**T * X - B ||.

*

*           Compute B(1:N,1:NRHS) := Q * B(1:N,1:NRHS),

*           using the compact WY representation of Q,

*           workspace at least NRHS, optimally NRHS*NB.

*

            CALL dgemlqt( 'Left', 'No transpose', n, nrhs, m, nb,

     $                    a, lda, work( 1 ), nb, b, ldb,

     $                    work( mn*nb+1), info )

*

*           Compute B(1:M,1:NRHS) := inv(L**T) * B(1:M,1:NRHS)

*

            CALL dtrtrs( 'Lower', 'Transpose', 'Non-unit', m, nrhs,

     $                   a, lda, b, ldb, info )

*
*           A positive INFO from DTRTRS is returned to the caller as
*           the rank-deficiency indicator; any scaling applied above
*           is not undone on this path.

            IF( info.GT.0 ) THEN

               RETURN

            END IF

*
*           The solution occupies rows 1:M of B.

            scllen = m

*

         END IF

*

      END IF

*

*     Undo scaling
*     DLASCL multiplies by CTO/CFROM.  If A was scaled, the first
*     SCLLEN rows of B are multiplied by the same factor that was
*     applied to A (SMLNUM/ANRM or BIGNUM/ANRM).  If B was scaled,
*     they are multiplied by the inverse of the factor that was
*     applied to B (BNRM/SMLNUM or BNRM/BIGNUM).

*

      IF( iascl.EQ.1 ) THEN

         CALL dlascl( 'G', 0, 0, anrm, smlnum, scllen, nrhs, b, ldb,

     $                info )

      ELSE IF( iascl.EQ.2 ) THEN

         CALL dlascl( 'G', 0, 0, anrm, bignum, scllen, nrhs, b, ldb,

     $                info )

      END IF

      IF( ibscl.EQ.1 ) THEN

         CALL dlascl( 'G', 0, 0, smlnum, bnrm, scllen, nrhs, b, ldb,

     $                info )

      ELSE IF( ibscl.EQ.2 ) THEN

         CALL dlascl( 'G', 0, 0, bignum, bnrm, scllen, nrhs, b, ldb,

     $                info )

      END IF

*
*     Return the optimal workspace size in WORK(1).

      work( 1 ) = dble( lwopt )

*

      RETURN

*

*     End of DGELST

*


      END

xerbla
subroutine xerbla(srname, info)
Definition cblat2.f:3285

dgelqt
subroutine dgelqt(m, n, mb, a, lda, t, ldt, work, info)
DGELQT
Definition dgelqt.f:137

dgelst
subroutine dgelst(trans, m, n, nrhs, a, lda, b, ldb, work, lwork, info)
DGELST solves overdetermined or underdetermined systems for GE matrices using QR or LQ factorization ...
Definition dgelst.f:202

dgemlqt
subroutine dgemlqt(side, trans, m, n, k, mb, v, ldv, t, ldt, c, ldc, work, info)
DGEMLQT
Definition dgemlqt.f:166

dgemqrt
subroutine dgemqrt(side, trans, m, n, k, nb, v, ldv, t, ldt, c, ldc, work, info)
DGEMQRT
Definition dgemqrt.f:166

dgeqrt
subroutine dgeqrt(m, n, nb, a, lda, t, ldt, work, info)
DGEQRT
Definition dgeqrt.f:139

dlascl
subroutine dlascl(type, kl, ku, cfrom, cto, m, n, a, lda, info)
DLASCL multiplies a general rectangular matrix by a real scalar defined as cto/cfrom.
Definition dlascl.f:142

dlaset
subroutine dlaset(uplo, m, n, alpha, beta, a, lda)
DLASET initializes the off-diagonal elements and the diagonal elements of a matrix to given values.
Definition dlaset.f:108

dtrtrs
subroutine dtrtrs(uplo, trans, diag, n, nrhs, a, lda, b, ldb, info)
DTRTRS
Definition dtrtrs.f:144