dd/d17/sgelst_8f_source.html

*> \brief <b> SGELST solves overdetermined or underdetermined systems for GE matrices using QR or LQ factorization with compact WY representation of Q.</b>

*

*  =========== DOCUMENTATION ===========

*

* Online html documentation available at

*            http://www.netlib.org/lapack/explore-html/

*

*> Download SGELST + dependencies

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/sgelst.f">

*> [TGZ]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/sgelst.f">

*> [ZIP]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/sgelst.f">

*> [TXT]</a>

*

*  Definition:

*  ===========

*

*       SUBROUTINE SGELST( TRANS, M, N, NRHS, A, LDA, B, LDB, WORK, LWORK,

*                          INFO )

*

*       .. Scalar Arguments ..

*       CHARACTER          TRANS

*       INTEGER            INFO, LDA, LDB, LWORK, M, N, NRHS

*       ..

*       .. Array Arguments ..

*       REAL               A( LDA, * ), B( LDB, * ), WORK( * )

*       ..

*

*

*> \par Purpose:

*  =============

*>

*> \verbatim

*>

*> SGELST solves overdetermined or underdetermined real linear systems

*> involving an M-by-N matrix A, or its transpose, using a QR or LQ

*> factorization of A with compact WY representation of Q.

*>

*> It is assumed that A has full rank, and only a rudimentary protection

*> against rank-deficient matrices is provided. This subroutine only detects

*> exact rank-deficiency, where a diagonal element of the triangular factor

*> of A is exactly zero.

*>

*> It is conceivable for one (or more) of the diagonal elements of the triangular

*> factor of A to be subnormally tiny numbers without this subroutine signalling

*> an error. The solutions computed for such almost-rank-deficient matrices may

*> be less accurate due to a loss of numerical precision.

*>

*> The following options are provided:

*>

*> 1. If TRANS = 'N' and m >= n:  find the least squares solution of

*>    an overdetermined system, i.e., solve the least squares problem

*>                 minimize || B - A*X ||.

*>

*> 2. If TRANS = 'N' and m < n:  find the minimum norm solution of

*>    an underdetermined system A * X = B.

*>

*> 3. If TRANS = 'T' and m >= n:  find the minimum norm solution of

*>    an underdetermined system A**T * X = B.

*>

*> 4. If TRANS = 'T' and m < n:  find the least squares solution of

*>    an overdetermined system, i.e., solve the least squares problem

*>                 minimize || B - A**T * X ||.

*>

*> Several right hand side vectors b and solution vectors x can be

*> handled in a single call; they are stored as the columns of the

*> M-by-NRHS right hand side matrix B and the N-by-NRHS solution

*> matrix X.

*> \endverbatim

*

*  Arguments:

*  ==========

*

*> \param[in] TRANS

*> \verbatim

*>          TRANS is CHARACTER*1

*>          = 'N': the linear system involves A;

*>          = 'T': the linear system involves A**T.

*> \endverbatim

*>

*> \param[in] M

*> \verbatim

*>          M is INTEGER

*>          The number of rows of the matrix A.  M >= 0.

*> \endverbatim

*>

*> \param[in] N

*> \verbatim

*>          N is INTEGER

*>          The number of columns of the matrix A.  N >= 0.

*> \endverbatim

*>

*> \param[in] NRHS

*> \verbatim

*>          NRHS is INTEGER

*>          The number of right hand sides, i.e., the number of

*>          columns of the matrices B and X. NRHS >= 0.

*> \endverbatim

*>

*> \param[in,out] A

*> \verbatim

*>          A is REAL array, dimension (LDA,N)

*>          On entry, the M-by-N matrix A.

*>          On exit,

*>            if M >= N, A is overwritten by details of its QR

*>                       factorization as returned by SGEQRT;

*>            if M <  N, A is overwritten by details of its LQ

*>                       factorization as returned by SGELQT.

*> \endverbatim

*>

*> \param[in] LDA

*> \verbatim

*>          LDA is INTEGER

*>          The leading dimension of the array A.  LDA >= max(1,M).

*> \endverbatim

*>

*> \param[in,out] B

*> \verbatim

*>          B is REAL array, dimension (LDB,NRHS)

*>          On entry, the matrix B of right hand side vectors, stored

*>          columnwise; B is M-by-NRHS if TRANS = 'N', or N-by-NRHS

*>          if TRANS = 'T'.

*>          On exit, if INFO = 0, B is overwritten by the solution

*>          vectors, stored columnwise:

*>          if TRANS = 'N' and m >= n, rows 1 to n of B contain the least

*>          squares solution vectors; the residual sum of squares for the

*>          solution in each column is given by the sum of squares of

*>          elements N+1 to M in that column;

*>          if TRANS = 'N' and m < n, rows 1 to N of B contain the

*>          minimum norm solution vectors;

*>          if TRANS = 'T' and m >= n, rows 1 to M of B contain the

*>          minimum norm solution vectors;

*>          if TRANS = 'T' and m < n, rows 1 to M of B contain the

*>          least squares solution vectors; the residual sum of squares

*>          for the solution in each column is given by the sum of

*>          squares of elements M+1 to N in that column.

*> \endverbatim

*>

*> \param[in] LDB

*> \verbatim

*>          LDB is INTEGER

*>          The leading dimension of the array B. LDB >= MAX(1,M,N).

*> \endverbatim

*>

*> \param[out] WORK

*> \verbatim

*>          WORK is REAL array, dimension (MAX(1,LWORK))

*>          On exit, if INFO = 0, WORK(1) returns the optimal LWORK.

*> \endverbatim

*>

*> \param[in] LWORK

*> \verbatim

*>          LWORK is INTEGER

*>          The dimension of the array WORK.

*>          LWORK >= max( 1, MN + max( MN, NRHS ) ).

*>          For optimal performance,

*>          LWORK >= max( 1, (MN + max( MN, NRHS ))*NB ).

*>          where MN = min(M,N) and NB is the optimum block size.

*>

*>          If LWORK = -1, then a workspace query is assumed; the routine

*>          only calculates the optimal size of the WORK array, returns

*>          this value as the first entry of the WORK array, and no error

*>          message related to LWORK is issued by XERBLA.

*> \endverbatim

*>

*> \param[out] INFO

*> \verbatim

*>          INFO is INTEGER

*>          = 0:  successful exit

*>          < 0:  if INFO = -i, the i-th argument had an illegal value

*>          > 0:  if INFO =  i, the i-th diagonal element of the

*>                triangular factor of A is exactly zero, so that A does not have

*>                full rank; the least squares solution could not be

*>                computed.

*> \endverbatim

*

*  Authors:

*  ========

*

*> \author Univ. of Tennessee

*> \author Univ. of California Berkeley

*> \author Univ. of Colorado Denver

*> \author NAG Ltd.

*

*> \ingroup gelst

*

*> \par Contributors:

*  ==================

*>

*> \verbatim

*>

*>  November 2022,  Igor Kozachenko,

*>                  Computer Science Division,

*>                  University of California, Berkeley

*> \endverbatim

*

*  =====================================================================


      SUBROUTINE SGELST( TRANS, M, N, NRHS, A, LDA, B, LDB, WORK,
     $                   LWORK, INFO )
*
*  -- LAPACK driver routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and      --
*  -- NAG Ltd.                                                        --
*
*     Driver outline: factor A with SGEQRT (M >= N) or SGELQT (M < N),
*     then pair one triangular solve (STRTRS) with one application of
*     Q or Q**T (SGEMQRT / SGEMLQT) so that B is overwritten by the
*     solution. A and B are rescaled first when their largest entry in
*     absolute value lies outside [SMLNUM,BIGNUM]; the rescaling of the
*     solution is undone before returning.
*
      IMPLICIT NONE
*
*     .. Scalar Arguments ..
      CHARACTER          TRANS
      INTEGER            INFO, LDA, LDB, LWORK, M, N, NRHS
*     ..
*     .. Array Arguments ..
      REAL               A( LDA, * ), B( LDB, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE
      PARAMETER          ( ZERO = 0.0E+0, ONE = 1.0E+0 )
*     ..
*     .. Local Scalars ..
*     ASCALD / BSCALD : .TRUE. when A / B has been rescaled
*     ATARG  / BTARG  : the norm A / B was rescaled to
*     IWRK            : first entry of WORK behind the T factor
*     NROWB / NROWX   : number of rows of B on entry / of the solution
      LOGICAL            ASCALD, BSCALD, QUERY, TRAN, USEQR
      INTEGER            IROW, IWRK, JCOL, LWKOPT, MINMN, MXRHS, NB,
     $                   NBMIN, NROWB, NROWX
      REAL               ANORM, ATARG, BIGNUM, BNORM, BTARG, SMLNUM
*     ..
*     .. Local Arrays ..
      REAL               RWORK( 1 )
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      REAL               SLAMCH, SLANGE, SROUNDUP_LWORK
      EXTERNAL           LSAME, ILAENV, SLAMCH, SLANGE,
     $                   SROUNDUP_LWORK
*     ..
*     .. External Subroutines ..
      EXTERNAL           SGELQT, SGEQRT, SGEMLQT, SGEMQRT,
     $                   SLASCL, SLASET, STRTRS, XERBLA
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX, MIN
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments: INFO = -i flags the i-th argument.
*     An LWORK of -1 is a workspace query and is never an error.
*
      INFO = 0
      MINMN = MIN( M, N )
      QUERY = LWORK.EQ.-1
      IF( .NOT.LSAME( TRANS, 'N' ) .AND.
     $    .NOT.LSAME( TRANS, 'T' ) ) THEN
         INFO = -1
      ELSE IF( M.LT.0 ) THEN
         INFO = -2
      ELSE IF( N.LT.0 ) THEN
         INFO = -3
      ELSE IF( NRHS.LT.0 ) THEN
         INFO = -4
      ELSE IF( LDA.LT.MAX( 1, M ) ) THEN
         INFO = -6
      ELSE IF( LDB.LT.MAX( 1, M, N ) ) THEN
         INFO = -8
      ELSE IF( .NOT.QUERY .AND.
     $         LWORK.LT.MAX( 1, MINMN+MAX( MINMN, NRHS ) ) ) THEN
         INFO = -10
      END IF
*
*     Optimal block size and workspace size. This is also done when
*     LWORK is the only faulty argument, so that WORK( 1 ) carries the
*     optimal size in that case as well.
*
      IF( INFO.EQ.0 .OR. INFO.EQ.-10 ) THEN
         TRAN = .NOT.LSAME( TRANS, 'N' )
         NB = ILAENV( 1, 'SGELST', ' ', M, N, -1, -1 )
         MXRHS = MAX( MINMN, NRHS )
         LWKOPT = MAX( 1, ( MINMN+MXRHS )*NB )
         WORK( 1 ) = SROUNDUP_LWORK( LWKOPT )
      END IF
*
      IF( INFO.NE.0 ) THEN
         CALL XERBLA( 'SGELST ', -INFO )
         RETURN
      END IF
      IF( QUERY )
     $   RETURN
*
*     Quick return for an empty problem: the solution is zero.
*     (M, N and NRHS are known to be non-negative at this point.)
*
      IF( M.EQ.0 .OR. N.EQ.0 .OR. NRHS.EQ.0 ) THEN
         CALL SLASET( 'Full', MAX( M, N ), NRHS, ZERO, ZERO, B, LDB )
         WORK( 1 ) = SROUNDUP_LWORK( LWKOPT )
         RETURN
      END IF
*
*     Final block size: *GEQRT and *GELQT cannot accept NB larger than
*     min(M,N), and the supplied LWORK (at least the minimum, possibly
*     less than optimal) must hold ( MINMN+MXRHS )*NB entries.
*     Below the blocked-code threshold NBMIN, use NB = 1.
*
      NB = MIN( NB, MINMN, LWORK / ( MINMN+MXRHS ) )
      NBMIN = MAX( 2, ILAENV( 2, 'SGELST', ' ', M, N, -1, -1 ) )
      IF( NB.LT.NBMIN )
     $   NB = 1
*
*     WORK( 1 : MINMN*NB ) is passed as the T factor with leading
*     dimension NB; WORK( IWRK : ) is scratch for the routines called.
*
      IWRK = MINMN*NB + 1
*
*     Machine parameters
*
      SMLNUM = SLAMCH( 'S' ) / SLAMCH( 'P' )
      BIGNUM = ONE / SMLNUM
*
*     Largest absolute entry of A. An all-zero matrix yields the zero
*     solution right away.
*
      ANORM = SLANGE( 'M', M, N, A, LDA, RWORK )
      IF( ANORM.EQ.ZERO ) THEN
         CALL SLASET( 'Full', MAX( M, N ), NRHS, ZERO, ZERO, B, LDB )
         WORK( 1 ) = SROUNDUP_LWORK( LWKOPT )
         RETURN
      END IF
*
*     Bring A into [SMLNUM,BIGNUM] if it lies outside that range.
*
      ASCALD = .TRUE.
      IF( ANORM.GT.ZERO .AND. ANORM.LT.SMLNUM ) THEN
         ATARG = SMLNUM
      ELSE IF( ANORM.GT.BIGNUM ) THEN
         ATARG = BIGNUM
      ELSE
         ATARG = ONE
         ASCALD = .FALSE.
      END IF
      IF( ASCALD )
     $   CALL SLASCL( 'G', 0, 0, ANORM, ATARG, M, N, A, LDA, INFO )
*
*     Same treatment for the right hand sides, which occupy M rows
*     of B when A is used and N rows when A**T is used.
*
      IF( TRAN ) THEN
         NROWB = N
      ELSE
         NROWB = M
      END IF
      BNORM = SLANGE( 'M', NROWB, NRHS, B, LDB, RWORK )
      BSCALD = .TRUE.
      IF( BNORM.GT.ZERO .AND. BNORM.LT.SMLNUM ) THEN
         BTARG = SMLNUM
      ELSE IF( BNORM.GT.BIGNUM ) THEN
         BTARG = BIGNUM
      ELSE
         BTARG = ONE
         BSCALD = .FALSE.
      END IF
      IF( BSCALD )
     $   CALL SLASCL( 'G', 0, 0, BNORM, BTARG, NROWB, NRHS, B, LDB,
     $                INFO )
*
*     Blocked factorization of A with the compact WY representation
*     of Q: QR when M >= N, LQ when M < N.
*
      USEQR = M.GE.N
      IF( USEQR ) THEN
         CALL SGEQRT( M, N, NB, A, LDA, WORK( 1 ), NB, WORK( IWRK ),
     $                INFO )
      ELSE
         CALL SGELQT( M, N, NB, A, LDA, WORK( 1 ), NB, WORK( IWRK ),
     $                INFO )
      END IF
*
*     Solve. A positive INFO from STRTRS means an exactly zero
*     diagonal entry in the triangular factor; the routine then
*     returns at once with that INFO.
*
      IF( USEQR .AND. .NOT.TRAN ) THEN
*
*        M >= N, A not transposed: overdetermined system,
*        least squares problem min || A * X - B ||.
*
*        B(1:M,1:NRHS) := Q**T * B(1:M,1:NRHS)
*
         CALL SGEMQRT( 'Left', 'Transpose', M, NRHS, N, NB, A, LDA,
     $                 WORK( 1 ), NB, B, LDB, WORK( IWRK ), INFO )
*
*        B(1:N,1:NRHS) := inv(R) * B(1:N,1:NRHS)
*
         CALL STRTRS( 'Upper', 'No transpose', 'Non-unit', N, NRHS,
     $                A, LDA, B, LDB, INFO )
         IF( INFO.GT.0 )
     $      RETURN
*
         NROWX = N
*
      ELSE IF( USEQR ) THEN
*
*        M >= N, A transposed: underdetermined system,
*        minimum norm solution of A**T * X = B.
*
*        B(1:N,1:NRHS) := inv(R**T) * B(1:N,1:NRHS)
*
         CALL STRTRS( 'Upper', 'Transpose', 'Non-unit', N, NRHS, A,
     $                LDA, B, LDB, INFO )
         IF( INFO.GT.0 )
     $      RETURN
*
*        B(N+1:M,1:NRHS) := 0
*
         DO JCOL = 1, NRHS
            DO IROW = N + 1, M
               B( IROW, JCOL ) = ZERO
            END DO
         END DO
*
*        B(1:M,1:NRHS) := Q * B(1:M,1:NRHS)
*
         CALL SGEMQRT( 'Left', 'No transpose', M, NRHS, N, NB, A,
     $                 LDA, WORK( 1 ), NB, B, LDB, WORK( IWRK ),
     $                 INFO )
*
         NROWX = M
*
      ELSE IF( .NOT.TRAN ) THEN
*
*        M < N, A not transposed: underdetermined system,
*        minimum norm solution of A * X = B.
*
*        B(1:M,1:NRHS) := inv(L) * B(1:M,1:NRHS)
*
         CALL STRTRS( 'Lower', 'No transpose', 'Non-unit', M, NRHS,
     $                A, LDA, B, LDB, INFO )
         IF( INFO.GT.0 )
     $      RETURN
*
*        B(M+1:N,1:NRHS) := 0
*
         DO JCOL = 1, NRHS
            DO IROW = M + 1, N
               B( IROW, JCOL ) = ZERO
            END DO
         END DO
*
*        B(1:N,1:NRHS) := Q**T * B(1:N,1:NRHS)
*
         CALL SGEMLQT( 'Left', 'Transpose', N, NRHS, M, NB, A, LDA,
     $                 WORK( 1 ), NB, B, LDB, WORK( IWRK ), INFO )
*
         NROWX = N
*
      ELSE
*
*        M < N, A transposed: overdetermined system,
*        least squares problem min || A**T * X - B ||.
*
*        B(1:N,1:NRHS) := Q * B(1:N,1:NRHS)
*
         CALL SGEMLQT( 'Left', 'No transpose', N, NRHS, M, NB, A,
     $                 LDA, WORK( 1 ), NB, B, LDB, WORK( IWRK ),
     $                 INFO )
*
*        B(1:M,1:NRHS) := inv(L**T) * B(1:M,1:NRHS)
*
         CALL STRTRS( 'Lower', 'Transpose', 'Non-unit', M, NRHS, A,
     $                LDA, B, LDB, INFO )
         IF( INFO.GT.0 )
     $      RETURN
*
         NROWX = M
*
      END IF
*
*     Undo the scaling on the NROWX solution rows. SLASCL multiplies
*     by CTO/CFROM, i.e. by ATARG/ANORM for the scaling applied to A
*     and by BNORM/BTARG for the scaling applied to B.
*
      IF( ASCALD )
     $   CALL SLASCL( 'G', 0, 0, ANORM, ATARG, NROWX, NRHS, B, LDB,
     $                INFO )
      IF( BSCALD )
     $   CALL SLASCL( 'G', 0, 0, BTARG, BNORM, NROWX, NRHS, B, LDB,
     $                INFO )
*
      WORK( 1 ) = SROUNDUP_LWORK( LWKOPT )
*
      RETURN
*
*     End of SGELST
*
      END

xerbla
subroutine xerbla(srname, info)
Definition cblat2.f:3285

sgelqt
subroutine sgelqt(m, n, mb, a, lda, t, ldt, work, info)
SGELQT
Definition sgelqt.f:124

sgelst
subroutine sgelst(trans, m, n, nrhs, a, lda, b, ldb, work, lwork, info)
SGELST solves overdetermined or underdetermined systems for GE matrices using QR or LQ factorization ...
Definition sgelst.f:202

sgemlqt
subroutine sgemlqt(side, trans, m, n, k, mb, v, ldv, t, ldt, c, ldc, work, info)
SGEMLQT
Definition sgemlqt.f:153

sgemqrt
subroutine sgemqrt(side, trans, m, n, k, nb, v, ldv, t, ldt, c, ldc, work, info)
SGEMQRT
Definition sgemqrt.f:166

sgeqrt
subroutine sgeqrt(m, n, nb, a, lda, t, ldt, work, info)
SGEQRT
Definition sgeqrt.f:139

slascl
subroutine slascl(type, kl, ku, cfrom, cto, m, n, a, lda, info)
SLASCL multiplies a general rectangular matrix by a real scalar defined as cto/cfrom.
Definition slascl.f:142

slaset
subroutine slaset(uplo, m, n, alpha, beta, a, lda)
SLASET initializes the off-diagonal elements and the diagonal elements of a matrix to given values.
Definition slaset.f:108

strtrs
subroutine strtrs(uplo, trans, diag, n, nrhs, a, lda, b, ldb, info)
STRTRS
Definition strtrs.f:144