*  d6/d4b/dgelsy_8f_source.html

*> \brief <b> DGELSY solves overdetermined or underdetermined systems for GE matrices</b>

*

*  =========== DOCUMENTATION ===========

*

* Online html documentation available at

*            http://www.netlib.org/lapack/explore-html/

*

*> \htmlonly

*> Download DGELSY + dependencies

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/dgelsy.f">

*> [TGZ]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/dgelsy.f">

*> [ZIP]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/dgelsy.f">

*> [TXT]</a>

*> \endhtmlonly

*

*  Definition:

*  ===========

*

*       SUBROUTINE DGELSY( M, N, NRHS, A, LDA, B, LDB, JPVT, RCOND, RANK,

*                          WORK, LWORK, INFO )

*

*       .. Scalar Arguments ..

*       INTEGER            INFO, LDA, LDB, LWORK, M, N, NRHS, RANK

*       DOUBLE PRECISION   RCOND

*       ..

*       .. Array Arguments ..

*       INTEGER            JPVT( * )

*       DOUBLE PRECISION   A( LDA, * ), B( LDB, * ), WORK( * )

*       ..

*

*

*> \par Purpose:

*  =============

*>

*> \verbatim

*>

*> DGELSY computes the minimum-norm solution to a real linear least

*> squares problem:

*>     minimize || A * X - B ||

*> using a complete orthogonal factorization of A.  A is an M-by-N

*> matrix which may be rank-deficient.

*>

*> Several right hand side vectors b and solution vectors x can be

*> handled in a single call; they are stored as the columns of the

*> M-by-NRHS right hand side matrix B and the N-by-NRHS solution

*> matrix X.

*>

*> The routine first computes a QR factorization with column pivoting:

*>     A * P = Q * [ R11 R12 ]

*>                 [  0  R22 ]

*> with R11 defined as the largest leading submatrix whose estimated

*> condition number is less than 1/RCOND.  The order of R11, RANK,

*> is the effective rank of A.

*>

*> Then, R22 is considered to be negligible, and R12 is annihilated

*> by orthogonal transformations from the right, arriving at the

*> complete orthogonal factorization:

*>    A * P = Q * [ T11 0 ] * Z

*>                [  0  0 ]

*> The minimum-norm solution is then

*>    X = P * Z**T [ inv(T11)*Q1**T*B ]

*>                 [        0         ]

*> where Q1 consists of the first RANK columns of Q.

*>

*> This routine is basically identical to the original xGELSX except

*> for three differences:

*>   o The call to the subroutine xGEQPF has been substituted by the

*>     call to the subroutine xGEQP3. This subroutine is a Blas-3

*>     version of the QR factorization with column pivoting.

*>   o Matrix B (the right hand side) is updated with Blas-3.

*>   o The permutation of matrix B (the right hand side) is faster and

*>     simpler.

*> \endverbatim

*

*  Arguments:

*  ==========

*

*> \param[in] M

*> \verbatim

*>          M is INTEGER

*>          The number of rows of the matrix A.  M >= 0.

*> \endverbatim

*>

*> \param[in] N

*> \verbatim

*>          N is INTEGER

*>          The number of columns of the matrix A.  N >= 0.

*> \endverbatim

*>

*> \param[in] NRHS

*> \verbatim

*>          NRHS is INTEGER

*>          The number of right hand sides, i.e., the number of

*>          columns of matrices B and X. NRHS >= 0.

*> \endverbatim

*>

*> \param[in,out] A

*> \verbatim

*>          A is DOUBLE PRECISION array, dimension (LDA,N)

*>          On entry, the M-by-N matrix A.

*>          On exit, A has been overwritten by details of its

*>          complete orthogonal factorization.

*> \endverbatim

*>

*> \param[in] LDA

*> \verbatim

*>          LDA is INTEGER

*>          The leading dimension of the array A.  LDA >= max(1,M).

*> \endverbatim

*>

*> \param[in,out] B

*> \verbatim

*>          B is DOUBLE PRECISION array, dimension (LDB,NRHS)

*>          On entry, the M-by-NRHS right hand side matrix B.

*>          On exit, the N-by-NRHS solution matrix X.

*> \endverbatim

*>

*> \param[in] LDB

*> \verbatim

*>          LDB is INTEGER

*>          The leading dimension of the array B. LDB >= max(1,M,N).

*> \endverbatim

*>

*> \param[in,out] JPVT

*> \verbatim

*>          JPVT is INTEGER array, dimension (N)

*>          On entry, if JPVT(i) .ne. 0, the i-th column of A is permuted

*>          to the front of AP, otherwise column i is a free column.

*>          On exit, if JPVT(i) = k, then the i-th column of AP

*>          was the k-th column of A.

*> \endverbatim

*>

*> \param[in] RCOND

*> \verbatim

*>          RCOND is DOUBLE PRECISION

*>          RCOND is used to determine the effective rank of A, which

*>          is defined as the order of the largest leading triangular

*>          submatrix R11 in the QR factorization with pivoting of A,

*>          whose estimated condition number < 1/RCOND.

*> \endverbatim

*>

*> \param[out] RANK

*> \verbatim

*>          RANK is INTEGER

*>          The effective rank of A, i.e., the order of the submatrix

*>          R11.  This is the same as the order of the submatrix T11

*>          in the complete orthogonal factorization of A.

*> \endverbatim

*>

*> \param[out] WORK

*> \verbatim

*>          WORK is DOUBLE PRECISION array, dimension (MAX(1,LWORK))

*>          On exit, if INFO = 0, WORK(1) returns the optimal LWORK.

*> \endverbatim

*>

*> \param[in] LWORK

*> \verbatim

*>          LWORK is INTEGER

*>          The dimension of the array WORK.

*>          The unblocked strategy requires that:

*>             LWORK >= MAX( MN+3*N+1, 2*MN+NRHS ),

*>          where MN = min( M, N ).

*>          The block algorithm requires that:

*>             LWORK >= MAX( MN+2*N+NB*(N+1), 2*MN+NB*NRHS ),

*>          where NB is an upper bound on the blocksize returned

*>          by ILAENV for the routines DGEQP3, DTZRZF, DTZRQF, DORMQR,

*>          and DORMRZ.

*>

*>          If LWORK = -1, then a workspace query is assumed; the routine

*>          only calculates the optimal size of the WORK array, returns

*>          this value as the first entry of the WORK array, and no error

*>          message related to LWORK is issued by XERBLA.

*> \endverbatim

*>

*> \param[out] INFO

*> \verbatim

*>          INFO is INTEGER

*>          = 0: successful exit

*>          < 0: If INFO = -i, the i-th argument had an illegal value.

*> \endverbatim

*

*  Authors:

*  ========

*

*> \author Univ. of Tennessee

*> \author Univ. of California Berkeley

*> \author Univ. of Colorado Denver

*> \author NAG Ltd.

*

*> \date November 2011

*

*> \ingroup doubleGEsolve

*

*> \par Contributors:

*  ==================

*>

*>    A. Petitet, Computer Science Dept., Univ. of Tenn., Knoxville, USA \n

*>    E. Quintana-Orti, Depto. de Informatica, Universidad Jaime I, Spain \n

*>    G. Quintana-Orti, Depto. de Informatica, Universidad Jaime I, Spain \n

*>

*  =====================================================================

      SUBROUTINE dgelsy( M, N, NRHS, A, LDA, B, LDB, JPVT, RCOND, RANK,
     $                   work, lwork, info )
*
*  -- LAPACK driver routine (version 3.4.0) --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd.--
*     November 2011
*
*  Purpose
*  -------
*  Computes the minimum-norm solution X of  min || A*X - B ||  for an
*  M-by-N matrix A that may be rank-deficient.  The steps are:
*    1. validate the arguments and compute the workspace sizes;
*    2. scale A and B if their largest entries fall outside
*       [SMLNUM,BIGNUM];
*    3. QR factorization with column pivoting (DGEQP3);
*    4. determine RANK by incremental condition estimation (DLAIC1),
*       growing R11 while  smax*RCOND <= smin;
*    5. annihilate R12 from the right (DTZRZF);
*    6. B := Q**T*B (DORMQR), triangular solve with T11 (DTRSM),
*       zero rows RANK+1:N, B := Y**T*B (DORMRZ), apply P;
*    7. undo the scaling.
*
*  Arguments (see the header documentation for the full contract)
*  ---------
*  M, N, NRHS  (in)     problem dimensions, each must be >= 0.
*  A, LDA      (in/out) matrix and leading dimension, LDA>=max(1,M).
*  B, LDB      (in/out) right hand sides on entry, solution on exit,
*                       LDB >= max(1,M,N).
*  JPVT        (in/out) column pivot information passed to DGEQP3.
*  RCOND       (in)     threshold used for the rank decision.
*  RANK        (out)    effective rank of A.
*  WORK, LWORK          workspace; WORK(1) is set to the optimal LWORK.
*                       LWORK = -1 requests a workspace query only.
*  INFO        (out)    0 on success, -i if argument i is illegal
*                       (-1, -2, -3, -5, -7 or -12 are set here).
*
*     .. Scalar Arguments ..
      INTEGER            info, lda, ldb, lwork, m, n, nrhs, rank
      DOUBLE PRECISION   rcond
*     ..
*     .. Array Arguments ..
      INTEGER            jpvt( * )
      DOUBLE PRECISION   a( lda, * ), b( ldb, * ), work( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     IMAX / IMIN select the job passed to DLAIC1 (largest / smallest
*     singular value estimate).
      INTEGER            imax, imin
      parameter( imax = 1, imin = 2 )
      DOUBLE PRECISION   zero, one
      parameter( zero = 0.0d+0, one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            lquery
      INTEGER            i, iascl, ibscl, ismax, ismin, j, lwkmin,
     $                   lwkopt, mn, nb, nb1, nb2, nb3, nb4
      DOUBLE PRECISION   anrm, bignum, bnrm, c1, c2, s1, s2, smax,
     $                   smaxpr, smin, sminpr, smlnum
*     ..
*     .. External Functions ..
      INTEGER            ilaenv
      DOUBLE PRECISION   dlamch, dlange
      EXTERNAL           ilaenv, dlamch, dlange
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dgeqp3, dlabad, dlaic1, dlascl, dlaset,
     $                   dormqr, dormrz, dtrsm, dtzrzf, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min
*     ..
*     .. Executable Statements ..
*
*     WORK(ISMIN:) and WORK(ISMAX:) hold the two vectors updated by
*     the incremental condition estimation below.
*
      mn = min( m, n )
      ismin = mn + 1
      ismax = 2*mn + 1
*
*     Test the input arguments.
*
      info = 0
      lquery = ( lwork.EQ.-1 )
      IF( m.LT.0 ) THEN
         info = -1
      ELSE IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( nrhs.LT.0 ) THEN
         info = -3
      ELSE IF( lda.LT.max( 1, m ) ) THEN
         info = -5
      ELSE IF( ldb.LT.max( 1, m, n ) ) THEN
         info = -7
      END IF
*
*     Figure out optimal block size
*
      IF( info.EQ.0 ) THEN
         IF( mn.EQ.0 .OR. nrhs.EQ.0 ) THEN
            lwkmin = 1
            lwkopt = 1
         ELSE
            nb1 = ilaenv( 1, 'DGEQRF', ' ', m, n, -1, -1 )
            nb2 = ilaenv( 1, 'DGERQF', ' ', m, n, -1, -1 )
            nb3 = ilaenv( 1, 'DORMQR', ' ', m, n, nrhs, -1 )
            nb4 = ilaenv( 1, 'DORMRQ', ' ', m, n, nrhs, -1 )
            nb = max( nb1, nb2, nb3, nb4 )
*
*           Minimum workspace, as documented for LWORK:
*              MAX( MN+3*N+1, 2*MN+NRHS ).
*           DGEQP3 is handed WORK(MN+1:LWORK) and requires at least
*           3*N+1 entries there, so a smaller minimum would pass
*           this check and then fail inside DGEQP3.  Since MN <= N,
*           MN+3*N+1 also covers the 3*MN entries used by the rank
*           estimation.  2*MN+NRHS covers the calls that receive
*           WORK(2*MN+1:LWORK).
*
            lwkmin = max( mn + 3*n + 1, 2*mn + nrhs )
            lwkopt = max( lwkmin,
     $                    mn + 2*n + nb*( n + 1 ), 2*mn + nb*nrhs )
         END IF
         work( 1 ) = lwkopt
*
         IF( lwork.LT.lwkmin .AND. .NOT.lquery ) THEN
            info = -12
         END IF
      END IF
*
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DGELSY', -info )
         return
      ELSE IF( lquery ) THEN
         return
      END IF
*
*     Quick return if possible
*
      IF( mn.EQ.0 .OR. nrhs.EQ.0 ) THEN
         rank = 0
         return
      END IF
*
*     Get machine parameters
*
      smlnum = dlamch( 'S' ) / dlamch( 'P' )
      bignum = one / smlnum
      CALL dlabad( smlnum, bignum )
*
*     Scale A, B if max entries outside range [SMLNUM,BIGNUM]
*     IASCL / IBSCL record which scaling (0 none, 1 up, 2 down) was
*     applied so that it can be undone at the end.
*
      anrm = dlange( 'M', m, n, a, lda, work )
      iascl = 0
      IF( anrm.GT.zero .AND. anrm.LT.smlnum ) THEN
*
*        Scale matrix norm up to SMLNUM
*
         CALL dlascl( 'G', 0, 0, anrm, smlnum, m, n, a, lda, info )
         iascl = 1
      ELSE IF( anrm.GT.bignum ) THEN
*
*        Scale matrix norm down to BIGNUM
*
         CALL dlascl( 'G', 0, 0, anrm, bignum, m, n, a, lda, info )
         iascl = 2
      ELSE IF( anrm.EQ.zero ) THEN
*
*        Matrix all zero. Return zero solution.
*
         CALL dlaset( 'F', max( m, n ), nrhs, zero, zero, b, ldb )
         rank = 0
         go to 70
      END IF
*
      bnrm = dlange( 'M', m, nrhs, b, ldb, work )
      ibscl = 0
      IF( bnrm.GT.zero .AND. bnrm.LT.smlnum ) THEN
*
*        Scale matrix norm up to SMLNUM
*
         CALL dlascl( 'G', 0, 0, bnrm, smlnum, m, nrhs, b, ldb, info )
         ibscl = 1
      ELSE IF( bnrm.GT.bignum ) THEN
*
*        Scale matrix norm down to BIGNUM
*
         CALL dlascl( 'G', 0, 0, bnrm, bignum, m, nrhs, b, ldb, info )
         ibscl = 2
      END IF
*
*     Compute QR factorization with column pivoting of A:
*        A * P = Q * R
*
      CALL dgeqp3( m, n, a, lda, jpvt, work( 1 ), work( mn+1 ),
     $             lwork-mn, info )
*
*     workspace: MN+2*N+NB*(N+1).
*     Details of Householder rotations stored in WORK(1:MN).
*
*     Determine RANK using incremental condition estimation
*
      work( ismin ) = one
      work( ismax ) = one
      smax = abs( a( 1, 1 ) )
      smin = smax
      IF( abs( a( 1, 1 ) ).EQ.zero ) THEN
         rank = 0
         CALL dlaset( 'F', max( m, n ), nrhs, zero, zero, b, ldb )
         go to 70
      ELSE
         rank = 1
      END IF
*
*     Loop: try to extend R11 by one row/column.  The extension is
*     accepted while  smaxpr*RCOND <= sminpr ; otherwise RANK is final.
*
   10 continue
      IF( rank.LT.mn ) THEN
         i = rank + 1
         CALL dlaic1( imin, rank, work( ismin ), smin, a( 1, i ),
     $                a( i, i ), sminpr, s1, c1 )
         CALL dlaic1( imax, rank, work( ismax ), smax, a( 1, i ),
     $                a( i, i ), smaxpr, s2, c2 )
*
         IF( smaxpr*rcond.LE.sminpr ) THEN
            DO 20 i = 1, rank
               work( ismin+i-1 ) = s1*work( ismin+i-1 )
               work( ismax+i-1 ) = s2*work( ismax+i-1 )
   20       continue
            work( ismin+rank ) = c1
            work( ismax+rank ) = c2
            smin = sminpr
            smax = smaxpr
            rank = rank + 1
            go to 10
         END IF
      END IF
*
*     workspace: 3*MN.
*
*     Logically partition R = [ R11 R12 ]
*                             [  0  R22 ]
*     where R11 = R(1:RANK,1:RANK)
*
*     [R11,R12] = [ T11, 0 ] * Y
*
      IF( rank.LT.n )
     $   CALL dtzrzf( rank, n, a, lda, work( mn+1 ), work( 2*mn+1 ),
     $                lwork-2*mn, info )
*
*     workspace: 2*MN.
*     Details of Householder rotations stored in WORK(MN+1:2*MN)
*
*     B(1:M,1:NRHS) := Q**T * B(1:M,1:NRHS)
*
      CALL dormqr( 'Left', 'Transpose', m, nrhs, mn, a, lda, work( 1 ),
     $             b, ldb, work( 2*mn+1 ), lwork-2*mn, info )
*
*     workspace: 2*MN+NB*NRHS.
*
*     B(1:RANK,1:NRHS) := inv(T11) * B(1:RANK,1:NRHS)
*
      CALL dtrsm( 'Left', 'Upper', 'No transpose', 'Non-unit', rank,
     $            nrhs, one, a, lda, b, ldb )
*
*     Rows RANK+1:N of the intermediate solution are set to zero.
*
      DO 40 j = 1, nrhs
         DO 30 i = rank + 1, n
            b( i, j ) = zero
   30    continue
   40 continue
*
*     B(1:N,1:NRHS) := Y**T * B(1:N,1:NRHS)
*
      IF( rank.LT.n ) THEN
         CALL dormrz( 'Left', 'Transpose', n, nrhs, rank, n-rank, a,
     $                lda, work( mn+1 ), b, ldb, work( 2*mn+1 ),
     $                lwork-2*mn, info )
      END IF
*
*     workspace: 2*MN+NRHS.
*
*     B(1:N,1:NRHS) := P * B(1:N,1:NRHS)
*     Each column is scattered into WORK(1:N) through JPVT and then
*     copied back; WORK(1:N) is overwritten by this step.
*
      DO 60 j = 1, nrhs
         DO 50 i = 1, n
            work( jpvt( i ) ) = b( i, j )
   50    continue
         CALL dcopy( n, work( 1 ), 1, b( 1, j ), 1 )
   60 continue
*
*     workspace: N.
*
*     Undo scaling
*
      IF( iascl.EQ.1 ) THEN
         CALL dlascl( 'G', 0, 0, anrm, smlnum, n, nrhs, b, ldb, info )
         CALL dlascl( 'U', 0, 0, smlnum, anrm, rank, rank, a, lda,
     $                info )
      ELSE IF( iascl.EQ.2 ) THEN
         CALL dlascl( 'G', 0, 0, anrm, bignum, n, nrhs, b, ldb, info )
         CALL dlascl( 'U', 0, 0, bignum, anrm, rank, rank, a, lda,
     $                info )
      END IF
      IF( ibscl.EQ.1 ) THEN
         CALL dlascl( 'G', 0, 0, smlnum, bnrm, n, nrhs, b, ldb, info )
      ELSE IF( ibscl.EQ.2 ) THEN
         CALL dlascl( 'G', 0, 0, bignum, bnrm, n, nrhs, b, ldb, info )
      END IF
*
*     Common exit: report the optimal workspace size in WORK(1).
*
   70 continue
      work( 1 ) = lwkopt
*
      return
*
*     End of DGELSY
*
      END