db/d43/sgesvdq_8f_source.html

*> \brief <b> SGESVDQ computes the singular value decomposition (SVD) with a QR-Preconditioned QR SVD Method for GE matrices</b>

*

*  =========== DOCUMENTATION ===========

*

* Online html documentation available at

*            http://www.netlib.org/lapack/explore-html/

*

*> Download SGESVDQ + dependencies

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/sgesvdq.f">

*> [TGZ]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/sgesvdq.f">

*> [ZIP]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/sgesvdq.f">

*> [TXT]</a>

*

*  Definition:

*  ===========

*

*      SUBROUTINE SGESVDQ( JOBA, JOBP, JOBR, JOBU, JOBV, M, N, A, LDA,

*                          S, U, LDU, V, LDV, NUMRANK, IWORK, LIWORK,

*                          WORK, LWORK, RWORK, LRWORK, INFO )

*

*     .. Scalar Arguments ..

*      IMPLICIT    NONE

*      CHARACTER   JOBA, JOBP, JOBR, JOBU, JOBV

*      INTEGER     M, N, LDA, LDU, LDV, NUMRANK, LIWORK, LWORK, LRWORK,

*                  INFO

*     ..

*     .. Array Arguments ..

*      REAL        A( LDA, * ), U( LDU, * ), V( LDV, * ), WORK( * )

*      REAL        S( * ), RWORK( * )

*      INTEGER     IWORK( * )

*       ..

*

*

*> \par Purpose:

*  =============

*>

*> \verbatim

*>

*> SGESVDQ computes the singular value decomposition (SVD) of a real

*> M-by-N matrix A, where M >= N. The SVD of A is written as

*>                                    [++]   [xx]   [x0]   [xx]

*>              A = U * SIGMA * V^T,  [++] = [xx] * [0x] * [xx]

*>                                    [++]   [xx]

*> where SIGMA is an N-by-N diagonal matrix, U is an M-by-N orthonormal

*> matrix, and V is an N-by-N orthogonal matrix. The diagonal elements

*> of SIGMA are the singular values of A. The columns of U and V are the

*> left and the right singular vectors of A, respectively.

*> \endverbatim

*

*  Arguments:

*  ==========

*

*> \param[in] JOBA

*> \verbatim

*>  JOBA is CHARACTER*1

*>  Specifies the level of accuracy in the computed SVD

*>  = 'A' The requested accuracy corresponds to having the backward

*>        error bounded by || delta A ||_F <= f(m,n) * EPS * || A ||_F,

*>        where EPS = SLAMCH('Epsilon'). This authorises SGESVDQ to

*>        truncate the computed triangular factor in a rank revealing

*>        QR factorization whenever the truncated part is below the

*>        threshold of the order of EPS * ||A||_F. This is aggressive

*>        truncation level.

*>  = 'M' Similarly as with 'A', but the truncation is more gentle: it

*>        is allowed only when there is a drop on the diagonal of the

*>        triangular factor in the QR factorization. This is medium

*>        truncation level.

*>  = 'H' High accuracy requested. No numerical rank determination based

*>        on the rank revealing QR factorization is attempted.

*>  = 'E' Same as 'H', and in addition the condition number of column

*>        scaled A is estimated and returned in  RWORK(1).

*>        N^(-1/4)*RWORK(1) <= ||pinv(A_scaled)||_2 <= N^(1/4)*RWORK(1)

*> \endverbatim

*>

*> \param[in] JOBP

*> \verbatim

*>  JOBP is CHARACTER*1

*>  = 'P' The rows of A are ordered in decreasing order with respect to

*>        ||A(i,:)||_\infty. This enhances numerical accuracy at the cost

*>        of extra data movement. Recommended for numerical robustness.

*>  = 'N' No row pivoting.

*> \endverbatim

*>

*> \param[in] JOBR

*> \verbatim

*>          JOBR is CHARACTER*1

*>          = 'T' After the initial pivoted QR factorization, SGESVD is applied to

*>          the transposed R**T of the computed triangular factor R. This involves

*>          some extra data movement (matrix transpositions). Useful for

*>          experiments, research and development.

*>          = 'N' The triangular factor R is given as input to SGESVD. This may be

*>          preferred as it involves less data movement.

*> \endverbatim

*>

*> \param[in] JOBU

*> \verbatim

*>          JOBU is CHARACTER*1

*>          = 'A' All M left singular vectors are computed and returned in the

*>          matrix U. See the description of U.

*>          = 'S' or 'U' N = min(M,N) left singular vectors are computed and returned

*>          in the matrix U. See the description of U.

*>          = 'R' Numerical rank NUMRANK is determined and only NUMRANK left singular

*>          vectors are computed and returned in the matrix U.

*>          = 'F' The N left singular vectors are returned in factored form as the

*>          product of the Q factor from the initial QR factorization and the

*>          N left singular vectors of (R**T , 0)**T. If row pivoting is used,

*>          then the necessary information on the row pivoting is stored in

*>          IWORK(N+1:N+M-1).

*>          = 'N' The left singular vectors are not computed.

*> \endverbatim

*>

*> \param[in] JOBV

*> \verbatim

*>          JOBV is CHARACTER*1

*>          = 'A', 'V' All N right singular vectors are computed and returned in

*>          the matrix V.

*>          = 'R' Numerical rank NUMRANK is determined and only NUMRANK right singular

*>          vectors are computed and returned in the matrix V. This option is

*>          allowed only if JOBU = 'R' or JOBU = 'N'; otherwise it is illegal.

*>          = 'N' The right singular vectors are not computed.

*> \endverbatim

*>

*> \param[in] M

*> \verbatim

*>          M is INTEGER

*>          The number of rows of the input matrix A.  M >= 0.

*> \endverbatim

*>

*> \param[in] N

*> \verbatim

*>          N is INTEGER

*>          The number of columns of the input matrix A.  M >= N >= 0.

*> \endverbatim

*>

*> \param[in,out] A

*> \verbatim

*>          A is REAL array of dimensions LDA x N

*>          On entry, the input matrix A.

*>          On exit, if JOBU .NE. 'N' or JOBV .NE. 'N', the lower triangle of A contains

*>          the Householder vectors as stored by SGEQP3. If JOBU = 'F', these Householder

*>          vectors together with WORK(1:N) can be used to restore the Q factors from

*>          the initial pivoted QR factorization of A. See the description of U.

*> \endverbatim

*>

*> \param[in] LDA

*> \verbatim

*>          LDA is INTEGER.

*>          The leading dimension of the array A.  LDA >= max(1,M).

*> \endverbatim

*>

*> \param[out] S

*> \verbatim

*>          S is REAL array of dimension N.

*>          The singular values of A, ordered so that S(i) >= S(i+1).

*> \endverbatim

*>

*> \param[out] U

*> \verbatim

*>          U is REAL array, dimension

*>          LDU x M if JOBU = 'A'; see the description of LDU. In this case,

*>          on exit, U contains the M left singular vectors.

*>          LDU x N if JOBU = 'S', 'U', 'R' ; see the description of LDU. In this

*>          case, U contains the leading N or the leading NUMRANK left singular vectors.

*>          LDU x N if JOBU = 'F' ; see the description of LDU. In this case U

*>          contains N x N orthogonal matrix that can be used to form the left

*>          singular vectors.

*>          If JOBU = 'N', U is not referenced.

*> \endverbatim

*>

*> \param[in] LDU

*> \verbatim

*>          LDU is INTEGER.

*>          The leading dimension of the array U.

*>          If JOBU = 'A', 'S', 'U', 'R',  LDU >= max(1,M).

*>          If JOBU = 'F',                 LDU >= max(1,N).

*>          Otherwise,                     LDU >= 1.

*> \endverbatim

*>

*> \param[out] V

*> \verbatim

*>          V is REAL array, dimension

*>          LDV x N if JOBV = 'A', 'V', 'R' or if JOBA = 'E' .

*>          If JOBV = 'A', or 'V',  V contains the N-by-N orthogonal matrix  V**T;

*>          If JOBV = 'R', V contains the first NUMRANK rows of V**T (the right

*>          singular vectors, stored rowwise, of the NUMRANK largest singular values).

*>          If JOBV = 'N' and JOBA = 'E', V is used as a workspace.

*>          If JOBV = 'N', and JOBA.NE.'E', V is not referenced.

*> \endverbatim

*>

*> \param[in] LDV

*> \verbatim

*>          LDV is INTEGER

*>          The leading dimension of the array V.

*>          If JOBV = 'A', 'V', 'R',  or JOBA = 'E', LDV >= max(1,N).

*>          Otherwise,                               LDV >= 1.

*> \endverbatim

*>

*> \param[out] NUMRANK

*> \verbatim

*>          NUMRANK is INTEGER

*>          NUMRANK is the numerical rank first determined after the rank

*>          revealing QR factorization, following the strategy specified by the

*>          value of JOBA. If JOBV = 'R' and JOBU = 'R', only NUMRANK

*>          leading singular values and vectors are then requested in the call

*>          of SGESVD. The final value of NUMRANK might be further reduced if

*>          some singular values are computed as zeros.

*> \endverbatim

*>

*> \param[out] IWORK

*> \verbatim

*>          IWORK is INTEGER array, dimension (max(1, LIWORK)).

*>          On exit, IWORK(1:N) contains column pivoting permutation of the

*>          rank revealing QR factorization.

*>          If JOBP = 'P', IWORK(N+1:N+M-1) contains the indices of the sequence

*>          of row swaps used in row pivoting. These can be used to restore the

*>          left singular vectors in the case JOBU = 'F'.

*>

*>          If LIWORK, LWORK, or LRWORK = -1, then on exit, if INFO = 0,

*>          IWORK(1) returns the minimal LIWORK.

*> \endverbatim

*>

*> \param[in] LIWORK

*> \verbatim

*>          LIWORK is INTEGER

*>          The dimension of the array IWORK.

*>          LIWORK >= N + M - 1,     if JOBP = 'P' and JOBA .NE. 'E';

*>          LIWORK >= N              if JOBP = 'N' and JOBA .NE. 'E';

*>          LIWORK >= N + M - 1 + N, if JOBP = 'P' and JOBA = 'E';

*>          LIWORK >= N + N          if JOBP = 'N' and JOBA = 'E'.

*>

*>          If LIWORK = -1, then a workspace query is assumed; the routine

*>          only calculates and returns the optimal and minimal sizes

*>          for the WORK, IWORK, and RWORK arrays, and no error

*>          message related to LIWORK, LWORK, or LRWORK is issued by XERBLA.

*> \endverbatim

*>

*> \param[out] WORK

*> \verbatim

*>          WORK is REAL array, dimension (max(2, LWORK)), used as a workspace.

*>          On exit, if, on entry, LWORK.NE.-1, WORK(1:N) contains parameters

*>          needed to recover the Q factor from the QR factorization computed by

*>          SGEQP3.

*>

*>          If LIWORK, LWORK, or LRWORK = -1, then on exit, if INFO = 0,

*>          WORK(1) returns the optimal LWORK, and

*>          WORK(2) returns the minimal LWORK.

*> \endverbatim

*>

*> \param[in,out] LWORK

*> \verbatim

*>          LWORK is INTEGER

*>          The dimension of the array WORK. It is determined as follows:

*>          Let  LWQP3 = 3*N+1,  LWCON = 3*N, and let

*>          LWORQ = { MAX( N, 1 ),  if JOBU = 'R', 'S', or 'U'

*>                  { MAX( M, 1 ),  if JOBU = 'A'

*>          LWSVD = MAX( 5*N, 1 )

*>          LWLQF = MAX( N/2, 1 ), LWSVD2 = MAX( 5*(N/2), 1 ), LWORLQ = MAX( N, 1 ),

*>          LWQRF = MAX( N/2, 1 ), LWORQ2 = MAX( N, 1 )

*>          Then the minimal value of LWORK is:

*>          = MAX( N + LWQP3, LWSVD )        if only the singular values are needed;

*>          = MAX( N + LWQP3, LWCON, LWSVD ) if only the singular values are needed,

*>                                   and a scaled condition estimate requested;

*>

*>          = N + MAX( LWQP3, LWSVD, LWORQ ) if the singular values and the left

*>                                   singular vectors are requested;

*>          = N + MAX( LWQP3, LWCON, LWSVD, LWORQ ) if the singular values and the left

*>                                   singular vectors are requested, and also

*>                                   a scaled condition estimate requested;

*>

*>          = N + MAX( LWQP3, LWSVD )        if the singular values and the right

*>                                   singular vectors are requested;

*>          = N + MAX( LWQP3, LWCON, LWSVD ) if the singular values and the right

*>                                   singular vectors are requested, and also

*>                                   a scaled condition estimate requested;

*>

*>          = N + MAX( LWQP3, LWSVD, LWORQ ) if the full SVD is requested with JOBV = 'R';

*>                                   independent of JOBR;

*>          = N + MAX( LWQP3, LWCON, LWSVD, LWORQ ) if the full SVD is requested,

*>                                   JOBV = 'R' and, also a scaled condition

*>                                   estimate requested; independent of JOBR;

*>          = MAX( N + MAX( LWQP3, LWSVD, LWORQ ),

*>         N + MAX( LWQP3, N/2+LWLQF, N/2+LWSVD2, N/2+LWORLQ, LWORQ) ) if the

*>                         full SVD is requested with JOBV = 'A' or 'V', and

*>                         JOBR ='N'

*>          = MAX( N + MAX( LWQP3, LWCON, LWSVD, LWORQ ),

*>         N + MAX( LWQP3, LWCON, N/2+LWLQF, N/2+LWSVD2, N/2+LWORLQ, LWORQ ) )

*>                         if the full SVD is requested with JOBV = 'A' or 'V', and

*>                         JOBR ='N', and also a scaled condition number estimate

*>                         requested.

*>          = MAX( N + MAX( LWQP3, LWSVD, LWORQ ),

*>         N + MAX( LWQP3, N/2+LWQRF, N/2+LWSVD2, N/2+LWORQ2, LWORQ ) ) if the

*>                         full SVD is requested with JOBV = 'A', 'V', and JOBR ='T'

*>          = MAX( N + MAX( LWQP3, LWCON, LWSVD, LWORQ ),

*>         N + MAX( LWQP3, LWCON, N/2+LWQRF, N/2+LWSVD2, N/2+LWORQ2, LWORQ ) )

*>                         if the full SVD is requested with JOBV = 'A' or 'V', and

*>                         JOBR ='T', and also a scaled condition number estimate

*>                         requested.

*>          Finally, LWORK must be at least two: LWORK = MAX( 2, LWORK ).

*>

*>          If LWORK = -1, then a workspace query is assumed; the routine

*>          only calculates and returns the optimal and minimal sizes

*>          for the WORK, IWORK, and RWORK arrays, and no error

*>          message related to LWORK is issued by XERBLA.

*> \endverbatim

*>

*> \param[out] RWORK

*> \verbatim

*>          RWORK is REAL array, dimension (max(1, LRWORK)).

*>          On exit,

*>          1. If JOBA = 'E', RWORK(1) contains an estimate of the condition

*>          number of column scaled A. If A = C * D where D is diagonal and C

*>          has unit columns in the Euclidean norm, then, assuming full column rank,

*>          N^(-1/4) * RWORK(1) <= ||pinv(C)||_2 <= N^(1/4) * RWORK(1).

*>          Otherwise, RWORK(1) = -1.

*>          2. RWORK(2) contains the number of singular values computed as

*>          exact zeros in SGESVD applied to the upper triangular or trapezoidal

*>          R (from the initial QR factorization). In case of early exit (no call to

*>          SGESVD, such as in the case of zero matrix) RWORK(2) = -1.

*>

*>          If LIWORK, LWORK, or LRWORK = -1, then on exit, if INFO = 0,

*>          RWORK(1) returns the minimal LRWORK.

*> \endverbatim

*>

*> \param[in] LRWORK

*> \verbatim

*>          LRWORK is INTEGER.

*>          The dimension of the array RWORK.

*>          If JOBP ='P', then LRWORK >= MAX(2, M).

*>          Otherwise, LRWORK >= 2

*>

*>          If LRWORK = -1, then a workspace query is assumed; the routine

*>          only calculates and returns the optimal and minimal sizes

*>          for the WORK, IWORK, and RWORK arrays, and no error

*>          message related to LIWORK, LWORK, or LRWORK is issued by XERBLA.

*> \endverbatim

*>

*> \param[out] INFO

*> \verbatim

*>          INFO is INTEGER

*>          = 0:  successful exit.

*>          < 0:  if INFO = -i, the i-th argument had an illegal value.

*>          > 0:  if SBDSQR did not converge, INFO specifies how many superdiagonals

*>          of an intermediate bidiagonal form B (computed in SGESVD) did not

*>          converge to zero.

*> \endverbatim

*

*> \par Further Details:

*  ========================

*>

*> \verbatim

*>

*>   1. The data movement (matrix transpose) is coded using simple nested

*>   DO-loops because BLAS and LAPACK do not provide corresponding subroutines.

*>   Those DO-loops are easily identified in this source code - by the CONTINUE

*>   statements labeled with 11**. In an optimized version of this code, the

*>   nested DO loops should be replaced with calls to an optimized subroutine.

*>   2. This code scales A by 1/SQRT(M) if the largest ABS(A(i,j)) could cause

*>   column norm overflow. This is the minimal precaution and it is left to the

*>   SVD routine (SGESVD) to do its own preemptive scaling if potential over-

*>   or underflows are detected. To avoid repeated scanning of the array A,

*>   an optimal implementation would do all necessary scaling before calling

*>   SGESVD and the scaling in SGESVD can be switched off.

*>   3. Other comments related to code optimization are given in comments in the

*>   code, enclosed in [[double brackets]].

*> \endverbatim

*

*> \par Bugs, examples and comments

*  ===========================

*

*> \verbatim

*>  Please report all bugs and send interesting examples and/or comments to

*>  drmac@math.hr. Thank you.

*> \endverbatim

*

*> \par References

*  ===============

*

*> \verbatim

*>  [1] Zlatko Drmac, Algorithm 977: A QR-Preconditioned QR SVD Method for

*>      Computing the SVD with High Accuracy. ACM Trans. Math. Softw.

*>      44(1): 11:1-11:30 (2017)

*>

*>  SIGMA library, xGESVDQ section updated February 2016.

*>  Developed and coded by Zlatko Drmac, Department of Mathematics

*>  University of Zagreb, Croatia, drmac@math.hr

*> \endverbatim

*

*

*> \par Contributors:

*  ==================

*>

*> \verbatim

*> Developed and coded by Zlatko Drmac, Department of Mathematics

*>  University of Zagreb, Croatia, drmac@math.hr

*> \endverbatim

*

*  Authors:

*  ========

*

*> \author Univ. of Tennessee

*> \author Univ. of California Berkeley

*> \author Univ. of Colorado Denver

*> \author NAG Ltd.

*

*> \ingroup gesvdq

*

*  =====================================================================


      SUBROUTINE sgesvdq( JOBA, JOBP, JOBR, JOBU, JOBV, M, N, A, LDA,

     $                    S, U, LDU, V, LDV, NUMRANK, IWORK, LIWORK,

     $                    WORK, LWORK, RWORK, LRWORK, INFO )

*     .. Scalar Arguments ..

      IMPLICIT    NONE

      CHARACTER   JOBA, JOBP, JOBR, JOBU, JOBV

      INTEGER     M, N, LDA, LDU, LDV, NUMRANK, LIWORK, LWORK, LRWORK,

     $            info

*     ..

*     .. Array Arguments ..

      REAL        A( LDA, * ), U( LDU, * ), V( LDV, * ), WORK( * )

      REAL        S( * ), RWORK( * )

      INTEGER     IWORK( * )

*

*  =====================================================================

*

*     .. Parameters ..

      REAL        ZERO,         ONE

      PARAMETER ( ZERO = 0.0e0, one = 1.0e0 )

*     ..

*     .. Local Scalars ..

      INTEGER     IERR, IWOFF, NR, N1, OPTRATIO, p, q

      INTEGER     LWCON, LWQP3, LWRK_SGELQF, LWRK_SGESVD, LWRK_SGESVD2,

     $            lwrk_sgeqp3,  lwrk_sgeqrf, lwrk_sormlq, lwrk_sormqr,

     $            lwrk_sormqr2, lwlqf, lwqrf, lwsvd, lwsvd2, lworq,

     $            lworq2, lwunlq, minwrk, minwrk2, optwrk, optwrk2,

     $            iminwrk, rminwrk

      LOGICAL     ACCLA,  ACCLM, ACCLH, ASCALED, CONDA, DNTWU,  DNTWV,

     $            LQUERY, LSVC0, LSVEC, ROWPRM,  RSVEC, RTRANS, WNTUA,

     $            wntuf,  wntur, wntus, wntva,   wntvr

      REAL        BIG, EPSLN, RTMP, SCONDA, SFMIN

*     ..

*     .. Local Arrays

      REAL        RDUMMY(1)

*     ..

*     .. External Subroutines (BLAS, LAPACK)

      EXTERNAL    sgelqf, sgeqp3, sgeqrf, sgesvd, slacpy,

     $            slapmt, slascl, slaset, slaswp, sscal,

     $            spocon, sormlq, sormqr, xerbla

*     ..

*     .. External Functions (BLAS, LAPACK)

      LOGICAL    LSAME

      INTEGER    ISAMAX

      REAL        SLANGE, SNRM2, SLAMCH

      EXTERNAL    slange, lsame, isamax, snrm2, slamch

*     ..

*     .. Intrinsic Functions ..

      INTRINSIC   abs, max, min, real, sqrt

*     ..

*     .. Executable Statements ..

*

*     Test the input arguments

*

      wntus  = lsame( jobu, 'S' ) .OR. lsame( jobu, 'U' )

      wntur  = lsame( jobu, 'R' )

      wntua  = lsame( jobu, 'A' )

      wntuf  = lsame( jobu, 'F' )

      lsvc0  = wntus .OR. wntur .OR. wntua

      lsvec  = lsvc0 .OR. wntuf

      dntwu  = lsame( jobu, 'N' )

*

      wntvr  = lsame( jobv, 'R' )

      wntva  = lsame( jobv, 'A' ) .OR. lsame( jobv, 'V' )

      rsvec  = wntvr .OR. wntva

      dntwv  = lsame( jobv, 'N' )

*

      accla  = lsame( joba, 'A' )

      acclm  = lsame( joba, 'M' )

      conda  = lsame( joba, 'E' )

      acclh  = lsame( joba, 'H' ) .OR. conda

*

      rowprm = lsame( jobp, 'P' )

      rtrans = lsame( jobr, 'T' )

*

      IF ( rowprm ) THEN

         IF ( conda ) THEN

            iminwrk = max( 1, n + m - 1 + n )

         ELSE

            iminwrk = max( 1, n + m - 1 )

         END IF

         rminwrk = max( 2, m )

      ELSE

         IF ( conda ) THEN

            iminwrk = max( 1, n + n )

         ELSE

            iminwrk = max( 1, n )

         END IF

         rminwrk = 2

      END IF

      lquery = (liwork .EQ. -1 .OR. lwork .EQ. -1 .OR. lrwork .EQ. -1)

      info  = 0

      IF ( .NOT. ( accla .OR. acclm .OR. acclh ) ) THEN

         info = -1

      ELSE IF ( .NOT.( rowprm .OR. lsame( jobp, 'N' ) ) ) THEN

          info = -2

      ELSE IF ( .NOT.( rtrans .OR. lsame( jobr, 'N' ) ) ) THEN

          info = -3

      ELSE IF ( .NOT.( lsvec .OR. dntwu ) ) THEN

         info = -4

      ELSE IF ( wntur .AND. wntva ) THEN

         info = -5

      ELSE IF ( .NOT.( rsvec .OR. dntwv )) THEN

         info = -5

      ELSE IF ( m.LT.0 ) THEN

         info = -6

      ELSE IF ( ( n.LT.0 ) .OR. ( n.GT.m ) ) THEN

         info = -7

      ELSE IF ( lda.LT.max( 1, m ) ) THEN

         info = -9

      ELSE IF ( ldu.LT.1 .OR. ( lsvc0 .AND. ldu.LT.m ) .OR.

     $       ( wntuf .AND. ldu.LT.n ) ) THEN

         info = -12

      ELSE IF ( ldv.LT.1 .OR. ( rsvec .AND. ldv.LT.n ) .OR.

     $          ( conda .AND. ldv.LT.n ) ) THEN

         info = -14

      ELSE IF ( liwork .LT. iminwrk .AND. .NOT. lquery ) THEN

         info = -17

      END IF

*

*

      IF ( info .EQ. 0 ) THEN

*        .. compute the minimal and the optimal workspace lengths

*        [[The expressions for computing the minimal and the optimal

*        values of LWORK are written with a lot of redundancy and

*        can be simplified. However, this detailed form is easier for

*        maintenance and modifications of the code.]]

*

*        .. minimal workspace length for SGEQP3 of an M x N matrix

         lwqp3 = 3 * n + 1

*        .. minimal workspace length for SORMQR to build left singular vectors

         IF ( wntus .OR. wntur ) THEN

             lworq  = max( n  , 1 )

         ELSE IF ( wntua ) THEN

             lworq = max( m , 1 )

         END IF

*        .. minimal workspace length for SPOCON of an N x N matrix

         lwcon = 3 * n

*        .. SGESVD of an N x N matrix

         lwsvd = max( 5 * n, 1 )

         IF ( lquery ) THEN

             CALL sgeqp3( m, n, a, lda, iwork, rdummy, rdummy, -1,

     $           ierr )

             lwrk_sgeqp3 = int( rdummy(1) )

             IF ( wntus .OR. wntur ) THEN

                 CALL sormqr( 'L', 'N', m, n, n, a, lda, rdummy, u,

     $                ldu, rdummy, -1, ierr )

                 lwrk_sormqr = int( rdummy(1) )

             ELSE IF ( wntua ) THEN

                 CALL sormqr( 'L', 'N', m, m, n, a, lda, rdummy, u,

     $                ldu, rdummy, -1, ierr )

                 lwrk_sormqr = int( rdummy(1) )

             ELSE

                 lwrk_sormqr = 0

             END IF

         END IF

         minwrk = 2

         optwrk = 2

         IF ( .NOT. (lsvec .OR. rsvec )) THEN

*            .. minimal and optimal sizes of the workspace if

*            only the singular values are requested

             IF ( conda ) THEN

                minwrk = max( n+lwqp3, lwcon, lwsvd )

             ELSE

                minwrk = max( n+lwqp3, lwsvd )

             END IF

             IF ( lquery ) THEN

                 CALL sgesvd( 'N', 'N', n, n, a, lda, s, u, ldu,

     $                v, ldv, rdummy, -1, ierr )

                 lwrk_sgesvd = int( rdummy(1) )

                 IF ( conda ) THEN

                    optwrk = max( n+lwrk_sgeqp3, n+lwcon, lwrk_sgesvd )

                 ELSE

                    optwrk = max( n+lwrk_sgeqp3, lwrk_sgesvd )

                 END IF

             END IF

         ELSE IF ( lsvec .AND. (.NOT.rsvec) ) THEN

*            .. minimal and optimal sizes of the workspace if the

*            singular values and the left singular vectors are requested

             IF ( conda ) THEN

                 minwrk = n + max( lwqp3, lwcon, lwsvd, lworq )

             ELSE

                 minwrk = n + max( lwqp3, lwsvd, lworq )

             END IF

             IF ( lquery ) THEN

                IF ( rtrans ) THEN

                   CALL sgesvd( 'N', 'O', n, n, a, lda, s, u, ldu,

     $                  v, ldv, rdummy, -1, ierr )

                ELSE

                   CALL sgesvd( 'O', 'N', n, n, a, lda, s, u, ldu,

     $                  v, ldv, rdummy, -1, ierr )

                END IF

                lwrk_sgesvd = int( rdummy(1) )

                IF ( conda ) THEN

                    optwrk = n + max( lwrk_sgeqp3, lwcon, lwrk_sgesvd,

     $                               lwrk_sormqr )

                ELSE

                    optwrk = n + max( lwrk_sgeqp3, lwrk_sgesvd,

     $                               lwrk_sormqr )

                END IF

             END IF

         ELSE IF ( rsvec .AND. (.NOT.lsvec) ) THEN

*            .. minimal and optimal sizes of the workspace if the

*            singular values and the right singular vectors are requested

             IF ( conda ) THEN

                 minwrk = n + max( lwqp3, lwcon, lwsvd )

             ELSE

                 minwrk = n + max( lwqp3, lwsvd )

             END IF

             IF ( lquery ) THEN

                 IF ( rtrans ) THEN

                     CALL sgesvd( 'O', 'N', n, n, a, lda, s, u, ldu,

     $                    v, ldv, rdummy, -1, ierr )

                 ELSE

                     CALL sgesvd( 'N', 'O', n, n, a, lda, s, u, ldu,

     $                    v, ldv, rdummy, -1, ierr )

                 END IF

                 lwrk_sgesvd = int( rdummy(1) )

                 IF ( conda ) THEN

                     optwrk = n + max( lwrk_sgeqp3, lwcon, lwrk_sgesvd )

                 ELSE

                     optwrk = n + max( lwrk_sgeqp3, lwrk_sgesvd )

                 END IF

             END IF

         ELSE

*            .. minimal and optimal sizes of the workspace if the

*            full SVD is requested

             IF ( rtrans ) THEN

                 minwrk = max( lwqp3, lwsvd, lworq )

                 IF ( conda ) minwrk = max( minwrk, lwcon )

                 minwrk = minwrk + n

                 IF ( wntva ) THEN

*                   .. minimal workspace length for N x N/2 SGEQRF

                    lwqrf  = max( n/2, 1 )

*                   .. minimal workspace length for N/2 x N/2 SGESVD

                    lwsvd2 = max( 5 * (n/2), 1 )

                    lworq2 = max( n, 1 )

                    minwrk2 = max( lwqp3, n/2+lwqrf, n/2+lwsvd2,

     $                        n/2+lworq2, lworq )

                    IF ( conda ) minwrk2 = max( minwrk2, lwcon )

                    minwrk2 = n + minwrk2

                    minwrk = max( minwrk, minwrk2 )

                 END IF

             ELSE

                 minwrk = max( lwqp3, lwsvd, lworq )

                 IF ( conda ) minwrk = max( minwrk, lwcon )

                 minwrk = minwrk + n

                 IF ( wntva ) THEN

*                   .. minimal workspace length for N/2 x N SGELQF

                    lwlqf  = max( n/2, 1 )

                    lwsvd2 = max( 5 * (n/2), 1 )

                    lwunlq = max( n , 1 )

                    minwrk2 = max( lwqp3, n/2+lwlqf, n/2+lwsvd2,

     $                        n/2+lwunlq, lworq )

                    IF ( conda ) minwrk2 = max( minwrk2, lwcon )

                    minwrk2 = n + minwrk2

                    minwrk = max( minwrk, minwrk2 )

                 END IF

             END IF

             IF ( lquery ) THEN

                IF ( rtrans ) THEN

                   CALL sgesvd( 'O', 'A', n, n, a, lda, s, u, ldu,

     $                  v, ldv, rdummy, -1, ierr )

                   lwrk_sgesvd = int( rdummy(1) )

                   optwrk = max(lwrk_sgeqp3,lwrk_sgesvd,lwrk_sormqr)

                   IF ( conda ) optwrk = max( optwrk, lwcon )

                   optwrk = n + optwrk

                   IF ( wntva ) THEN

                       CALL sgeqrf(n,n/2,u,ldu,rdummy,rdummy,-1,ierr)

                       lwrk_sgeqrf = int( rdummy(1) )

                       CALL sgesvd( 'S', 'O', n/2,n/2, v,ldv, s, u,

     $                              ldu,

     $                      v, ldv, rdummy, -1, ierr )

                       lwrk_sgesvd2 = int( rdummy(1) )

                       CALL sormqr( 'R', 'C', n, n, n/2, u, ldu,

     $                              rdummy,

     $                      v, ldv, rdummy, -1, ierr )

                       lwrk_sormqr2 = int( rdummy(1) )

                       optwrk2 = max( lwrk_sgeqp3, n/2+lwrk_sgeqrf,

     $                           n/2+lwrk_sgesvd2, n/2+lwrk_sormqr2 )

                       IF ( conda ) optwrk2 = max( optwrk2, lwcon )

                       optwrk2 = n + optwrk2

                       optwrk = max( optwrk, optwrk2 )

                   END IF

                ELSE

                   CALL sgesvd( 'S', 'O', n, n, a, lda, s, u, ldu,

     $                  v, ldv, rdummy, -1, ierr )

                   lwrk_sgesvd = int( rdummy(1) )

                   optwrk = max(lwrk_sgeqp3,lwrk_sgesvd,lwrk_sormqr)

                   IF ( conda ) optwrk = max( optwrk, lwcon )

                   optwrk = n + optwrk

                   IF ( wntva ) THEN

                      CALL sgelqf(n/2,n,u,ldu,rdummy,rdummy,-1,ierr)

                      lwrk_sgelqf = int( rdummy(1) )

                      CALL sgesvd( 'S','O', n/2,n/2, v, ldv, s, u,

     $                             ldu,

     $                     v, ldv, rdummy, -1, ierr )

                      lwrk_sgesvd2 = int( rdummy(1) )

                      CALL sormlq( 'R', 'N', n, n, n/2, u, ldu,

     $                             rdummy,

     $                     v, ldv, rdummy,-1,ierr )

                      lwrk_sormlq = int( rdummy(1) )

                      optwrk2 = max( lwrk_sgeqp3, n/2+lwrk_sgelqf,

     $                           n/2+lwrk_sgesvd2, n/2+lwrk_sormlq )

                       IF ( conda ) optwrk2 = max( optwrk2, lwcon )

                       optwrk2 = n + optwrk2

                       optwrk = max( optwrk, optwrk2 )

                   END IF

                END IF

             END IF

         END IF

*

         minwrk = max( 2, minwrk )

         optwrk = max( 2, optwrk )

         IF ( lwork .LT. minwrk .AND. (.NOT.lquery) ) info = -19

*

      END IF

*

      IF (info .EQ. 0 .AND. lrwork .LT. rminwrk .AND. .NOT. lquery) THEN

         info = -21

      END IF

      IF( info.NE.0 ) THEN

         CALL xerbla( 'SGESVDQ', -info )

         RETURN

      ELSE IF ( lquery ) THEN

*

*     Return optimal workspace

*

          iwork(1) = iminwrk

          work(1) = real( optwrk )

          work(2) = real( minwrk )

          rwork(1) = real( rminwrk )

          RETURN

      END IF

*

*     Quick return if the matrix is void.

*

      IF( ( m.EQ.0 ) .OR. ( n.EQ.0 ) ) THEN

*     .. all output is void.

         RETURN

      END IF

*

      big = slamch('O')

      ascaled = .false.

      iwoff = 1

      IF ( rowprm ) THEN

            iwoff = m

*           .. reordering the rows in decreasing sequence in the

*           ell-infinity norm - this enhances numerical robustness in

*           the case of differently scaled rows.

            DO 1904 p = 1, m

*               RWORK(p) = ABS( A(p,ICAMAX(N,A(p,1),LDA)) )

*               [[SLANGE will return NaN if an entry of the p-th row is NaN]]

                rwork(p) = slange( 'M', 1, n, a(p,1), lda, rdummy )

*               .. check for NaN's and Inf's

                IF ( ( rwork(p) .NE. rwork(p) ) .OR.

     $               ( (rwork(p)*zero) .NE. zero ) ) THEN

                    info = -8

                    CALL xerbla( 'SGESVDQ', -info )

                    RETURN

                END IF

 1904       CONTINUE

            DO 1952 p = 1, m - 1

            q = isamax( m-p+1, rwork(p), 1 ) + p - 1

            iwork(n+p) = q

            IF ( p .NE. q ) THEN

               rtmp     = rwork(p)

               rwork(p) = rwork(q)

               rwork(q) = rtmp

            END IF

 1952       CONTINUE

*

            IF ( rwork(1) .EQ. zero ) THEN

*              Quick return: A is the M x N zero matrix.

               numrank = 0

               CALL slaset( 'G', n, 1, zero, zero, s, n )

               IF ( wntus ) CALL slaset('G', m, n, zero, one, u, ldu)

               IF ( wntua ) CALL slaset('G', m, m, zero, one, u, ldu)

               IF ( wntva ) CALL slaset('G', n, n, zero, one, v, ldv)

               IF ( wntuf ) THEN

                   CALL slaset( 'G', n, 1, zero, zero, work, n )

                   CALL slaset( 'G', m, n, zero,  one, u, ldu )

               END IF

               DO 5001 p = 1, n

                   iwork(p) = p

 5001          CONTINUE

               IF ( rowprm ) THEN

                   DO 5002 p = n + 1, n + m - 1

                       iwork(p) = p - n

 5002              CONTINUE

               END IF

               IF ( conda ) rwork(1) = -1

               rwork(2) = -1

               RETURN

            END IF

*

            IF ( rwork(1) .GT. big / sqrt(real(m)) ) THEN

*               .. to prevent overflow in the QR factorization, scale the

*               matrix by 1/sqrt(M) if too large entry detected

                CALL slascl('G',0,0,sqrt(real(m)),one, m,n, a,lda,

     $                       ierr)

                ascaled = .true.

            END IF

            CALL slaswp( n, a, lda, 1, m-1, iwork(n+1), 1 )

      END IF

*

*    .. At this stage, preemptive scaling is done only to avoid column

*    norms overflows during the QR factorization. The SVD procedure should

*    have its own scaling to save the singular values from overflows and

*    underflows. That depends on the SVD procedure.

*

      IF ( .NOT.rowprm ) THEN

          rtmp = slange( 'M', m, n, a, lda, rdummy )

          IF ( ( rtmp .NE. rtmp ) .OR.

     $         ( (rtmp*zero) .NE. zero ) ) THEN

               info = -8

               CALL xerbla( 'SGESVDQ', -info )

               RETURN

          END IF

          IF ( rtmp .GT. big / sqrt(real(m)) ) THEN

*             .. to prevent overflow in the QR factorization, scale the

*             matrix by 1/sqrt(M) if too large entry detected

              CALL slascl('G',0,0, sqrt(real(m)),one, m,n, a,lda,

     $                     ierr)

              ascaled = .true.

          END IF

      END IF

*

*     .. QR factorization with column pivoting

*

*     A * P = Q * [ R ]

*                 [ 0 ]

*

      DO 1963 p = 1, n

*        .. all columns are free columns

         iwork(p) = 0

 1963 CONTINUE

      CALL sgeqp3( m, n, a, lda, iwork, work, work(n+1), lwork-n,

     $      ierr )

*

*    If the user requested accuracy level allows truncation in the

*    computed upper triangular factor, the matrix R is examined and,

*    if possible, replaced with its leading upper trapezoidal part.

*

      epsln = slamch('E')

      sfmin = slamch('S')

*     SMALL = SFMIN / EPSLN

      nr = n

*

      IF ( accla ) THEN

*

*        Standard absolute error bound suffices. All sigma_i with

*        sigma_i < N*EPS*||A||_F are flushed to zero. This is an

*        aggressive enforcement of lower numerical rank by introducing a

*        backward error of the order of N*EPS*||A||_F.

         nr = 1

         rtmp = sqrt(real(n))*epsln

         DO 3001 p = 2, n

            IF ( abs(a(p,p)) .LT. (rtmp*abs(a(1,1))) ) GO TO 3002

               nr = nr + 1

 3001    CONTINUE

 3002    CONTINUE

*

      ELSEIF ( acclm ) THEN

*        .. similarly as above, only slightly more gentle (less aggressive).

*        Sudden drop on the diagonal of R is used as the criterion for being

*        close-to-rank-deficient. The threshold is set to EPSLN=SLAMCH('E').

*        [[This can be made more flexible by replacing this hard-coded value

*        with a user specified threshold.]] Also, the values that underflow

*        will be truncated.

         nr = 1

         DO 3401 p = 2, n

            IF ( ( abs(a(p,p)) .LT. (epsln*abs(a(p-1,p-1))) ) .OR.

     $           ( abs(a(p,p)) .LT. sfmin ) ) GO TO 3402

            nr = nr + 1

 3401    CONTINUE

 3402    CONTINUE

*

      ELSE

*        .. RRQR not authorized to determine numerical rank except in the

*        obvious case of zero pivots.

*        .. inspect R for exact zeros on the diagonal;

*        R(i,i)=0 => R(i:N,i:N)=0.

         nr = 1

         DO 3501 p = 2, n

            IF ( abs(a(p,p)) .EQ. zero ) GO TO 3502

            nr = nr + 1

 3501    CONTINUE

 3502    CONTINUE

*

         IF ( conda ) THEN

*           Estimate the scaled condition number of A. Use the fact that it is

*           the same as the scaled condition number of R.

*              .. V is used as workspace

               CALL slacpy( 'U', n, n, a, lda, v, ldv )

*              Only the leading NR x NR submatrix of the triangular factor

*              is considered. Only if NR=N will this give a reliable error

*              bound. However, even for NR < N, this can be used on an

*              expert level and obtain useful information in the sense of

*              perturbation theory.

               DO 3053 p = 1, nr

                  rtmp = snrm2( p, v(1,p), 1 )

                  CALL sscal( p, one/rtmp, v(1,p), 1 )

 3053          CONTINUE

               IF ( .NOT. ( lsvec .OR. rsvec ) ) THEN

                   CALL spocon( 'U', nr, v, ldv, one, rtmp,

     $                  work, iwork(n+iwoff), ierr )

               ELSE

                   CALL spocon( 'U', nr, v, ldv, one, rtmp,

     $                  work(n+1), iwork(n+iwoff), ierr )

               END IF

               sconda = one / sqrt(rtmp)

*           For NR=N, SCONDA is an estimate of SQRT(||(R^* * R)^(-1)||_1),

*           N^(-1/4) * SCONDA <= ||R^(-1)||_2 <= N^(1/4) * SCONDA

*           See the reference [1] for more details.

         END IF

*

      ENDIF

*

      IF ( wntur ) THEN

          n1 = nr

      ELSE IF ( wntus .OR. wntuf) THEN

          n1 = n

      ELSE IF ( wntua ) THEN

          n1 = m

      END IF

*

      IF ( .NOT. ( rsvec .OR. lsvec ) ) THEN

*.......................................................................

*        .. only the singular values are requested

*.......................................................................

         IF ( rtrans ) THEN

*

*         .. compute the singular values of R**T = [A](1:NR,1:N)**T

*           .. set the lower triangle of [A] to [A](1:NR,1:N)**T and

*           the upper triangle of [A] to zero.

            DO 1146 p = 1, min( n, nr )

               DO 1147 q = p + 1, n

                  a(q,p) = a(p,q)

                  IF ( q .LE. nr ) a(p,q) = zero

 1147          CONTINUE

 1146       CONTINUE

*

            CALL sgesvd( 'N', 'N', n, nr, a, lda, s, u, ldu,

     $           v, ldv, work, lwork, info )

*

         ELSE

*

*           .. compute the singular values of R = [A](1:NR,1:N)

*

            IF ( nr .GT. 1 )

     $          CALL slaset( 'L', nr-1,nr-1, zero,zero, a(2,1), lda )

            CALL sgesvd( 'N', 'N', nr, n, a, lda, s, u, ldu,

     $           v, ldv, work, lwork, info )

*

         END IF

*

      ELSE IF ( lsvec .AND. ( .NOT. rsvec) ) THEN

*.......................................................................

*       .. the singular values and the left singular vectors requested

*.......................................................................

         IF ( rtrans ) THEN

*            .. apply SGESVD to R**T

*            .. copy R**T into [U] and overwrite [U] with the right singular

*            vectors of R

            DO 1192 p = 1, nr

               DO 1193 q = p, n

                  u(q,p) = a(p,q)

 1193          CONTINUE

 1192       CONTINUE

            IF ( nr .GT. 1 )

     $          CALL slaset( 'U', nr-1,nr-1, zero,zero, u(1,2), ldu )

*           .. the left singular vectors not computed, the NR right singular

*           vectors overwrite [U](1:NR,1:NR) as transposed. These

*           will be pre-multiplied by Q to build the left singular vectors of A.

               CALL sgesvd( 'N', 'O', n, nr, u, ldu, s, u, ldu,

     $              u, ldu, work(n+1), lwork-n, info )

*

               DO 1119 p = 1, nr

                   DO 1120 q = p + 1, nr

                      rtmp   = u(q,p)

                      u(q,p) = u(p,q)

                      u(p,q) = rtmp

 1120              CONTINUE

 1119          CONTINUE

*

         ELSE

*            .. apply SGESVD to R

*            .. copy R into [U] and overwrite [U] with the left singular vectors

             CALL slacpy( 'U', nr, n, a, lda, u, ldu )

             IF ( nr .GT. 1 )

     $         CALL slaset( 'L', nr-1, nr-1, zero, zero, u(2,1),

     $                      ldu )

*            .. the right singular vectors not computed, the NR left singular

*            vectors overwrite [U](1:NR,1:NR)

                CALL sgesvd( 'O', 'N', nr, n, u, ldu, s, u, ldu,

     $               v, ldv, work(n+1), lwork-n, info )

*               .. now [U](1:NR,1:NR) contains the NR left singular vectors of

*               R. These will be pre-multiplied by Q to build the left singular

*               vectors of A.

         END IF

*

*           .. assemble the left singular vector matrix U of dimensions

*              (M x NR) or (M x N) or (M x M).

         IF ( ( nr .LT. m ) .AND. ( .NOT.wntuf ) ) THEN

             CALL slaset('A', m-nr, nr, zero, zero, u(nr+1,1), ldu)

             IF ( nr .LT. n1 ) THEN

                CALL slaset( 'A',nr,n1-nr,zero,zero,u(1,nr+1), ldu )

                CALL slaset( 'A',m-nr,n1-nr,zero,one,

     $               u(nr+1,nr+1), ldu )

             END IF

         END IF

*

*           The Q matrix from the first QRF is built into the left singular

*           vectors matrix U.

*

         IF ( .NOT.wntuf )

     $       CALL sormqr( 'L', 'N', m, n1, n, a, lda, work, u,

     $            ldu, work(n+1), lwork-n, ierr )

         IF ( rowprm .AND. .NOT.wntuf )

     $          CALL slaswp( n1, u, ldu, 1, m-1, iwork(n+1), -1 )

*

      ELSE IF ( rsvec .AND. ( .NOT. lsvec ) ) THEN

*.......................................................................

*       .. the singular values and the right singular vectors requested

*.......................................................................

          IF ( rtrans ) THEN

*            .. apply SGESVD to R**T

*            .. copy R**T into V and overwrite V with the left singular vectors

            DO 1165 p = 1, nr

               DO 1166 q = p, n

                  v(q,p) = (a(p,q))

 1166          CONTINUE

 1165       CONTINUE

            IF ( nr .GT. 1 )

     $          CALL slaset( 'U', nr-1,nr-1, zero,zero, v(1,2), ldv )

*           .. the left singular vectors of R**T overwrite V, the right singular

*           vectors not computed

            IF ( wntvr .OR. ( nr .EQ. n ) ) THEN

               CALL sgesvd( 'O', 'N', n, nr, v, ldv, s, u, ldu,

     $              u, ldu, work(n+1), lwork-n, info )

*

               DO 1121 p = 1, nr

                   DO 1122 q = p + 1, nr

                      rtmp   = v(q,p)

                      v(q,p) = v(p,q)

                      v(p,q) = rtmp

 1122              CONTINUE

 1121          CONTINUE

*

               IF ( nr .LT. n ) THEN

                   DO 1103 p = 1, nr

                      DO 1104 q = nr + 1, n

                          v(p,q) = v(q,p)

 1104                 CONTINUE

 1103              CONTINUE

               END IF

               CALL slapmt( .false., nr, n, v, ldv, iwork )

            ELSE

*               .. need all N right singular vectors and NR < N

*               [!] This is a simple implementation that augments [V](1:N,1:NR)

*               by padding a zero block. In the case NR << N, a more efficient

*               way is to first use the QR factorization. For more details

*               how to implement this, see the " FULL SVD " branch.

                CALL slaset('G', n, n-nr, zero, zero, v(1,nr+1), ldv)

                CALL sgesvd( 'O', 'N', n, n, v, ldv, s, u, ldu,

     $               u, ldu, work(n+1), lwork-n, info )

*

                DO 1123 p = 1, n

                   DO 1124 q = p + 1, n

                      rtmp   = v(q,p)

                      v(q,p) = v(p,q)

                      v(p,q) = rtmp

 1124              CONTINUE

 1123           CONTINUE

                CALL slapmt( .false., n, n, v, ldv, iwork )

            END IF

*

          ELSE

*            .. apply SGESVD to R

*            .. copy R into V and overwrite V with the right singular vectors

             CALL slacpy( 'U', nr, n, a, lda, v, ldv )

             IF ( nr .GT. 1 )

     $         CALL slaset( 'L', nr-1, nr-1, zero, zero, v(2,1),

     $                      ldv )

*            .. the right singular vectors overwrite V, the NR left singular

*            vectors stored in U(1:NR,1:NR)

             IF ( wntvr .OR. ( nr .EQ. n ) ) THEN

                CALL sgesvd( 'N', 'O', nr, n, v, ldv, s, u, ldu,

     $               v, ldv, work(n+1), lwork-n, info )

                CALL slapmt( .false., nr, n, v, ldv, iwork )

*               .. now [V](1:NR,1:N) contains V(1:N,1:NR)**T

             ELSE

*               .. need all N right singular vectors and NR < N

*               [!] This is a simple implementation that augments [V](1:NR,1:N)

*               by padding a zero block. In the case NR << N, a more efficient

*               way is to first use the LQ factorization. For more details

*               how to implement this, see the " FULL SVD " branch.

                 CALL slaset('G', n-nr, n, zero,zero, v(nr+1,1), ldv)

                 CALL sgesvd( 'N', 'O', n, n, v, ldv, s, u, ldu,

     $                v, ldv, work(n+1), lwork-n, info )

                 CALL slapmt( .false., n, n, v, ldv, iwork )

             END IF

*            .. now [V] contains the transposed matrix of the right singular

*            vectors of A.

          END IF

*

      ELSE

*.......................................................................

*       .. FULL SVD requested

*.......................................................................

         IF ( rtrans ) THEN

*

*            .. apply SGESVD to R**T [[this option is left for R&D&T]]

*

            IF ( wntvr .OR. ( nr .EQ. n ) ) THEN

*            .. copy R**T into [V] and overwrite [V] with the left singular

*            vectors of R**T

            DO 1168 p = 1, nr

               DO 1169 q = p, n

                  v(q,p) = a(p,q)

 1169          CONTINUE

 1168       CONTINUE

            IF ( nr .GT. 1 )

     $          CALL slaset( 'U', nr-1,nr-1, zero,zero, v(1,2), ldv )

*

*           .. the left singular vectors of R**T overwrite [V], the NR right

*           singular vectors of R**T stored in [U](1:NR,1:NR) as transposed

               CALL sgesvd( 'O', 'A', n, nr, v, ldv, s, v, ldv,

     $              u, ldu, work(n+1), lwork-n, info )

*              .. assemble V

               DO 1115 p = 1, nr

                  DO 1116 q = p + 1, nr

                     rtmp   = v(q,p)

                     v(q,p) = v(p,q)

                     v(p,q) = rtmp

 1116             CONTINUE

 1115          CONTINUE

               IF ( nr .LT. n ) THEN

                   DO 1101 p = 1, nr

                      DO 1102 q = nr+1, n

                         v(p,q) = v(q,p)

 1102                 CONTINUE

 1101              CONTINUE

               END IF

               CALL slapmt( .false., nr, n, v, ldv, iwork )

*

                DO 1117 p = 1, nr

                   DO 1118 q = p + 1, nr

                      rtmp   = u(q,p)

                      u(q,p) = u(p,q)

                      u(p,q) = rtmp

 1118              CONTINUE

 1117           CONTINUE

*

                IF ( ( nr .LT. m ) .AND. .NOT.(wntuf)) THEN

                  CALL slaset('A', m-nr,nr, zero,zero, u(nr+1,1),

     $                         ldu)

                  IF ( nr .LT. n1 ) THEN

                     CALL slaset('A',nr,n1-nr,zero,zero,u(1,nr+1),

     $                            ldu)

                     CALL slaset( 'A',m-nr,n1-nr,zero,one,

     $                    u(nr+1,nr+1), ldu )

                  END IF

               END IF

*

            ELSE

*               .. need all N right singular vectors and NR < N

*            .. copy R**T into [V] and overwrite [V] with the left singular

*            vectors of R**T

*               [[The optimal ratio N/NR for using QRF instead of padding

*                 with zeros. Here hard coded to 2; it must be at least

*                 two due to work space constraints.]]

*               OPTRATIO = ILAENV(6, 'SGESVD', 'S' // 'O', NR,N,0,0)

*               OPTRATIO = MAX( OPTRATIO, 2 )

                optratio = 2

                IF ( optratio*nr .GT. n ) THEN

                   DO 1198 p = 1, nr

                      DO 1199 q = p, n

                         v(q,p) = a(p,q)

 1199                 CONTINUE

 1198              CONTINUE

                   IF ( nr .GT. 1 )

     $             CALL slaset('U',nr-1,nr-1, zero,zero, v(1,2),ldv)

*

                   CALL slaset('A',n,n-nr,zero,zero,v(1,nr+1),ldv)

                   CALL sgesvd( 'O', 'A', n, n, v, ldv, s, v, ldv,

     $                  u, ldu, work(n+1), lwork-n, info )

*

                   DO 1113 p = 1, n

                      DO 1114 q = p + 1, n

                         rtmp   = v(q,p)

                         v(q,p) = v(p,q)

                         v(p,q) = rtmp

 1114                 CONTINUE

 1113              CONTINUE

                   CALL slapmt( .false., n, n, v, ldv, iwork )

*              .. assemble the left singular vector matrix U of dimensions

*              (M x N1), i.e. (M x N) or (M x M).

*

                   DO 1111 p = 1, n

                      DO 1112 q = p + 1, n

                         rtmp   = u(q,p)

                         u(q,p) = u(p,q)

                         u(p,q) = rtmp

 1112                 CONTINUE

 1111              CONTINUE

*

                   IF ( ( n .LT. m ) .AND. .NOT.(wntuf)) THEN

                      CALL slaset('A',m-n,n,zero,zero,u(n+1,1),ldu)

                      IF ( n .LT. n1 ) THEN

                        CALL slaset('A',n,n1-n,zero,zero,u(1,n+1),

     $                               ldu)

                        CALL slaset('A',m-n,n1-n,zero,one,

     $                       u(n+1,n+1), ldu )

                      END IF

                   END IF

                ELSE

*                  .. copy R**T into [U] and overwrite [U] with the right

*                  singular vectors of R

                   DO 1196 p = 1, nr

                      DO 1197 q = p, n

                         u(q,nr+p) = a(p,q)

 1197                 CONTINUE

 1196              CONTINUE

                   IF ( nr .GT. 1 )

     $             CALL slaset('U',nr-1,nr-1,zero,zero,u(1,nr+2),ldu)

                   CALL sgeqrf( n, nr, u(1,nr+1), ldu, work(n+1),

     $                  work(n+nr+1), lwork-n-nr, ierr )

                   DO 1143 p = 1, nr

                       DO 1144 q = 1, n

                           v(q,p) = u(p,nr+q)

 1144                  CONTINUE

 1143              CONTINUE

                  CALL slaset('U',nr-1,nr-1,zero,zero,v(1,2),ldv)

                  CALL sgesvd( 'S', 'O', nr, nr, v, ldv, s, u, ldu,

     $                 v,ldv, work(n+nr+1),lwork-n-nr, info )

                  CALL slaset('A',n-nr,nr,zero,zero,v(nr+1,1),ldv)

                  CALL slaset('A',nr,n-nr,zero,zero,v(1,nr+1),ldv)

                  CALL slaset('A',n-nr,n-nr,zero,one,v(nr+1,nr+1),

     $                         ldv)

                  CALL sormqr('R','C', n, n, nr, u(1,nr+1), ldu,

     $                 work(n+1),v,ldv,work(n+nr+1),lwork-n-nr,ierr)

                  CALL slapmt( .false., n, n, v, ldv, iwork )

*                 .. assemble the left singular vector matrix U of dimensions

*                 (M x NR) or (M x N) or (M x M).

                  IF ( ( nr .LT. m ) .AND. .NOT.(wntuf)) THEN

                     CALL slaset('A',m-nr,nr,zero,zero,u(nr+1,1),ldu)

                     IF ( nr .LT. n1 ) THEN

                     CALL slaset('A',nr,n1-nr,zero,zero,u(1,nr+1),

     $                            ldu)

                     CALL slaset( 'A',m-nr,n1-nr,zero,one,

     $                    u(nr+1,nr+1),ldu)

                     END IF

                  END IF

                END IF

            END IF

*

         ELSE

*

*            .. apply SGESVD to R [[this is the recommended option]]

*

             IF ( wntvr .OR. ( nr .EQ. n ) ) THEN

*                .. copy R into [V] and overwrite V with the right singular vectors

                 CALL slacpy( 'U', nr, n, a, lda, v, ldv )

                IF ( nr .GT. 1 )

     $          CALL slaset( 'L', nr-1,nr-1, zero,zero, v(2,1), ldv )

*               .. the right singular vectors of R overwrite [V], the NR left

*               singular vectors of R stored in [U](1:NR,1:NR)

                CALL sgesvd( 'S', 'O', nr, n, v, ldv, s, u, ldu,

     $               v, ldv, work(n+1), lwork-n, info )

                CALL slapmt( .false., nr, n, v, ldv, iwork )

*               .. now [V](1:NR,1:N) contains V(1:N,1:NR)**T

*               .. assemble the left singular vector matrix U of dimensions

*              (M x NR) or (M x N) or (M x M).

               IF ( ( nr .LT. m ) .AND. .NOT.(wntuf)) THEN

                  CALL slaset('A', m-nr,nr, zero,zero, u(nr+1,1),

     $                         ldu)

                  IF ( nr .LT. n1 ) THEN

                     CALL slaset('A',nr,n1-nr,zero,zero,u(1,nr+1),

     $                            ldu)

                     CALL slaset( 'A',m-nr,n1-nr,zero,one,

     $                    u(nr+1,nr+1), ldu )

                  END IF

               END IF

*

             ELSE

*              .. need all N right singular vectors and NR < N

*              .. the requested number of the left singular vectors

*               is then N1 (N or M)

*               [[The optimal ratio N/NR for using LQ instead of padding

*                 with zeros. Here hard coded to 2; it must be at least

*                 two due to work space constraints.]]

*               OPTRATIO = ILAENV(6, 'SGESVD', 'S' // 'O', NR,N,0,0)

*               OPTRATIO = MAX( OPTRATIO, 2 )

               optratio = 2

               IF ( optratio * nr .GT. n ) THEN

                  CALL slacpy( 'U', nr, n, a, lda, v, ldv )

                  IF ( nr .GT. 1 )

     $            CALL slaset('L', nr-1,nr-1, zero,zero, v(2,1),ldv)

*              .. the right singular vectors of R overwrite [V], the NR left

*                 singular vectors of R stored in [U](1:NR,1:NR)

                  CALL slaset('A', n-nr,n, zero,zero, v(nr+1,1),ldv)

                  CALL sgesvd( 'S', 'O', n, n, v, ldv, s, u, ldu,

     $                 v, ldv, work(n+1), lwork-n, info )

                  CALL slapmt( .false., n, n, v, ldv, iwork )

*                 .. now [V] contains the transposed matrix of the right

*                 singular vectors of A. The leading N left singular vectors

*                 are in [U](1:N,1:N)

*                 .. assemble the left singular vector matrix U of dimensions

*                 (M x N1), i.e. (M x N) or (M x M).

                  IF ( ( n .LT. m ) .AND. .NOT.(wntuf)) THEN

                      CALL slaset('A',m-n,n,zero,zero,u(n+1,1),ldu)

                      IF ( n .LT. n1 ) THEN

                        CALL slaset('A',n,n1-n,zero,zero,u(1,n+1),

     $                               ldu)

                        CALL slaset( 'A',m-n,n1-n,zero,one,

     $                       u(n+1,n+1), ldu )

                      END IF

                  END IF

               ELSE

                  CALL slacpy( 'U', nr, n, a, lda, u(nr+1,1), ldu )

                  IF ( nr .GT. 1 )

     $            CALL slaset('L',nr-1,nr-1,zero,zero,u(nr+2,1),ldu)

                  CALL sgelqf( nr, n, u(nr+1,1), ldu, work(n+1),

     $                 work(n+nr+1), lwork-n-nr, ierr )

                  CALL slacpy('L',nr,nr,u(nr+1,1),ldu,v,ldv)

                  IF ( nr .GT. 1 )

     $            CALL slaset('U',nr-1,nr-1,zero,zero,v(1,2),ldv)

                  CALL sgesvd( 'S', 'O', nr, nr, v, ldv, s, u, ldu,

     $                 v, ldv, work(n+nr+1), lwork-n-nr, info )

                  CALL slaset('A',n-nr,nr,zero,zero,v(nr+1,1),ldv)

                  CALL slaset('A',nr,n-nr,zero,zero,v(1,nr+1),ldv)

                  CALL slaset('A',n-nr,n-nr,zero,one,v(nr+1,nr+1),

     $                         ldv)

                  CALL sormlq('R','N',n,n,nr,u(nr+1,1),ldu,work(n+1),

     $                 v, ldv, work(n+nr+1),lwork-n-nr,ierr)

                  CALL slapmt( .false., n, n, v, ldv, iwork )

*               .. assemble the left singular vector matrix U of dimensions

*              (M x NR) or (M x N) or (M x M).

                  IF ( ( nr .LT. m ) .AND. .NOT.(wntuf)) THEN

                     CALL slaset('A',m-nr,nr,zero,zero,u(nr+1,1),ldu)

                     IF ( nr .LT. n1 ) THEN

                     CALL slaset('A',nr,n1-nr,zero,zero,u(1,nr+1),

     $                            ldu)

                     CALL slaset( 'A',m-nr,n1-nr,zero,one,

     $                    u(nr+1,nr+1), ldu )

                     END IF

                  END IF

               END IF

             END IF

*        .. end of the "R**T or R" branch

         END IF

*

*           The Q matrix from the first QRF is built into the left singular

*           vectors matrix U.

*

         IF ( .NOT. wntuf )

     $       CALL sormqr( 'L', 'N', m, n1, n, a, lda, work, u,

     $            ldu, work(n+1), lwork-n, ierr )

         IF ( rowprm .AND. .NOT.wntuf )

     $          CALL slaswp( n1, u, ldu, 1, m-1, iwork(n+1), -1 )

*

*     ... end of the "full SVD" branch

      END IF

*

*     Check whether some singular values are returned as zeros, e.g.

*     due to underflow, and update the numerical rank.

      p = nr

      DO 4001 q = p, 1, -1

          IF ( s(q) .GT. zero ) GO TO 4002

          nr = nr - 1

 4001 CONTINUE

 4002 CONTINUE

*

*     .. if numerical rank deficiency is detected, the truncated

*     singular values are set to zero.

      IF ( nr .LT. n ) CALL slaset( 'G', n-nr,1, zero,zero, s(nr+1),

     $     n )

*     .. undo scaling; this may cause overflow in the largest singular

*     values.

      IF ( ascaled )

     $   CALL slascl( 'G',0,0, one,sqrt(real(m)), nr,1, s, n, ierr )

      IF ( conda ) rwork(1) = sconda

      rwork(2) = real( p - nr )

*     .. p-NR is the number of singular values that are computed as

*     exact zeros in SGESVD() applied to the (possibly truncated)

*     full row rank triangular (trapezoidal) factor of A.

      numrank = nr

*

      RETURN

*

*     End of SGESVDQ

*

*     SUBROUTINE SGESVDQ( JOBA, JOBP, JOBR, JOBU, JOBV, M, N, A, LDA, ... )

      END

xerbla
subroutine xerbla(srname, info)
Definition cblat2.f:3285

sgelqf
subroutine sgelqf(m, n, a, lda, tau, work, lwork, info)
SGELQF
Definition sgelqf.f:142

sgeqp3
subroutine sgeqp3(m, n, a, lda, jpvt, tau, work, lwork, info)
SGEQP3
Definition sgeqp3.f:149

sgeqrf
subroutine sgeqrf(m, n, a, lda, tau, work, lwork, info)
SGEQRF
Definition sgeqrf.f:144

sgesvd
subroutine sgesvd(jobu, jobvt, m, n, a, lda, s, u, ldu, vt, ldvt, work, lwork, info)
SGESVD computes the singular value decomposition (SVD) for GE matrices
Definition sgesvd.f:210

sgesvdq
subroutine sgesvdq(joba, jobp, jobr, jobu, jobv, m, n, a, lda, s, u, ldu, v, ldv, numrank, iwork, liwork, work, lwork, rwork, lrwork, info)
SGESVDQ computes the singular value decomposition (SVD) with a QR-Preconditioned QR SVD Method for GE matrices
Definition sgesvdq.f:413

slacpy
subroutine slacpy(uplo, m, n, a, lda, b, ldb)
SLACPY copies all or part of one two-dimensional array to another.
Definition slacpy.f:101

slapmt
subroutine slapmt(forwrd, m, n, x, ldx, k)
SLAPMT performs a forward or backward permutation of the columns of a matrix.
Definition slapmt.f:102

slascl
subroutine slascl(type, kl, ku, cfrom, cto, m, n, a, lda, info)
SLASCL multiplies a general rectangular matrix by a real scalar defined as cto/cfrom.
Definition slascl.f:142

slaset
subroutine slaset(uplo, m, n, alpha, beta, a, lda)
SLASET initializes the off-diagonal elements and the diagonal elements of a matrix to given values.
Definition slaset.f:108

slaswp
subroutine slaswp(n, a, lda, k1, k2, ipiv, incx)
SLASWP performs a series of row interchanges on a general rectangular matrix.
Definition slaswp.f:113

spocon
subroutine spocon(uplo, n, a, lda, anorm, rcond, work, iwork, info)
SPOCON
Definition spocon.f:119

sscal
subroutine sscal(n, sa, sx, incx)
SSCAL
Definition sscal.f:79

sormlq
subroutine sormlq(side, trans, m, n, k, a, lda, tau, c, ldc, work, lwork, info)
SORMLQ
Definition sormlq.f:166

sormqr
subroutine sormqr(side, trans, m, n, k, a, lda, tau, c, ldc, work, lwork, info)
SORMQR
Definition sormqr.f:166