subroutine dlasd2	(	integer	NL,
		integer	NR,
		integer	SQRE,
		integer	K,
		double precision, dimension( * )	D,
		double precision, dimension( * )	Z,
		double precision	ALPHA,
		double precision	BETA,
		double precision, dimension( ldu, * )	U,
		integer	LDU,
		double precision, dimension( ldvt, * )	VT,
		integer	LDVT,
		double precision, dimension( * )	DSIGMA,
		double precision, dimension( ldu2, * )	U2,
		integer	LDU2,
		double precision, dimension( ldvt2, * )	VT2,
		integer	LDVT2,
		integer, dimension( * )	IDXP,
		integer, dimension( * )	IDX,
		integer, dimension( * )	IDXC,
		integer, dimension( * )	IDXQ,
		integer, dimension( * )	COLTYP,
		integer	INFO
	)

DLASD2 merges the two sets of singular values together into a single sorted set. Used by dbdsdc.

Download DLASD2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

 DLASD2 merges the two sets of singular values together into a single
 sorted set.  Then it tries to deflate the size of the problem.
 There are two ways in which deflation can occur:  when two or more
 singular values are close together or if there is a tiny entry in the
 Z vector.  For each such occurrence the order of the related secular
 equation problem is reduced by one.

 DLASD2 is called from DLASD1.

Parameters

[in]	NL	NL is INTEGER The row dimension of the upper block. NL >= 1.
[in]	NR	NR is INTEGER The row dimension of the lower block. NR >= 1.
[in]	SQRE	SQRE is INTEGER = 0: the lower block is an NR-by-NR square matrix. = 1: the lower block is an NR-by-(NR+1) rectangular matrix. The bidiagonal matrix has N = NL + NR + 1 rows and M = N + SQRE >= N columns.
[out]	K	K is INTEGER Contains the dimension of the non-deflated matrix. This is the order of the related secular equation. 1 <= K <= N.
[in,out]	D	D is DOUBLE PRECISION array, dimension(N) On entry D contains the singular values of the two submatrices to be combined. On exit D contains the trailing (N-K) updated singular values (those which were deflated) sorted into increasing order.
[out]	Z	Z is DOUBLE PRECISION array, dimension(N) On exit Z contains the updating row vector in the secular equation.
[in]	ALPHA	ALPHA is DOUBLE PRECISION Contains the diagonal element associated with the added row.
[in]	BETA	BETA is DOUBLE PRECISION Contains the off-diagonal element associated with the added row.
[in,out]	U	U is DOUBLE PRECISION array, dimension(LDU,N) On entry U contains the left singular vectors of two submatrices in the two square blocks with corners at (1,1), (NL, NL), and (NL+2, NL+2), (N,N). On exit U contains the trailing (N-K) updated left singular vectors (those which were deflated) in its last N-K columns.
[in]	LDU	LDU is INTEGER The leading dimension of the array U. LDU >= N.
[in,out]	VT	VT is DOUBLE PRECISION array, dimension(LDVT,M) On entry VT**T contains the right singular vectors of two submatrices in the two square blocks with corners at (1,1), (NL+1, NL+1), and (NL+2, NL+2), (M,M). On exit VT**T contains the trailing (N-K) updated right singular vectors (those which were deflated) in its last N-K columns. In case SQRE =1, the last row of VT spans the right null space.
[in]	LDVT	LDVT is INTEGER The leading dimension of the array VT. LDVT >= M.
[out]	DSIGMA	DSIGMA is DOUBLE PRECISION array, dimension (N) Contains a copy of the diagonal elements (K-1 singular values and one zero) in the secular equation.
[out]	U2	U2 is DOUBLE PRECISION array, dimension(LDU2,N) Contains a copy of the first K-1 left singular vectors which will be used by DLASD3 in a matrix multiply (DGEMM) to solve for the new left singular vectors. U2 is arranged into four blocks. The first block contains a column with 1 at NL+1 and zero everywhere else; the second block contains non-zero entries only at and above NL; the third contains non-zero entries only below NL+1; and the fourth is dense.
[in]	LDU2	LDU2 is INTEGER The leading dimension of the array U2. LDU2 >= N.
[out]	VT2	VT2 is DOUBLE PRECISION array, dimension(LDVT2,M) VT2**T contains a copy of the first K right singular vectors which will be used by DLASD3 in a matrix multiply (DGEMM) to solve for the new right singular vectors. VT2 is arranged into three blocks. The first block contains a row that corresponds to the special 0 diagonal element in SIGMA; the second block contains non-zeros only at and before NL +1; the third block contains non-zeros only at and after NL +2.
[in]	LDVT2	LDVT2 is INTEGER The leading dimension of the array VT2. LDVT2 >= M.
[out]	IDXP	IDXP is INTEGER array dimension(N) This will contain the permutation used to place deflated values of D at the end of the array. On output IDXP(2:K) points to the nondeflated D-values and IDXP(K+1:N) points to the deflated singular values.
[out]	IDX	IDX is INTEGER array dimension(N) This will contain the permutation used to sort the contents of D into ascending order.
[out]	IDXC	IDXC is INTEGER array dimension(N) This will contain the permutation used to arrange the columns of the deflated U matrix into three groups: the first group contains non-zero entries only at and above NL, the second contains non-zero entries only below NL+2, and the third is dense.
[in,out]	IDXQ	IDXQ is INTEGER array dimension(N) This contains the permutation which separately sorts the two sub-problems in D into ascending order. Note that entries in the first half of this permutation must first be moved one position backward; and entries in the second half must first have NL+1 added to their values.
[out]	COLTYP	COLTYP is INTEGER array dimension(N) As workspace, this will contain a label which will indicate which of the following types a column in the U2 matrix or a row in the VT2 matrix is: 1 : non-zero in the upper half only 2 : non-zero in the lower half only 3 : dense 4 : deflated On exit, it is an array of dimension 4, with COLTYP(I) being the dimension of the I-th type columns.
[out]	INFO	INFO is INTEGER = 0: successful exit. < 0: if INFO = -i, the i-th argument had an illegal value.

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: September 2012

Contributors: Ming Gu and Huan Ren, Computer Science Division, University of California at Berkeley, USA

Definition at line 271 of file dlasd2.f.

 *
 *  -- LAPACK auxiliary routine (version 3.4.2) --
 *  -- LAPACK is a software package provided by Univ. of Tennessee,    --
 *  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
 *     September 2012
 *
 *     Body of DLASD2: builds the Z vector from ALPHA, BETA and VT,
 *     merges the two halves of D into one sorted list, deflates
 *     entries that have a small Z component or nearly equal D values,
 *     and packs the results into DSIGMA, U2, VT2, IDXP, IDXC and
 *     COLTYP.
 *
 *     .. Scalar Arguments ..
       INTEGER            info, k, ldu, ldu2, ldvt, ldvt2, nl, nr, sqre
       DOUBLE PRECISION   alpha, beta
 *     ..
 *     .. Array Arguments ..
       INTEGER            coltyp( * ), idx( * ), idxc( * ), idxp( * ),
      $                   idxq( * )
       DOUBLE PRECISION   d( * ), dsigma( * ), u( ldu, * ),
      $                   u2( ldu2, * ), vt( ldvt, * ), vt2( ldvt2, * ),
      $                   z( * )
 *     ..
 *
 *  =====================================================================
 *
 *     .. Parameters ..
       DOUBLE PRECISION   zero, one, two, eight
       parameter                ( zero = 0.0d+0, one = 1.0d+0, two = 2.0d+0,
      $                   eight = 8.0d+0 )
 *     ..
 *     .. Local Arrays ..
 *     CTOT counts the columns of each of the four types; PSM holds the
 *     next free position for each type while IDXC is being filled.
       INTEGER            ctot( 4 ), psm( 4 )
 *     ..
 *     .. Local Scalars ..
       INTEGER            ct, i, idxi, idxj, idxjp, j, jp, jprev, k2, m,
      $                   n, nlp1, nlp2
       DOUBLE PRECISION   c, eps, hlftol, s, tau, tol, z1
 *     ..
 *     .. External Functions ..
       DOUBLE PRECISION   dlamch, dlapy2
       EXTERNAL           dlamch, dlapy2
 *     ..
 *     .. External Subroutines ..
       EXTERNAL           dcopy, dlacpy, dlamrg, dlaset, drot, xerbla
 *     ..
 *     .. Intrinsic Functions ..
       INTRINSIC          abs, max
 *     ..
 *     .. Executable Statements ..
 *
 *     Test the input parameters.
 *
       info = 0
 *
       IF( nl.LT.1 ) THEN
          info = -1
       ELSE IF( nr.LT.1 ) THEN
          info = -2
       ELSE IF( ( sqre.NE.1 ) .AND. ( sqre.NE.0 ) ) THEN
          info = -3
       END IF
 *
 *     N is the number of rows and M the number of columns of the
 *     bidiagonal matrix (M = N when SQRE = 0, M = N + 1 when SQRE = 1).
 *
       n = nl + nr + 1
       m = n + sqre
 *
 *     NOTE: this chain is independent of the one above, so a failing
 *     leading-dimension check overwrites an earlier NL/NR/SQRE code.
 *
       IF( ldu.LT.n ) THEN
          info = -10
       ELSE IF( ldvt.LT.m ) THEN
          info = -12
       ELSE IF( ldu2.LT.n ) THEN
          info = -15
       ELSE IF( ldvt2.LT.m ) THEN
          info = -17
       END IF
       IF( info.NE.0 ) THEN
          CALL xerbla( 'DLASD2', -info )
          RETURN
       END IF
 *
       nlp1 = nl + 1
       nlp2 = nl + 2
 *
 *     Generate the first part of the vector Z; and move the singular
 *     values in the first part of D one position backward.
 *
 *     Z1 is kept separately because Z( 1 ) is finalized only near the
 *     end of the routine.  The loop runs downward so that D( I ) and
 *     IDXQ( I ) are read before slot I is overwritten.  IDXQ entries
 *     of the first half are incremented to follow the shifted D.
 *
       z1 = alpha*vt( nlp1, nlp1 )
       z( 1 ) = z1
       DO 10 i = nl, 1, -1
          z( i+1 ) = alpha*vt( i, nlp1 )
          d( i+1 ) = d( i )
          idxq( i+1 ) = idxq( i ) + 1
    10 CONTINUE
 *
 *     Generate the second part of the vector Z.
 *
       DO 20 i = nlp2, m
          z( i ) = beta*vt( i, nlp2 )
    20 CONTINUE
 *
 *     Initialize some reference arrays.
 *     Entries 2..NL+1 start as type 1, entries NL+2..N as type 2.
 *
       DO 30 i = 2, nlp1
          coltyp( i ) = 1
    30 CONTINUE
       DO 40 i = nlp2, n
          coltyp( i ) = 2
    40 CONTINUE
 *
 *     Sort the singular values into increasing order
 *
 *     First offset the second-half entries of IDXQ by NL+1 so that
 *     they index the full D array.
 *
       DO 50 i = nlp2, n
          idxq( i ) = idxq( i ) + nlp1
    50 CONTINUE
 *
 *     DSIGMA, IDXC, and the first column of U2
 *     are used as storage space.
 *
 *     They receive D, COLTYP and Z gathered through IDXQ.
 *
       DO 60 i = 2, n
          dsigma( i ) = d( idxq( i ) )
          u2( i, 1 ) = z( idxq( i ) )
          idxc( i ) = coltyp( idxq( i ) )
    60 CONTINUE
 *
 *     DLAMRG is given the NL + NR values starting at DSIGMA( 2 ) and
 *     fills IDX( 2:N ); its indices are relative to DSIGMA( 2 ), hence
 *     the "1 +" offset in the loop below.
 *
       CALL dlamrg( nl, nr, dsigma( 2 ), 1, 1, idx( 2 ) )
 *
       DO 70 i = 2, n
          idxi = 1 + idx( i )
          d( i ) = dsigma( idxi )
          z( i ) = u2( idxi, 1 )
          coltyp( i ) = idxc( idxi )
    70 CONTINUE
 *
 *     Calculate the allowable deflation tolerance
 *     TOL = 8 * EPS * max( |ALPHA|, |BETA|, |D( N )| ).
 *
       eps = dlamch( 'Epsilon' )
       tol = max( abs( alpha ), abs( beta ) )
       tol = eight*eps*max( abs( d( n ) ), tol )
 *
 *     There are 2 kinds of deflation -- first a value in the z-vector
 *     is small, second two (or more) singular values are very close
 *     together (their difference is small).
 *
 *     If the value in the z-vector is small, we simply permute the
 *     array so that the corresponding singular value is moved to the
 *     end.
 *
 *     If two values in the D-vector are close, we perform a two-sided
 *     rotation designed to make one of the corresponding z-vector
 *     entries zero, and then permute the array so that the deflated
 *     singular value is moved to the end.
 *
 *     If there are multiple singular values then the problem deflates.
 *     Here the number of equal singular values are found.  As each equal
 *     singular value is found, an elementary reflector is computed to
 *     rotate the corresponding singular subspace so that the
 *     corresponding components of Z are zero in this new basis.
 *
 *     K counts the non-deflated entries (slot 1 is counted from the
 *     start).  K2 is the front of the deflated list, which is filled
 *     downward in IDXP starting at position N.
 *
       k = 1
       k2 = n + 1
 *
 *     Loop 80 skips leading entries with a small Z component and stops
 *     at the first entry that is kept (JPREV).  If every entry through
 *     J = N deflates, jump straight to label 120 without recording a
 *     non-deflated value.
 *
       DO 80 j = 2, n
          IF( abs( z( j ) ).LE.tol ) THEN
 *
 *           Deflate due to small z component.
 *
             k2 = k2 - 1
             idxp( k2 ) = j
             coltyp( j ) = 4
             IF( j.EQ.n )
      $         GO TO 120
          ELSE
             jprev = j
             GO TO 90
          END IF
    80 CONTINUE
    90 CONTINUE
 *
 *     Labels 100-110 form a loop over J = JPREV+1, ..., N in which
 *     JPREV is the most recent entry not yet recorded or deflated.
 *
       j = jprev
   100 CONTINUE
       j = j + 1
       IF( j.GT.n )
      $   GO TO 110
       IF( abs( z( j ) ).LE.tol ) THEN
 *
 *        Deflate due to small z component.
 *
          k2 = k2 - 1
          idxp( k2 ) = j
          coltyp( j ) = 4
       ELSE
 *
 *        Check if singular values are close enough to allow deflation.
 *
          IF( abs( d( j )-d( jprev ) ).LE.tol ) THEN
 *
 *           Deflation is possible.
 *
             s = z( jprev )
             c = z( j )
 *
 *           Find sqrt(a**2+b**2) without overflow or
 *           destructive underflow.
 *
 *           After the rotation Z( J ) carries the combined magnitude
 *           TAU and Z( JPREV ) becomes zero.
 *
             tau = dlapy2( c, s )
             c = c / tau
             s = -s / tau
             z( j ) = tau
             z( jprev ) = zero
 *
 *           Apply back the Givens rotation to the left and right
 *           singular vector matrices.
 *
 *           IDXQ entries at or below NL+1 were incremented in loop 10;
 *           subtract one to address the unshifted column of U and
 *           row of VT.
 *
             idxjp = idxq( idx( jprev )+1 )
             idxj = idxq( idx( j )+1 )
             IF( idxjp.LE.nlp1 ) THEN
                idxjp = idxjp - 1
             END IF
             IF( idxj.LE.nlp1 ) THEN
                idxj = idxj - 1
             END IF
             CALL drot( n, u( 1, idxjp ), 1, u( 1, idxj ), 1, c, s )
             CALL drot( m, vt( idxjp, 1 ), ldvt, vt( idxj, 1 ), ldvt, c,
      $                 s )
 *
 *           Rotating together two entries of different types marks
 *           the surviving entry J as type 3; JPREV is deflated
 *           (type 4).
 *
             IF( coltyp( j ).NE.coltyp( jprev ) ) THEN
                coltyp( j ) = 3
             END IF
             coltyp( jprev ) = 4
             k2 = k2 - 1
             idxp( k2 ) = jprev
             jprev = j
          ELSE
 *
 *           No deflation: record JPREV as the next non-deflated entry
 *           and continue with J as the new pending entry.
 *
             k = k + 1
             u2( k, 1 ) = z( jprev )
             dsigma( k ) = d( jprev )
             idxp( k ) = jprev
             jprev = j
          END IF
       END IF
       GO TO 100
   110 CONTINUE
 *
 *     Record the last singular value.
 *
       k = k + 1
       u2( k, 1 ) = z( jprev )
       dsigma( k ) = d( jprev )
       idxp( k ) = jprev
 *
   120 CONTINUE
 *
 *     Count up the total number of the various types of columns, then
 *     form a permutation which positions the four column types into
 *     four groups of uniform structure (although one or more of these
 *     groups may be empty).
 *
       DO 130 j = 1, 4
          ctot( j ) = 0
   130 CONTINUE
       DO 140 j = 2, n
          ct = coltyp( j )
          ctot( ct ) = ctot( ct ) + 1
   140 CONTINUE
 *
 *     PSM(*) = Position in SubMatrix (of types 1 through 4)
 *     Positions start at 2 because slot 1 is handled separately.
 *
       psm( 1 ) = 2
       psm( 2 ) = 2 + ctot( 1 )
       psm( 3 ) = psm( 2 ) + ctot( 2 )
       psm( 4 ) = psm( 3 ) + ctot( 3 )
 *
 *     Fill out the IDXC array so that the permutation which it induces
 *     will place all type-1 columns first, all type-2 columns next,
 *     then all type-3's, and finally all type-4's, starting from the
 *     second column. This applies similarly to the rows of VT.
 *
       DO 150 j = 2, n
          jp = idxp( j )
          ct = coltyp( jp )
          idxc( psm( ct ) ) = j
          psm( ct ) = psm( ct ) + 1
   150 CONTINUE
 *
 *     Sort the singular values and corresponding singular vectors into
 *     DSIGMA, U2, and VT2 respectively.  The singular values/vectors
 *     which were not deflated go into the first K slots of DSIGMA, U2,
 *     and VT2 respectively, while those which were deflated go into the
 *     last N - K slots, except that the first column/row will be treated
 *     separately.
 *
 *     DSIGMA( J ) follows IDXP alone, while the column of U and the
 *     row of VT copied into slot J are selected through IDXC as well.
 *
       DO 160 j = 2, n
          jp = idxp( j )
          dsigma( j ) = d( jp )
          idxj = idxq( idx( idxp( idxc( j ) ) )+1 )
          IF( idxj.LE.nlp1 ) THEN
             idxj = idxj - 1
          END IF
          CALL dcopy( n, u( 1, idxj ), 1, u2( 1, j ), 1 )
          CALL dcopy( m, vt( idxj, 1 ), ldvt, vt2( j, 1 ), ldvt2 )
   160 CONTINUE
 *
 *     Determine DSIGMA(1), DSIGMA(2) and Z(1)
 *
 *     DSIGMA( 2 ) is raised to TOL/2 if its magnitude is not larger.
 *     When M > N the first Z entry combines Z1 and Z( M ), and C, S
 *     describe the corresponding rotation (identity if the combined
 *     value is at most TOL).  Z( 1 ) is never left below TOL.  C and S
 *     are set, and later used, only in the M > N case.
 *
       dsigma( 1 ) = zero
       hlftol = tol / two
       IF( abs( dsigma( 2 ) ).LE.hlftol )
      $   dsigma( 2 ) = hlftol
       IF( m.GT.n ) THEN
          z( 1 ) = dlapy2( z1, z( m ) )
          IF( z( 1 ).LE.tol ) THEN
             c = one
             s = zero
             z( 1 ) = tol
          ELSE
             c = z1 / z( 1 )
             s = z( m ) / z( 1 )
          END IF
       ELSE
          IF( abs( z1 ).LE.tol ) THEN
             z( 1 ) = tol
          ELSE
             z( 1 ) = z1
          END IF
       END IF
 *
 *     Move the rest of the updating row to Z.
 *     (The non-deflated Z values were parked in U2( 2:K, 1 ) above.)
 *
       CALL dcopy( k-1, u2( 2, 1 ), 1, z( 2 ), 1 )
 *
 *     Determine the first column of U2, the first row of VT2 and the
 *     last row of VT.
 *
 *     The first column of U2 becomes the unit vector with a one in
 *     row NL+1.
 *
       CALL dlaset( 'A', n, 1, zero, zero, u2, ldu2 )
       u2( nlp1, 1 ) = one
       IF( m.GT.n ) THEN
          DO 170 i = 1, nlp1
             vt( m, i ) = -s*vt( nlp1, i )
             vt2( 1, i ) = c*vt( nlp1, i )
   170    CONTINUE
 *
 *        Order matters below: VT2( 1, I ) must be formed from the old
 *        VT( M, I ) before that entry is scaled in place.
 *
          DO 180 i = nlp2, m
             vt2( 1, i ) = s*vt( m, i )
             vt( m, i ) = c*vt( m, i )
   180    CONTINUE
       ELSE
          CALL dcopy( m, vt( nlp1, 1 ), ldvt, vt2( 1, 1 ), ldvt2 )
       END IF
 *
 *     When M > N, also copy the updated last row of VT into row M
 *     of VT2.
 *
       IF( m.GT.n ) THEN
          CALL dcopy( m, vt( m, 1 ), ldvt, vt2( m, 1 ), ldvt2 )
       END IF
 *
 *     The deflated singular values and their corresponding vectors go
 *     into the back of D, U, and V respectively.
 *
       IF( n.GT.k ) THEN
          CALL dcopy( n-k, dsigma( k+1 ), 1, d( k+1 ), 1 )
          CALL dlacpy( 'A', n, n-k, u2( 1, k+1 ), ldu2, u( 1, k+1 ),
      $                ldu )
          CALL dlacpy( 'A', n-k, m, vt2( k+1, 1 ), ldvt2, vt( k+1, 1 ),
      $                ldvt )
       END IF
 *
 *     Copy CTOT into COLTYP for referencing in DLASD3.
 *     This overwrites the per-column labels in COLTYP( 1:4 ).
 *
       DO 190 j = 1, 4
          coltyp( j ) = ctot( j )
   190 CONTINUE
 *
       RETURN
 *
 *     End of DLASD2
 *

Here is the call graph for this function:

Here is the caller graph for this function: