*  Source listing: db/d5b/dlasq3_8f_source.html

*> \brief \b DLASQ3 checks for deflation, computes a shift and calls dqds. Used by dbdsqr.

*

*  =========== DOCUMENTATION ===========

*

* Online html documentation available at

*            http://www.netlib.org/lapack/explore-html/

*

*> \htmlonly

*> Download DLASQ3 + dependencies

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/dlasq3.f">

*> [TGZ]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/dlasq3.f">

*> [ZIP]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/dlasq3.f">

*> [TXT]</a>

*> \endhtmlonly

*

*  Definition:

*  ===========

*

*       SUBROUTINE DLASQ3( I0, N0, Z, PP, DMIN, SIGMA, DESIG, QMAX, NFAIL,

*                          ITER, NDIV, IEEE, TTYPE, DMIN1, DMIN2, DN, DN1,

*                          DN2, G, TAU )

*

*       .. Scalar Arguments ..

*       LOGICAL            IEEE

*       INTEGER            I0, ITER, N0, NDIV, NFAIL, PP, TTYPE

*       DOUBLE PRECISION   DESIG, DMIN, DMIN1, DMIN2, DN, DN1, DN2, G,

*      $                   QMAX, SIGMA, TAU

*       ..

*       .. Array Arguments ..

*       DOUBLE PRECISION   Z( * )

*       ..

*

*

*> \par Purpose:

*  =============

*>

*> \verbatim

*>

*> DLASQ3 checks for deflation, computes a shift (TAU) and calls dqds.

*> In case of failure it changes shifts, and tries again until output

*> is positive.

*> \endverbatim

*

*  Arguments:

*  ==========

*

*> \param[in] I0

*> \verbatim

*>          I0 is INTEGER

*>         First index.

*> \endverbatim

*>

*> \param[in,out] N0

*> \verbatim

*>          N0 is INTEGER

*>         Last index.

*> \endverbatim

*>

*> \param[in,out] Z

*> \verbatim

*>          Z is DOUBLE PRECISION array, dimension ( 4*N )

*>         Z holds the qd array.

*> \endverbatim

*>

*> \param[in,out] PP

*> \verbatim

*>          PP is INTEGER

*>         PP=0 for ping, PP=1 for pong.

*>         PP=2 indicates that flipping was applied to the Z array

*>         and that the initial tests for deflation should not be

*>         performed.

*> \endverbatim

*>

*> \param[in,out] DMIN

*> \verbatim

*>          DMIN is DOUBLE PRECISION

*>         Minimum value of d.

*> \endverbatim

*>

*> \param[in,out] SIGMA

*> \verbatim

*>          SIGMA is DOUBLE PRECISION

*>         Sum of shifts used in current segment.

*> \endverbatim

*>

*> \param[in,out] DESIG

*> \verbatim

*>          DESIG is DOUBLE PRECISION

*>         Lower order part of SIGMA

*> \endverbatim

*>

*> \param[in,out] QMAX

*> \verbatim

*>          QMAX is DOUBLE PRECISION

*>         Maximum value of q.

*> \endverbatim

*>

*> \param[in,out] NFAIL

*> \verbatim

*>          NFAIL is INTEGER

*>         Number of times shift was too big.

*> \endverbatim

*>

*> \param[in,out] ITER

*> \verbatim

*>          ITER is INTEGER

*>         Number of iterations.

*> \endverbatim

*>

*> \param[in,out] NDIV

*> \verbatim

*>          NDIV is INTEGER

*>         Number of divisions.

*> \endverbatim

*>

*> \param[in] IEEE

*> \verbatim

*>          IEEE is LOGICAL

*>         Flag for IEEE or non IEEE arithmetic (passed to DLASQ5).

*> \endverbatim

*>

*> \param[in,out] TTYPE

*> \verbatim

*>          TTYPE is INTEGER

*>         Shift type.

*> \endverbatim

*>

*> \param[in,out] DMIN1

*> \verbatim

*>          DMIN1 is DOUBLE PRECISION

*> \endverbatim

*>

*> \param[in,out] DMIN2

*> \verbatim

*>          DMIN2 is DOUBLE PRECISION

*> \endverbatim

*>

*> \param[in,out] DN

*> \verbatim

*>          DN is DOUBLE PRECISION

*> \endverbatim

*>

*> \param[in,out] DN1

*> \verbatim

*>          DN1 is DOUBLE PRECISION

*> \endverbatim

*>

*> \param[in,out] DN2

*> \verbatim

*>          DN2 is DOUBLE PRECISION

*> \endverbatim

*>

*> \param[in,out] G

*> \verbatim

*>          G is DOUBLE PRECISION

*> \endverbatim

*>

*> \param[in,out] TAU

*> \verbatim

*>          TAU is DOUBLE PRECISION

*>

*>         These are passed as arguments in order to save their values

*>         between calls to DLASQ3.

*> \endverbatim

*

*  Authors:

*  ========

*

*> \author Univ. of Tennessee

*> \author Univ. of California Berkeley

*> \author Univ. of Colorado Denver

*> \author NAG Ltd.

*

*> \date September 2012

*

*> \ingroup auxOTHERcomputational

*

*  =====================================================================

      SUBROUTINE DLASQ3( I0, N0, Z, PP, DMIN, SIGMA, DESIG, QMAX, NFAIL,
     $                   ITER, NDIV, IEEE, TTYPE, DMIN1, DMIN2, DN, DN1,
     $                   DN2, G, TAU )
*
*  -- LAPACK computational routine (version 3.4.2) --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*     September 2012
*
*  Overview of one call:
*    1. Strip converged entries off the bottom of the segment
*       (N0 is decreased by 1 or 2 per deflation); return as soon
*       as N0 < I0.
*    2. Optionally reverse the qd array Z between I0 and N0.
*    3. Obtain a shift TAU from DLASQ4.
*    4. Run DLASQ5 with that shift, revising TAU and retrying while
*       the returned DMIN is negative; switch to DLASQ6 when a NaN
*       persists with TAU = 0 or when no other case applies.
*    5. Fold TAU into the running pair (SIGMA, DESIG).
*
*     .. Scalar Arguments ..
      LOGICAL            IEEE
      INTEGER            I0, ITER, N0, NDIV, NFAIL, PP, TTYPE
      DOUBLE PRECISION   DESIG, DMIN, DMIN1, DMIN2, DN, DN1, DN2, G,
     $                   QMAX, SIGMA, TAU
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   CBIAS
      PARAMETER          ( CBIAS = 1.50D0 )
      DOUBLE PRECISION   ZERO, QURTR, HALF, ONE, TWO, HUNDRD
      PARAMETER          ( ZERO = 0.0D0, QURTR = 0.250D0,
     $                   HALF = 0.5D0, ONE = 1.0D0, TWO = 2.0D0,
     $                   HUNDRD = 100.0D0 )
*     ..
*     .. Local Scalars ..
*     N0ORIG : value of N0 on entry
*     NN     : 4*N0 + PP, base offset for the bottom entries of Z
*     KQ1, KE1, KQ2 : NN-7, NN-5, NN-3 (used in the 2-by-2 block)
*     JF, JL : 4*I0 + PP and 4*N0 + PP
*     MF, ML : 4*I0 - PP and 4*N0 - PP
*     KSUM, K4, KMIR : reversal loop bookkeeping
      INTEGER            JF, JL, K4, KE1, KMIR, KQ1, KQ2, KSUM
      INTEGER            MF, ML, N0ORIG, NN
      DOUBLE PRECISION   PREC, SVAL, SWAP, TOL, TOLSQ, TVAL
*     ..
*     .. External Subroutines ..
      EXTERNAL           DLASQ4, DLASQ5, DLASQ6
*     ..
*     .. External Function ..
      DOUBLE PRECISION   DLAMCH
      LOGICAL            DISNAN
      EXTERNAL           DISNAN, DLAMCH
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          ABS, MAX, MIN, SQRT
*     ..
*     .. Executable Statements ..
*
*     Remember the incoming N0 and set up the deflation tolerances:
*     TOL is 100 times DLAMCH('Precision'), TOLSQ is its square.
*
      N0ORIG = N0
      PREC = DLAMCH( 'Precision' )
      TOL = PREC*HUNDRD
      TOLSQ = TOL**2
*
*     ---------------- Deflation loop ----------------
*
   10 CONTINUE
*
*     Nothing left in the segment: done.
      IF( N0.LT.I0 ) RETURN
*     A single entry is accepted unconditionally.
      IF( N0.EQ.I0 ) GO TO 20
      NN = 4*N0 + PP
*     Exactly two entries: go straight to the 2-by-2 treatment.
      IF( N0.EQ.( I0+1 ) ) GO TO 40
*
*     Is E(N0-1) negligible (one eigenvalue)?  If both quantities
*     are still above threshold, move on to the E(N0-2) test.
*
      IF( Z( NN-5 ).GT.TOLSQ*( SIGMA+Z( NN-3 ) ) .AND.
     $    Z( NN-2*PP-4 ).GT.TOLSQ*Z( NN-7 ) ) GO TO 30
*
*     Deflate one value: store it with SIGMA added back.
*
   20 CONTINUE
      Z( 4*N0-3 ) = Z( 4*N0+PP-3 ) + SIGMA
      N0 = N0 - 1
      GO TO 10
*
*     Is E(N0-2) negligible (two eigenvalues)?  If not, no
*     deflation is possible and the shift phase starts.
*
   30 CONTINUE
      IF( Z( NN-9 ).GT.TOLSQ*SIGMA .AND.
     $    Z( NN-2*PP-8 ).GT.TOLSQ*Z( NN-11 ) ) GO TO 50
*
*     Deflate two values from the trailing 2-by-2 block.
*
   40 CONTINUE
      KQ1 = NN - 7
      KE1 = NN - 5
      KQ2 = NN - 3
*
*     Order the pair so that Z(KQ1) >= Z(KQ2).
      IF( Z( KQ2 ).GT.Z( KQ1 ) ) THEN
         SVAL = Z( KQ2 )
         Z( KQ2 ) = Z( KQ1 )
         Z( KQ1 ) = SVAL
      END IF
      TVAL = HALF*( ( Z( KQ1 )-Z( KQ2 ) )+Z( KE1 ) )
*
*     Only refine the pair when the coupling Z(KE1) is significant
*     relative to Z(KQ2) and TVAL can be used as a divisor.
      IF( Z( KE1 ).GT.Z( KQ2 )*TOLSQ .AND. TVAL.NE.ZERO ) THEN
         SVAL = Z( KQ2 )*( Z( KE1 ) / TVAL )
         IF( SVAL.LE.TVAL ) THEN
            SVAL = Z( KQ2 )*( Z( KE1 ) /
     $             ( TVAL*( ONE+SQRT( ONE+SVAL / TVAL ) ) ) )
         ELSE
            SVAL = Z( KQ2 )*( Z( KE1 ) /
     $             ( TVAL+SQRT( TVAL )*SQRT( TVAL+SVAL ) ) )
         END IF
         TVAL = Z( KQ1 ) + ( SVAL+Z( KE1 ) )
         Z( KQ2 ) = Z( KQ2 )*( Z( KQ1 ) / TVAL )
         Z( KQ1 ) = TVAL
      END IF
      Z( 4*N0-7 ) = Z( KQ1 ) + SIGMA
      Z( 4*N0-3 ) = Z( KQ2 ) + SIGMA
      N0 = N0 - 2
      GO TO 10
*
*     ---------------- No further deflation ----------------
*
   50 CONTINUE
*     PP = 2 is a one-shot marker on entry; continue as PP = 0.
      IF( PP.EQ.2 ) PP = 0
*
*     Reverse the qd array when the previous DMIN was not positive
*     or something was deflated in this call, and the bottom entry
*     exceeds CBIAS times the top entry.
*
      IF( DMIN.LE.ZERO .OR. N0.LT.N0ORIG ) THEN
         JF = 4*I0 + PP
         JL = 4*N0 + PP
         IF( CBIAS*Z( JF-3 ).LT.Z( JL-3 ) ) THEN
            MF = 4*I0 - PP
            ML = 4*N0 - PP
            KSUM = 4*( I0+N0 )
*
*           Exchange each group of four entries with its mirror
*           image; KMIR is the mirrored base index for K4.
            DO K4 = 4*I0, 2*( I0+N0-1 ), 4
               KMIR = KSUM - K4
               SWAP = Z( K4-3 )
               Z( K4-3 ) = Z( KMIR-3 )
               Z( KMIR-3 ) = SWAP
               SWAP = Z( K4-2 )
               Z( K4-2 ) = Z( KMIR-2 )
               Z( KMIR-2 ) = SWAP
               SWAP = Z( K4-1 )
               Z( K4-1 ) = Z( KMIR-5 )
               Z( KMIR-5 ) = SWAP
               SWAP = Z( K4 )
               Z( K4 ) = Z( KMIR-4 )
               Z( KMIR-4 ) = SWAP
            END DO
*
*           Short segments: copy the leading entries to the bottom.
            IF( N0-I0.LE.4 ) THEN
               Z( JL-1 ) = Z( JF-1 )
               Z( ML ) = Z( MF )
            END IF
            DMIN2 = MIN( DMIN2, Z( JL-1 ) )
            Z( JL-1 ) = MIN( Z( JL-1 ), Z( JF-1 ), Z( JF+3 ) )
            Z( ML ) = MIN( Z( ML ), Z( MF ), Z( MF+4 ) )
            QMAX = MAX( QMAX, Z( JF-3 ), Z( JF+1 ) )
            DMIN = -ZERO
         END IF
      END IF
*
*     ---------------- Shift selection ----------------
*
      CALL DLASQ4( I0, N0, Z, PP, N0ORIG, DMIN, DMIN1, DMIN2, DN,
     $             DN1, DN2, TAU, TTYPE, G )
*
*     ---------------- dqds step, repeated until DMIN > 0 ----------
*
   70 CONTINUE
*
      CALL DLASQ5( I0, N0, Z, PP, TAU, SIGMA, DMIN, DMIN1, DMIN2, DN,
     $             DN1, DN2, IEEE, PREC )
*
      NDIV = NDIV + ( N0-I0+2 )
      ITER = ITER + 1
*
*     Success: both minima are non-negative.
*
      IF( DMIN.GE.ZERO .AND. DMIN1.GE.ZERO ) GO TO 90
*
*     Convergence hidden by a negative DN: zero the small entry,
*     reset DMIN and accept the step.
*
      IF( DMIN.LT.ZERO .AND. DMIN1.GT.ZERO .AND.
     $    Z( 4*( N0-1 )-PP ).LT.TOL*( SIGMA+DN1 ) .AND.
     $    ABS( DN ).LT.TOL*SIGMA ) THEN
         Z( 4*( N0-1 )-PP+2 ) = ZERO
         DMIN = ZERO
         GO TO 90
      END IF
*
*     TAU was too big: count the failure, pick a new TAU, retry.
*
      IF( DMIN.LT.ZERO ) THEN
         NFAIL = NFAIL + 1
         IF( TTYPE.LT.-22 ) THEN
*           Failed twice already: fall back to a zero shift.
            TAU = ZERO
         ELSE IF( DMIN1.GT.ZERO ) THEN
*           Late failure: TAU+DMIN, scaled down slightly.
            TAU = ( TAU+DMIN )*( ONE-TWO*PREC )
            TTYPE = TTYPE - 11
         ELSE
*           Early failure: quarter the shift.
            TAU = QURTR*TAU
            TTYPE = TTYPE - 12
         END IF
         GO TO 70
      END IF
*
*     DMIN is NaN: retry once with a zero shift; if the shift was
*     already zero, fall through to the DLASQ6 step below.
*
      IF( DISNAN( DMIN ) ) THEN
         IF( TAU.NE.ZERO ) THEN
            TAU = ZERO
            GO TO 70
         END IF
      END IF
*
*     Risk of underflow (also reached when none of the cases above
*     applied): take a DLASQ6 step and record a zero shift.
*
      CALL DLASQ6( I0, N0, Z, PP, DMIN, DMIN1, DMIN2, DN, DN1, DN2 )
      NDIV = NDIV + ( N0-I0+2 )
      ITER = ITER + 1
      TAU = ZERO
*
*     ---------------- Accumulate the shift ----------------
*
*     Add TAU to SIGMA, keeping the rounding remainder in DESIG.
*     The smaller of TAU and SIGMA is the one folded into DESIG.
*
   90 CONTINUE
      IF( TAU.LT.SIGMA ) THEN
         DESIG = DESIG + TAU
         TVAL = SIGMA + DESIG
         DESIG = DESIG - ( TVAL-SIGMA )
      ELSE
         TVAL = SIGMA + TAU
         DESIG = SIGMA - ( TVAL-TAU ) + DESIG
      END IF
      SIGMA = TVAL
*
      RETURN
*
*     End of DLASQ3
*
      END