*  d0/d61/pdlltdriver_8f_source.html

      PROGRAM pdlltdriver

*

*  -- ScaLAPACK testing driver (version 1.7) --

*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,

*     and University of California, Berkeley.

*     May 1, 1997

*

*  Purpose

*  =======

*

*  PDLLTDRIVER is the main test program for the DOUBLE PRECISION

*  ScaLAPACK Cholesky routines.  This test driver performs an

*  A = L*L**T or A = U**T*U factorization and solve, and optionally

*  performs condition estimation and iterative refinement.

*

*  The program must be driven by a short data file.  An annotated

*  example of a data file can be obtained by deleting the first 3

*  characters from the following 18 lines:

*  'ScaLAPACK LLt factorization input file'

*  'Intel iPSC/860 hypercube, gamma model.'

*  'LLT.out'            output file name (if any)

*  6                    device out

*  'U'                  define Lower or Upper

*  1                    number of problem sizes

*  31 100 200           values of N

*  1                    number of NB's

*  2 10 24              values of NB

*  1                    number of NRHS's

*  1                    values of NRHS

*  1                    Number of NBRHS's

*  1                    values of NBRHS

*  1                    number of process grids (ordered pairs of P & Q)

*  2                    values of P

*  2                    values of Q

*  1.0                  threshold

*  T                    (T or F) Test Cond. Est. and Iter. Ref. Routines

*

*

*  Internal Parameters

*  ===================

*

*  TOTMEM   INTEGER, default = 2000000

*           TOTMEM is a machine-specific parameter indicating the

*           maximum amount of available memory in bytes.

*           The user should customize TOTMEM to his platform.  Remember

*           to leave room in memory for the operating system, the BLACS

*           buffer, etc.  For example, on a system with 8 MB of memory

*           per process (e.g., one processor on an Intel iPSC/860), the

*           parameters we use are TOTMEM=6200000 (leaving 1.8 MB for OS,

*           code, BLACS buffer, etc).  However, for PVM, we usually set

*           TOTMEM = 2000000.  Some experimenting with the maximum value

*           of TOTMEM may be required.

*

*  INTGSZ   INTEGER, default = 4 bytes.

*  DBLESZ   INTEGER, default = 8 bytes.

*           INTGSZ and DBLESZ indicate the length in bytes on the

*           given platform for an integer and a double precision real.

*  MEM      DOUBLE PRECISION array, dimension ( TOTMEM / DBLESZ )

*

*           All arrays used by SCALAPACK routines are allocated from

*           this array and referenced by pointers.  The integer IPA,

*           for example, is a pointer to the starting element of MEM for

*           the matrix A.

*

*  =====================================================================

*

*     .. Parameters ..

      INTEGER            block_cyclic_2d, csrc_, ctxt_, dlen_, dtype_,

     $                   lld_, mb_, m_, nb_, n_, rsrc_

      parameter( block_cyclic_2d = 1, dlen_ = 9, dtype_ = 1,

     $                     ctxt_ = 2, m_ = 3, n_ = 4, mb_ = 5, nb_ = 6,

     $                     rsrc_ = 7, csrc_ = 8, lld_ = 9 )

      INTEGER            dblesz, intgsz, memsiz, ntests, totmem

      DOUBLE PRECISION   padval, zero

      parameter( dblesz = 8, intgsz = 4, totmem = 2000000,

     $                     memsiz = totmem / dblesz, ntests = 20,

     $                     padval = -9923.0d+0, zero = 0.0d+0 )

*     ..

*     .. Local Scalars ..

      LOGICAL            check, est

      CHARACTER          uplo

      CHARACTER*6        passed

      CHARACTER*80       outfile

      INTEGER            hh, i, iam, iaseed, ibseed, ictxt, imidpad,

     $                   info, ipa, ipa0, ipb, ipb0, ipberr, ipferr,

     $                   iprepad, ipostpad, ipw, ipw2, itemp, j, k,

     $                   kfail, kk, kpass, kskip, ktests, lcm, lcmq,

     $                   liwork, lwork, lw2, mycol, myrhs, myrow, n, nb,

     $                   nbrhs, ngrids, nmat, nnb, nnbr, nnr, nout, np,

     $                   npcol, nprocs, nprow, nq, nrhs, worksiz

      REAL               thresh

      DOUBLE PRECISION   anorm, anorm1, fresid, nops, rcond,

     $                   sresid, sresid2, tmflops

*     ..

*     .. Local Arrays ..

      INTEGER            desca( dlen_ ), descb( dlen_ ), ierr( 1 ),

     $                   nbrval( ntests ), nbval( ntests ),

     $                   nrval( ntests ), nval( ntests ),

     $                   pval( ntests ), qval( ntests )

      DOUBLE PRECISION   ctime( 2 ), mem( memsiz ), wtime( 2 )

*     ..

*     .. External Subroutines ..

      EXTERNAL           blacs_barrier, blacs_exit, blacs_gridexit,

     $                   blacs_gridinfo, blacs_gridinit, descinit,

     $                   igsum2d, blacs_pinfo, pdchekpad, pdfillpad,

     $                   pdlafchk, pdlaschk, pdlltinfo,

     $                   pdmatgen, pdpocon, pdporfs,

     $                   pdpotrf, pdpotrrv, pdpotrs, slboot,

     $                   slcombine, sltimer

*     ..

*     .. External Functions ..

      LOGICAL            lsame

      INTEGER            iceil, ilcm, numroc

      DOUBLE PRECISION   pdlansy

      EXTERNAL           iceil, ilcm, lsame, numroc, pdlansy

*     ..

*     .. Intrinsic Functions ..

      INTRINSIC          dble, max, min

*     ..

*     .. Data Statements ..

      DATA               kfail, kpass, kskip, ktests / 4*0 /

*     ..

*     .. Executable Statements ..

*

*     Get starting information

*

      CALL blacs_pinfo( iam, nprocs )

      iaseed = 100

      ibseed = 200

      CALL pdlltinfo( outfile, nout, uplo, nmat, nval, ntests, nnb,

     $                nbval, ntests, nnr, nrval, ntests, nnbr, nbrval,

     $                ntests, ngrids, pval, ntests, qval, ntests,

     $                thresh, est, mem, iam, nprocs )

      check = ( thresh.GE.0.0e+0 )

*

*     Print headings

*

      IF( iam.EQ.0 ) THEN

         WRITE( nout, fmt = * )

         WRITE( nout, fmt = 9995 )

         WRITE( nout, fmt = 9994 )

         WRITE( nout, fmt = * )

      END IF

*

*     Loop over different process grids

*

      DO 50 i = 1, ngrids

*

         nprow = pval( i )

         npcol = qval( i )

*

*        Make sure grid information is correct

*

         ierr( 1 ) = 0

         IF( nprow.LT.1 ) THEN

            IF( iam.EQ.0 )

     $         WRITE( nout, fmt = 9999 ) 'GRID', 'nprow', nprow

            ierr( 1 ) = 1

         ELSE IF( npcol.LT.1 ) THEN

            IF( iam.EQ.0 )

     $         WRITE( nout, fmt = 9999 ) 'GRID', 'npcol', npcol

            ierr( 1 ) = 1

         ELSE IF( nprow*npcol.GT.nprocs ) THEN

            IF( iam.EQ.0 )

     $         WRITE( nout, fmt = 9998 ) nprow*npcol, nprocs

            ierr( 1 ) = 1

         END IF

*

         IF( ierr( 1 ).GT.0 ) THEN

            IF( iam.EQ.0 )

     $         WRITE( nout, fmt = 9997 ) 'grid'

            kskip = kskip + 1

            GO TO 50

         END IF

*

*        Define process grid

*

         CALL blacs_get( -1, 0, ictxt )

         CALL blacs_gridinit( ictxt, 'Row-major', nprow, npcol )

         CALL blacs_gridinfo( ictxt, nprow, npcol, myrow, mycol )

*

*        Go to bottom of process grid loop if this case doesn't use my

*        process

*

         IF( myrow.GE.nprow .OR. mycol.GE.npcol )

     $      GO TO 50

*

         DO 40 j = 1, nmat

*

            n = nval( j )

*

*           Make sure matrix information is correct

*

            ierr( 1 ) = 0

            IF( n.LT.1 ) THEN

               IF( iam.EQ.0 )

     $            WRITE( nout, fmt = 9999 ) 'MATRIX', 'N', n

               ierr( 1 ) = 1

            ELSE IF( n.LT.1 ) THEN

               IF( iam.EQ.0 )

     $            WRITE( nout, fmt = 9999 ) 'MATRIX', 'N', n

               ierr( 1 ) = 1

            END IF

*

*           Check all processes for an error

*

            CALL igsum2d( ictxt, 'All', ' ', 1, 1, ierr, 1, -1, 0 )

*

            IF( ierr( 1 ).GT.0 ) THEN

               IF( iam.EQ.0 )

     $            WRITE( nout, fmt = 9997 ) 'matrix'

               kskip = kskip + 1

               GO TO 40

            END IF

*

            DO 30 k = 1, nnb

*

               nb = nbval( k )

*

*              Make sure nb is legal

*

               ierr( 1 ) = 0

               IF( nb.LT.1 ) THEN

                  ierr( 1 ) = 1

                  IF( iam.EQ.0 )

     $               WRITE( nout, fmt = 9999 ) 'NB', 'NB', nb

               END IF

*

*              Check all processes for an error

*

               CALL igsum2d( ictxt, 'All', ' ', 1, 1, ierr, 1, -1, 0 )

*

               IF( ierr( 1 ).GT.0 ) THEN

                  IF( iam.EQ.0 )

     $               WRITE( nout, fmt = 9997 ) 'NB'

                  kskip = kskip + 1

                  GO TO 30

               END IF

*

*              Padding constants

*

               np = numroc( n, nb, myrow, 0, nprow )

               nq = numroc( n, nb, mycol, 0, npcol )

               IF( check ) THEN

                  iprepad  = max( nb, np )

                  imidpad  = nb

                  ipostpad = max( nb, nq )

               ELSE

                  iprepad  = 0

                  imidpad  = 0

                  ipostpad = 0

               END IF

*

*              Initialize the array descriptor for the matrix A

*

               CALL descinit( desca, n, n, nb, nb, 0, 0, ictxt,

     $                        max( 1, np )+imidpad, ierr( 1 ) )

*

*              Check all processes for an error

*

               CALL igsum2d( ictxt, 'All', ' ', 1, 1, ierr, 1, -1, 0 )

*

               IF( ierr( 1 ).LT.0 ) THEN

                  IF( iam.EQ.0 )

     $               WRITE( nout, fmt = 9997 ) 'descriptor'

                  kskip = kskip + 1

                  GO TO 30

               END IF

*

*              Assign pointers into MEM for SCALAPACK arrays, A is

*              allocated starting at position MEM( IPREPAD+1 )

*

               ipa = iprepad+1

               IF( est ) THEN

                  ipa0 = ipa + desca( lld_ )*nq + ipostpad + iprepad

                  ipw = ipa0 + desca( lld_ )*nq + ipostpad + iprepad

               ELSE

                  ipw = ipa + desca( lld_ )*nq + ipostpad + iprepad

               END IF

*

*

               IF( check ) THEN

*

*                 Calculate the amount of workspace required by

*                 the checking routines PDLAFCHK, PDPOTRRV, and

*                 PDLANSY

*

                  worksiz = np * desca( nb_ )

*

                  worksiz = max( worksiz, desca( mb_ ) * desca( nb_ ) )

*

                  lcm = ilcm( nprow, npcol )

                  itemp = max( 2, 2 * nq ) + np

                  IF( nprow.NE.npcol ) THEN

                     itemp = itemp +

     $                       nb * iceil( iceil( np, nb ), lcm / nprow )

                  END IF

                  worksiz = max( worksiz, itemp )

                  worksiz = worksiz + ipostpad

*

               ELSE

*

                  worksiz = ipostpad

*

               END IF

*

*              Check for adequate memory for problem size

*

               ierr( 1 ) = 0

               IF( ipw+worksiz.GT.memsiz ) THEN

                  IF( iam.EQ.0 )

     $               WRITE( nout, fmt = 9996 ) 'factorization',

     $               ( ipw+worksiz )*dblesz

                  ierr( 1 ) = 1

               END IF

*

*              Check all processes for an error

*

               CALL igsum2d( ictxt, 'All', ' ', 1, 1, ierr, 1, -1, 0 )

*

               IF( ierr( 1 ).GT.0 ) THEN

                  IF( iam.EQ.0 )

     $               WRITE( nout, fmt = 9997 ) 'MEMORY'

                  kskip = kskip + 1

                  GO TO 30

               END IF

*

*              Generate a symmetric positive definite matrix A

*

               CALL pdmatgen( ictxt, 'Symm', 'Diag', desca( m_ ),

     $                        desca( n_ ), desca( mb_ ), desca( nb_ ),

     $                        mem( ipa ), desca( lld_ ), desca( rsrc_ ),

     $                        desca( csrc_ ), iaseed, 0, np, 0, nq,

     $                        myrow, mycol, nprow, npcol )

*

*              Calculate inf-norm and 1-norm of A: ANORM is used for

*              residual checking, ANORM1 for condition estimation

*

               IF( check ) THEN

                  CALL pdfillpad( ictxt, np, nq, mem( ipa-iprepad ),

     $                             desca( lld_ ), iprepad, ipostpad,

     $                             padval )

                  CALL pdfillpad( ictxt, worksiz-ipostpad, 1,

     $                             mem( ipw-iprepad ), worksiz-ipostpad,

     $                             iprepad, ipostpad, padval )

                  anorm = pdlansy( 'I', uplo, n, mem( ipa ), 1, 1,

     $                             desca, mem( ipw ) )

                  anorm1 = pdlansy( '1', uplo, n, mem( ipa ), 1, 1,

     $                             desca, mem( ipw ) )

                  CALL pdchekpad( ictxt, 'PDLANSY', np, nq,

     $                            mem( ipa-iprepad ), desca( lld_ ),

     $                            iprepad, ipostpad, padval )

                  CALL pdchekpad( ictxt, 'PDLANSY',

     $                            worksiz-ipostpad, 1,

     $                            mem( ipw-iprepad ), worksiz-ipostpad,

     $                            iprepad, ipostpad, padval )

               END IF

*

               IF( est ) THEN

                  CALL pdmatgen( ictxt, 'Symm', 'Diag', desca( m_ ),

     $                           desca( n_ ), desca( mb_ ),

     $                           desca( nb_ ), mem( ipa0 ),

     $                           desca( lld_ ), desca( rsrc_ ),

     $                           desca( csrc_ ), iaseed, 0, np, 0, nq,

     $                           myrow, mycol, nprow, npcol )

                  IF( check )

     $               CALL pdfillpad( ictxt, np, nq,

     $                               mem( ipa0-iprepad ), desca( lld_ ),

     $                               iprepad, ipostpad, padval )

               END IF

*

               CALL slboot()

               CALL blacs_barrier( ictxt, 'All' )

*

*              Perform LLt factorization

*

               CALL sltimer( 1 )

*

               CALL pdpotrf( uplo, n, mem( ipa ), 1, 1, desca, info )

*

               CALL sltimer( 1 )

*

               IF( info.NE.0 ) THEN

                  IF( iam.EQ.0 )

     $               WRITE( nout, fmt = * ) 'PDPOTRF INFO=', info

                  kfail = kfail + 1

                  rcond = zero

                  GO TO 60

               END IF

*

               IF( check ) THEN

*

*                 Check for memory overwrite in LLt factorization

*

                  CALL pdchekpad( ictxt, 'PDPOTRF', np, nq,

     $                            mem( ipa-iprepad ), desca( lld_ ),

     $                            iprepad, ipostpad, padval )

               END IF

*

               IF( est ) THEN

*

*                 Calculate workspace required for PDPOCON

*

                  lwork = max( 1, 2*np ) + max( 1, 2*nq ) +

     $                    max( 2, desca( nb_ )*

     $                    max( 1, iceil( nprow-1, npcol ) ),

     $                    nq + desca( nb_ )*

     $                    max( 1, iceil( npcol-1, nprow ) ) )

                  ipw2  = ipw + lwork + ipostpad + iprepad

                  liwork = max( 1, np )

                  lw2 = iceil( liwork*intgsz, dblesz ) + ipostpad

*

                  ierr( 1 ) = 0

                  IF( ipw2+lw2.GT.memsiz ) THEN

                     IF( iam.EQ.0 )

     $                  WRITE( nout, fmt = 9996 )'cond est',

     $                  ( ipw2+lw2 )*dblesz

                     ierr( 1 ) = 1

                  END IF

*

*                 Check all processes for an error

*

                  CALL igsum2d( ictxt, 'All', ' ', 1, 1, ierr, 1,

     $                          -1, 0 )

*

                  IF( ierr( 1 ).GT.0 ) THEN

                     IF( iam.EQ.0 )

     $                  WRITE( nout, fmt = 9997 ) 'MEMORY'

                     kskip = kskip + 1

                     GO TO 60

                  END IF

*

                  IF( check ) THEN

                     CALL pdfillpad( ictxt, lwork, 1,

     $                               mem( ipw-iprepad ), lwork,

     $                               iprepad, ipostpad, padval )

                     CALL pdfillpad( ictxt, lw2-ipostpad, 1,

     $                               mem( ipw2-iprepad ),

     $                               lw2-ipostpad, iprepad,

     $                               ipostpad, padval )

                  END IF

*

*                 Compute condition number of the matrix

*

                  CALL pdpocon( uplo, n, mem( ipa ), 1, 1, desca,

     $                          anorm1, rcond, mem( ipw ), lwork,

     $                          mem( ipw2 ), liwork, info )

*

                  IF( check ) THEN

                     CALL pdchekpad( ictxt, 'PDPOCON', np, nq,

     $                               mem( ipa-iprepad ), desca( lld_ ),

     $                               iprepad, ipostpad, padval )

                     CALL pdchekpad( ictxt, 'PDPOCON',

     $                               lwork, 1, mem( ipw-iprepad ),

     $                               lwork, iprepad, ipostpad,

     $                               padval )

                     CALL pdchekpad( ictxt, 'PDPOCON',

     $                               lw2-ipostpad, 1,

     $                               mem( ipw2-iprepad ), lw2-ipostpad,

     $                               iprepad, ipostpad, padval )

                  END IF

               END IF

*

*              Loop over the different values for NRHS

*

               DO 20 hh = 1, nnr

*

                  nrhs = nrval( hh )

*

                  DO 10 kk = 1, nnbr

*

                     nbrhs = nbrval( kk )

*

*                    Initialize Array Descriptor for rhs

*

                     CALL descinit( descb, n, nrhs, nb, nbrhs, 0, 0,

     $                              ictxt, max( 1, np )+imidpad,

     $                              ierr( 1 ) )

*

*                    move IPW to allow room for RHS

*

                     myrhs = numroc( descb( n_ ), descb( nb_ ), mycol,

     $                               descb( csrc_ ), npcol )

                     ipb = ipw

*

                     IF( est ) THEN

                        ipb0 = ipb +  descb( lld_ )*myrhs + ipostpad +

     $                           iprepad

                        ipferr = ipb0 +  descb( lld_ )*myrhs + ipostpad

     $                           + iprepad

                        ipberr = myrhs + ipferr + ipostpad + iprepad

                        ipw = myrhs + ipberr + ipostpad + iprepad

                     ELSE

                        ipw = ipb +  descb( lld_ )*myrhs + ipostpad +

     $                        iprepad

                     END IF

*

                     IF( check ) THEN

*

*                       Calculate the amount of workspace required by

*                       the checking routine PDLASCHK

*

                        lcmq = lcm / npcol

                        worksiz = max( worksiz-ipostpad,

     $                    nq * nbrhs + np * nbrhs +

     $                    max( max( nq*nb, 2*nbrhs ),

     $                    nbrhs * numroc( numroc(n,nb,0,0,npcol),nb,

     $                    0,0,lcmq ) ) )

                        worksiz = ipostpad + worksiz

                     ELSE

                        worksiz = ipostpad

                     END IF

*

                     ierr( 1 ) = 0

                     IF( ipw+worksiz.GT.memsiz ) THEN

                        IF( iam.EQ.0 )

     $                     WRITE( nout, fmt = 9996 )'solve',

     $                            ( ipw+worksiz )*dblesz

                        ierr( 1 ) = 1

                     END IF

*

*                    Check all processes for an error

*

                     CALL igsum2d( ictxt, 'All', ' ', 1, 1, ierr, 1,

     $                             -1, 0 )

*

                     IF( ierr( 1 ).GT.0 ) THEN

                        IF( iam.EQ.0 )

     $                     WRITE( nout, fmt = 9997 ) 'MEMORY'

                        kskip = kskip + 1

                        GO TO 10

                     END IF

*

*                    Generate RHS

*

                     CALL pdmatgen( ictxt, 'No', 'No', descb( m_ ),

     $                              descb( n_ ), descb( mb_ ),

     $                              descb( nb_ ), mem( ipb ),

     $                              descb( lld_ ), descb( rsrc_ ),

     $                              descb( csrc_ ), ibseed, 0, np, 0,

     $                              myrhs, myrow, mycol, nprow, npcol )

*

                     IF( check )

     $                  CALL pdfillpad( ictxt, np, myrhs,

     $                                  mem( ipb-iprepad ),

     $                                  descb( lld_ ),

     $                                  iprepad, ipostpad, padval )

*

                     IF( est ) THEN

                        CALL pdmatgen( ictxt, 'No', 'No', descb( m_ ),

     $                                 descb( n_ ), descb( mb_ ),

     $                                 descb( nb_ ), mem( ipb0 ),

     $                                 descb( lld_ ), descb( rsrc_ ),

     $                                 descb( csrc_ ), ibseed, 0, np, 0,

     $                                 myrhs, myrow, mycol, nprow,

     $                                 npcol )

*

                        IF( check ) THEN

                           CALL pdfillpad( ictxt, np, myrhs,

     $                                     mem( ipb0-iprepad ),

     $                                     descb( lld_ ), iprepad,

     $                                     ipostpad, padval )

                           CALL pdfillpad( ictxt, 1, myrhs,

     $                                     mem( ipferr-iprepad ), 1,

     $                                     iprepad, ipostpad,

     $                                     padval )

                           CALL pdfillpad( ictxt, 1, myrhs,

     $                                     mem( ipberr-iprepad ), 1,

     $                                     iprepad, ipostpad,

     $                                     padval )

                        END IF

                     END IF

*

                     CALL blacs_barrier( ictxt, 'All' )

                     CALL sltimer( 2 )

*

*                    Solve linear system via Cholesky factorization

*

                     CALL pdpotrs( uplo, n, nrhs, mem( ipa ), 1, 1,

     $                             desca, mem( ipb ), 1, 1, descb,

     $                             info )

*

                     CALL sltimer( 2 )

*

                     IF( check ) THEN

*

*                       check for memory overwrite

*

                        CALL pdchekpad( ictxt, 'PDPOTRS', np, nq,

     $                                  mem( ipa-iprepad ),

     $                                  desca( lld_ ),

     $                                  iprepad, ipostpad, padval )

                        CALL pdchekpad( ictxt, 'PDPOTRS', np,

     $                                  myrhs, mem( ipb-iprepad ),

     $                                  descb( lld_ ), iprepad,

     $                                  ipostpad, padval )

*

                        CALL pdfillpad( ictxt, worksiz-ipostpad, 1,

     $                                  mem( ipw-iprepad ),

     $                                  worksiz-ipostpad, iprepad,

     $                                  ipostpad, padval )

*

*                       check the solution to rhs

*

                        CALL pdlaschk( 'Symm', 'Diag', n, nrhs,

     $                                 mem( ipb ), 1, 1, descb,

     $                                 iaseed, 1, 1, desca, ibseed,

     $                                 anorm, sresid, mem( ipw ) )

*

                        IF( iam.EQ.0 .AND. sresid.GT.thresh )

     $                        WRITE( nout, fmt = 9985 ) sresid

*

*                       check for memory overwrite

*

                        CALL pdchekpad( ictxt, 'PDLASCHK', np,

     $                                  myrhs, mem( ipb-iprepad ),

     $                                  descb( lld_ ), iprepad,

     $                                  ipostpad, padval )

                        CALL pdchekpad( ictxt, 'PDLASCHK',

     $                                  worksiz-ipostpad, 1,

     $                                  mem( ipw-iprepad ),

     $                                  worksiz-ipostpad, iprepad,

     $                                  ipostpad, padval )

*

*                       The second test is a NaN trap

*

                        IF( ( sresid.LE.thresh          ).AND.

     $                      ( (sresid-sresid).EQ.0.0d+0 ) ) THEN

                           kpass = kpass + 1

                           passed = 'PASSED'

                        ELSE

                           kfail = kfail + 1

                           passed = 'FAILED'

                        END IF

                     ELSE

                        kpass = kpass + 1

                        sresid = sresid - sresid

                        passed = 'BYPASS'

                     END IF

*

                     IF( est ) THEN

*

*                       Calculate workspace required for PDPORFS

*

                           lwork = max( 1, 3*np )

                           ipw2  = ipw + lwork + ipostpad + iprepad

                           liwork = max( 1, np )

                           lw2 = iceil( liwork*intgsz, dblesz ) +

     $                           ipostpad

*

                           ierr( 1 ) = 0

                           IF( ipw2+lw2.GT.memsiz ) THEN

                              IF( iam.EQ.0 )

     $                           WRITE( nout, fmt = 9996 )

     $                           'iter ref', ( ipw2+lw2 )*dblesz

                              ierr( 1 ) = 1

                           END IF

*

*                          Check all processes for an error

*

                           CALL igsum2d( ictxt, 'All', ' ', 1, 1, ierr,

     $                                   1, -1, 0 )

*

                           IF( ierr( 1 ).GT.0 ) THEN

                              IF( iam.EQ.0 )

     $                           WRITE( nout, fmt = 9997 )

     $                           'MEMORY'

                              kskip = kskip + 1

                              GO TO 10

                           END IF

*

                           IF( check ) THEN

                              CALL pdfillpad( ictxt, lwork, 1,

     $                                        mem( ipw-iprepad ),

     $                                        lwork, iprepad, ipostpad,

     $                                        padval )

                              CALL pdfillpad( ictxt, lw2-ipostpad,

     $                                        1, mem( ipw2-iprepad ),

     $                                        lw2-ipostpad,

     $                                        iprepad, ipostpad,

     $                                        padval )

                           END IF

*

*                          Use iterative refinement to improve the

*                          computed solution

*

                           CALL pdporfs( uplo, n, nrhs, mem( ipa0 ),

     $                                   1, 1, desca, mem( ipa ), 1, 1,

     $                                   desca, mem( ipb0 ), 1, 1,

     $                                   descb, mem( ipb ), 1, 1, descb,

     $                                   mem( ipferr ), mem( ipberr ),

     $                                   mem( ipw ), lwork, mem( ipw2 ),

     $                                   liwork, info )

*

*                          check for memory overwrite

*

                           IF( check ) THEN

                              CALL pdchekpad( ictxt, 'PDPORFS', np,

     $                                        nq, mem( ipa0-iprepad ),

     $                                        desca( lld_ ), iprepad,

     $                                        ipostpad, padval )

                              CALL pdchekpad( ictxt, 'PDPORFS', np,

     $                                        nq, mem( ipa-iprepad ),

     $                                        desca( lld_ ), iprepad,

     $                                        ipostpad, padval )

                              CALL pdchekpad( ictxt, 'PDPORFS', np,

     $                                        myrhs, mem( ipb-iprepad ),

     $                                        descb( lld_ ), iprepad,

     $                                        ipostpad, padval )

                              CALL pdchekpad( ictxt, 'PDPORFS', np,

     $                                        myrhs,

     $                                        mem( ipb0-iprepad ),

     $                                        descb( lld_ ), iprepad,

     $                                        ipostpad, padval )

                              CALL pdchekpad( ictxt, 'PDPORFS', 1,

     $                                        myrhs,

     $                                        mem( ipferr-iprepad ), 1,

     $                                        iprepad, ipostpad,

     $                                        padval )

                              CALL pdchekpad( ictxt, 'PDPORFS', 1,

     $                                        myrhs,

     $                                        mem( ipberr-iprepad ), 1,

     $                                        iprepad, ipostpad,

     $                                        padval )

                              CALL pdchekpad( ictxt, 'PDPORFS', lwork,

     $                                        1, mem( ipw-iprepad ),

     $                                        lwork, iprepad, ipostpad,

     $                                        padval )

                              CALL pdchekpad( ictxt, 'PDPORFS',

     $                                        lw2-ipostpad, 1,

     $                                        mem( ipw2-iprepad ),

     $                                        lw2-ipostpad,

     $                                        iprepad, ipostpad,

     $                                        padval )

*

                              CALL pdfillpad( ictxt, worksiz-ipostpad,

     $                                        1, mem( ipw-iprepad ),

     $                                        worksiz-ipostpad, iprepad,

     $                                        ipostpad, padval )

*

*                             check the solution to rhs

*

                              CALL pdlaschk( 'Symm', 'Diag', n, nrhs,

     $                                       mem( ipb ), 1, 1, descb,

     $                                       iaseed, 1, 1, desca,

     $                                       ibseed, anorm, sresid2,

     $                                       mem( ipw ) )

*

                              IF( iam.EQ.0 .AND. sresid2.GT.thresh )

     $                           WRITE( nout, fmt = 9985 ) sresid2

*

*                             check for memory overwrite

*

                              CALL pdchekpad( ictxt, 'PDLASCHK', np,

     $                                        myrhs, mem( ipb-iprepad ),

     $                                        descb( lld_ ), iprepad,

     $                                        ipostpad, padval )

                              CALL pdchekpad( ictxt, 'PDLASCHK',

     $                                        worksiz-ipostpad, 1,

     $                                        mem( ipw-iprepad ),

     $                                        worksiz-ipostpad,

     $                                        iprepad, ipostpad,

     $                                        padval )

                        END IF

                     END IF

*

*                    Gather maximum of all CPU and WALL clock timings

*

                     CALL slcombine( ictxt, 'All', '>', 'W', 2, 1,

     $                               wtime )

                     CALL slcombine( ictxt, 'All', '>', 'C', 2, 1,

     $                               ctime )

*

*                    Print results

*

                     IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN

*

*                       1/3 N^3 + 1/2 N^2 flops for LLt factorization

*

                        nops = (dble(n)**3)/3.0d+0 +

     $                         (dble(n)**2)/2.0d+0

*

*                       nrhs * 2 N^2 flops for LLt solve.

*

                        nops = nops + 2.0d+0*(dble(n)**2)*dble(nrhs)

*

*                       Calculate total megaflops -- factorization and

*                       solve -- for WALL and CPU time, and print output

*

*                       Print WALL time if machine supports it

*

                        IF( wtime( 1 ) + wtime( 2 ) .GT. 0.0d+0 ) THEN

                           tmflops = nops /

     $                            ( ( wtime( 1 )+wtime( 2 ) ) * 1.0d+6 )

                        ELSE

                           tmflops = 0.0d+0

                        END IF

*

                        IF( wtime( 2 ).GE.0.0d+0 )

     $                     WRITE( nout, fmt = 9993 ) 'WALL', uplo, n,

     $                            nb, nrhs, nbrhs, nprow, npcol,

     $                            wtime( 1 ), wtime( 2 ), tmflops,

     $                            passed

*

*                       Print CPU time if machine supports it

*

                        IF( ctime( 1 )+ctime( 2 ).GT.0.0d+0 ) THEN

                           tmflops = nops /

     $                            ( ( ctime( 1 )+ctime( 2 ) ) * 1.0d+6 )

                        ELSE

                           tmflops = 0.0d+0

                        END IF

*

                        IF( ctime( 2 ).GE.0.0d+0 )

     $                     WRITE( nout, fmt = 9993 ) 'CPU ', uplo, n,

     $                            nb, nrhs, nbrhs, nprow, npcol,

     $                            ctime( 1 ), ctime( 2 ), tmflops,

     $                            passed

*

                     END IF

   10             CONTINUE

   20          CONTINUE

*

               IF( check .AND. sresid.GT.thresh ) THEN
*
*                 Checking is enabled and the solve residual SRESID
*                 is above THRESH: also report the factorization
*                 residual so the failure can be diagnosed.
*
*                 Compute FRESID = ||A - LL'|| / (||A|| * N * eps)
*
                  CALL pdpotrrv( uplo, n, mem( ipa ), 1, 1, desca,
     $                           mem( ipw ) )
                  CALL pdlafchk( 'Symm', 'Diag', n, n, mem( ipa ), 1, 1,
     $                           desca, iaseed, anorm, fresid,
     $                           mem( ipw ) )
*
*                 Check for memory overwrite in the padding around A
*                 and around the workspace.  Both checks are labelled
*                 'PDPOTRRV' so that an overwrite report names a
*                 routine that was actually called above (the
*                 workspace check used to be labelled 'PDGETRRV',
*                 which is never called in this block).
*
                  CALL pdchekpad( ictxt, 'PDPOTRRV', np, nq,
     $                            mem( ipa-iprepad ), desca( lld_ ),
     $                            iprepad, ipostpad, padval )
                  CALL pdchekpad( ictxt, 'PDPOTRRV',
     $                            worksiz-ipostpad, 1,
     $                            mem( ipw-iprepad ), worksiz-ipostpad,
     $                            iprepad, ipostpad, padval )
*
*                 Only process 0 writes the residual; the text names
*                 the factorization form selected by UPLO.
*
                  IF( iam.EQ.0 ) THEN
                     IF( lsame( uplo, 'L' ) ) THEN
                        WRITE( nout, fmt = 9986 ) 'L*L''', fresid
                     ELSE
                        WRITE( nout, fmt = 9986 ) 'U''*U', fresid
                     END IF
                  END IF
               END IF

*

   30       CONTINUE

   40    CONTINUE

         CALL blacs_gridexit( ictxt )

   50 CONTINUE

*

*     Print ending messages and close output file

*

   60 CONTINUE

      IF( iam.EQ.0 ) THEN

         ktests = kpass + kfail + kskip

         WRITE( nout, fmt = * )

         WRITE( nout, fmt = 9992 ) ktests

         IF( check ) THEN

            WRITE( nout, fmt = 9991 ) kpass

            WRITE( nout, fmt = 9989 ) kfail

         ELSE

            WRITE( nout, fmt = 9990 ) kpass

         END IF

         WRITE( nout, fmt = 9988 ) kskip

         WRITE( nout, fmt = * )

         WRITE( nout, fmt = * )

         WRITE( nout, fmt = 9987 )

         IF( nout.NE.6 .AND. nout.NE.0 )

     $      CLOSE ( nout )

      END IF

*

      CALL blacs_exit( 0 )

*

 9999 FORMAT( 'ILLEGAL ', a6, ': ', a5, ' = ', i3,

     $        '; It should be at least 1' )

 9998 FORMAT( 'ILLEGAL GRID: nprow*npcol = ', i4, '. It can be at most',

     $        i4 )

 9997 FORMAT( 'Bad ', a6, ' parameters: going on to next test case.' )

 9996 FORMAT( 'Unable to perform ', a, ': need TOTMEM of at least',

     $        i11 )

 9995 FORMAT( 'TIME UPLO     N  NB NRHS NBRHS    P    Q LLt Time ',

     $        'Slv Time   MFLOPS CHECK' )

 9994 FORMAT( '---- ---- ----- --- ---- ----- ---- ---- -------- ',

     $        '-------- -------- ------' )

 9993 FORMAT( a4, 4x, a1, 1x, i5, 1x, i3, 1x, i4, 1x, i5, 1x, i4, 1x,

     $        i4, 1x, f8.2, 1x, f8.2, 1x, f8.2, 1x, a6 )

 9992 FORMAT( 'Finished ', i6, ' tests, with the following results:' )

 9991 FORMAT( i5, ' tests completed and passed residual checks.' )

 9990 FORMAT( i5, ' tests completed without checking.' )

 9989 FORMAT( i5, ' tests completed and failed residual checks.' )

 9988 FORMAT( i5, ' tests skipped because of illegal input values.' )

 9987 FORMAT( 'END OF TESTS.' )

 9986 FORMAT( '||A - ', a4, '|| / (||A|| * N * eps) = ', g25.7 )

 9985 FORMAT( '||Ax-b||/(||x||*||A||*eps*N) ', f25.7 )

*

      stop

*

*     End of PDLLTDRIVER

*

      END

pdlafchk
subroutine pdlafchk(aform, diag, m, n, a, ia, ja, desca, iaseed, anorm, fresid, work)
Definition pdlafchk.f:3

pdmatgen
subroutine pdmatgen(ictxt, aform, diag, m, n, mb, nb, a, lda, iarow, iacol, iseed, iroff, irnum, icoff, icnum, myrow, mycol, nprow, npcol)
Definition pdmatgen.f:4

descinit
subroutine descinit(desc, m, n, mb, nb, irsrc, icsrc, ictxt, lld, info)
Definition descinit.f:3

iceil
integer function iceil(inum, idenom)
Definition iceil.f:2

ilcm
integer function ilcm(m, n)
Definition ilcm.f:2

numroc
integer function numroc(n, nb, iproc, isrcproc, nprocs)
Definition numroc.f:2

max
#define max(A, B)
Definition pcgemr.c:180

min
#define min(A, B)
Definition pcgemr.c:181

pdchekpad
subroutine pdchekpad(ictxt, mess, m, n, a, lda, ipre, ipost, chkval)
Definition pdchekpad.f:3

pdfillpad
subroutine pdfillpad(ictxt, m, n, a, lda, ipre, ipost, chkval)
Definition pdfillpad.f:2

pdlansy
double precision function pdlansy(norm, uplo, n, a, ia, ja, desca, work)
Definition pdlansy.f:3

pdlaschk
subroutine pdlaschk(symm, diag, n, nrhs, x, ix, jx, descx, iaseed, ia, ja, desca, ibseed, anorm, resid, work)
Definition pdlaschk.f:4

pdlltdriver
program pdlltdriver
Definition pdlltdriver.f:1

pdlltinfo
subroutine pdlltinfo(summry, nout, uplo, nmat, nval, ldnval, nnb, nbval, ldnbval, nnr, nrval, ldnrval, nnbr, nbrval, ldnbrval, ngrids, pval, ldpval, qval, ldqval, thresh, est, work, iam, nprocs)
Definition pdlltinfo.f:6

pdpocon
subroutine pdpocon(uplo, n, a, ia, ja, desca, anorm, rcond, work, lwork, iwork, liwork, info)
Definition pdpocon.f:3

pdporfs
subroutine pdporfs(uplo, n, nrhs, a, ia, ja, desca, af, iaf, jaf, descaf, b, ib, jb, descb, x, ix, jx, descx, ferr, berr, work, lwork, iwork, liwork, info)
Definition pdporfs.f:4

pdpotrf
subroutine pdpotrf(uplo, n, a, ia, ja, desca, info)
Definition pdpotrf.f:2

pdpotrrv
subroutine pdpotrrv(uplo, n, a, ia, ja, desca, work)
Definition pdpotrrv.f:2

pdpotrs
subroutine pdpotrs(uplo, n, nrhs, a, ia, ja, desca, b, ib, jb, descb, info)
Definition pdpotrs.f:3

slboot
subroutine slboot()
Definition sltimer.f:2

sltimer
subroutine sltimer(i)
Definition sltimer.f:47

slcombine
subroutine slcombine(ictxt, scope, op, timetype, n, ibeg, times)
Definition sltimer.f:267

lsame
logical function lsame(ca, cb)
Definition tools.f:1724