*  d0/d71/pcblas1tst_8f_source.html

      BLOCK DATA
*
*     Initializes the common block /SNAMEC/ with the names of the ten
*     Level 1 PBLAS routines.  Entry K of SNAMES is the name of the
*     routine that the test driver exercises for K = 1, ..., NSUBS.
*
*     .. Parameters ..
      INTEGER            NSUBS
      PARAMETER          ( NSUBS = 10 )
*     ..
*     .. Common Blocks ..
      CHARACTER*7        SNAMES( NSUBS )
      COMMON             /SNAMEC/SNAMES
*     ..
*     .. Data Statements ..
*     One statement per routine keeps index and name side by side.
      DATA               SNAMES( 1 )/'PCSWAP '/
      DATA               SNAMES( 2 )/'PCSCAL '/
      DATA               SNAMES( 3 )/'PCSSCAL'/
      DATA               SNAMES( 4 )/'PCCOPY '/
      DATA               SNAMES( 5 )/'PCAXPY '/
      DATA               SNAMES( 6 )/'PCDOTU '/
      DATA               SNAMES( 7 )/'PCDOTC '/
      DATA               SNAMES( 8 )/'PSCNRM2'/
      DATA               SNAMES( 9 )/'PSCASUM'/
      DATA               SNAMES( 10 )/'PCAMAX'/
*     ..
      END BLOCK DATA


      PROGRAM pcbla1tst
*
*  -- PBLAS testing driver (version 2.0.2) --
*     Univ. of Tennessee, Univ. of California Berkeley, Univ. of Colorado Denver
*     May 1 2012
*
*  Purpose
*  =======
*
*  PCBLA1TST is the main testing program for the PBLAS Level 1 routines.
*
*  The program must be driven by a short data file.  An  annotated exam-
*  ple of a data file can be obtained by deleting the first 3 characters
*  from the following 46 lines:
*  'Level 1 PBLAS, Testing input file'
*  'Intel iPSC/860 hypercube, gamma model.'
*  'PCBLAS1TST.SUMM'            output file name (if any)
*  6       device out
*  F       logical flag, T to stop on failures
*  F       logical flag, T to test error exits
*  0       verbosity, 0 for pass/fail, 1-3 for matrix dump on errors
*  10      the leading dimension gap
*  1       number of process grids (ordered pairs of P & Q)
*  2 2 1 4 2 3 8        values of P
*  2 2 4 1 3 2 1        values of Q
*  (1.0E0, 0.0E0)       value of ALPHA
*  2                    number of tests problems
*  3  4                 values of N
*  6 10                 values of M_X
*  6 10                 values of N_X
*  2  5                 values of IMB_X
*  2  5                 values of INB_X
*  2  5                 values of MB_X
*  2  5                 values of NB_X
*  0  1                 values of RSRC_X
*  0  0                 values of CSRC_X
*  1  1                 values of IX
*  1  1                 values of JX
*  1  1                 values of INCX
*  6 10                 values of M_Y
*  6 10                 values of N_Y
*  2  5                 values of IMB_Y
*  2  5                 values of INB_Y
*  2  5                 values of MB_Y
*  2  5                 values of NB_Y
*  0  1                 values of RSRC_Y
*  0  0                 values of CSRC_Y
*  1  1                 values of IY
*  1  1                 values of JY
*  6  1                 values of INCY
*  PCSWAP  T            put F for no test in the same column
*  PCSCAL  T            put F for no test in the same column
*  PCSSCAL T            put F for no test in the same column
*  PCCOPY  T            put F for no test in the same column
*  PCAXPY  T            put F for no test in the same column
*  PCDOTU  T            put F for no test in the same column
*  PCDOTC  T            put F for no test in the same column
*  PSCNRM2 T            put F for no test in the same column
*  PSCASUM T            put F for no test in the same column
*  PCAMAX  T            put F for no test in the same column
*
*  Internal Parameters
*  ===================
*
*  TOTMEM  INTEGER
*          TOTMEM  is  a machine-specific parameter indicating the maxi-
*          mum  amount  of  available  memory per  process in bytes. The
*          user  should  customize TOTMEM to his  platform.  Remember to
*          leave  room  in  memory  for the  operating system, the BLACS
*          buffer, etc.  For  example,  on  a system with 8 MB of memory
*          per process (e.g., one processor  on an Intel iPSC/860),  the
*          parameters we use are TOTMEM=6200000  (leaving 1.8 MB for OS,
*          code, BLACS buffer, etc).  However,  for PVM,  we usually set
*          TOTMEM = 2000000.  Some experimenting  with the maximum value
*          of TOTMEM may be required. By default, TOTMEM is 2000000.
*
*  REALSZ  INTEGER
*  CPLXSZ  INTEGER
*          REALSZ  and  CPLXSZ indicate the length in bytes on the given
*          platform  for a  single precision real and a single precision
*          complex. By default,  REALSZ is set to four and CPLXSZ is set
*          to eight.
*
*  MEM     COMPLEX array
*          MEM is an array of dimension TOTMEM / CPLXSZ.
*          All arrays used by SCALAPACK routines are allocated from this
*          array MEM and referenced by pointers. The  integer  IPA,  for
*          example, is a pointer to the starting element of MEM for  the
*          matrix A.
*
*  Program flow
*  ============
*
*  For every process grid and every test problem read from the data
*  file, the driver loops over the NSUBS routines named in SNAMES.  For
*  each selected routine it generates the distributed operands X and Y
*  in MEM together with full reference copies, pads the guard zones,
*  calls the routine, and then checks the result, the padding and the
*  input-only arguments.  Per-routine PASSED / FAILED / SKIPPED counts
*  are printed by process 0 at the end.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            maxtests, maxgrids, gapmul, cplxsz, totmem,
     $                   memsiz, nsubs
      REAL               rzero
      COMPLEX            padval, zero
      parameter( maxtests = 20, maxgrids = 20, gapmul = 10,
     $                   cplxsz = 8, totmem = 2000000,
     $                   memsiz = totmem / cplxsz,
     $                   padval = ( -9923.0e+0, -9923.0e+0 ),
     $                   rzero = 0.0e+0, zero = ( 0.0e+0, 0.0e+0 ),
     $                   nsubs = 10 )
      INTEGER            block_cyclic_2d_inb, csrc_, ctxt_, dlen_,
     $                   dtype_, imb_, inb_, lld_, mb_, m_, nb_, n_,
     $                   rsrc_
      parameter( block_cyclic_2d_inb = 2, dlen_ = 11,
     $                   dtype_ = 1, ctxt_ = 2, m_ = 3, n_ = 4,
     $                   imb_ = 5, inb_ = 6, mb_ = 7, nb_ = 8,
     $                   rsrc_ = 9, csrc_ = 10, lld_ = 11 )
*     ..
*     .. Local Scalars ..
      LOGICAL            errflg, sof, tee
      INTEGER            csrcx, csrcy, i, iam, ictxt, igap, imbx, imby,
     $                   imidx, imidy, inbx, inby, incx, incy, ipmatx,
     $                   ipmaty, ipostx, iposty, iprex, iprey, ipw, ipx,
     $                   ipy, iverb, ix, ixseed, iy, iyseed, j, jx, jy,
     $                   k, ldx, ldy, mbx, mby, memreqd, mpx, mpy, mx,
     $                   my, mycol, myrow, n, nbx, nby, ngrids, nout,
     $                   npcol, nprocs, nprow, nqx, nqy, ntests, nx, ny,
     $                   pisclr, rsrcx, rsrcy, tskip, tstcnt
      REAL               pusclr
      COMPLEX            alpha, psclr
*     ..
*     .. Local Arrays ..
      CHARACTER*80       outfile
      LOGICAL            ltest( nsubs ), ycheck( nsubs )
      INTEGER            cscxval( maxtests ), cscyval( maxtests ),
     $                   descx( dlen_ ), descxr( dlen_ ),
     $                   descy( dlen_ ), descyr( dlen_ ), ierr( 4 ),
     $                   imbxval( maxtests ), imbyval( maxtests ),
     $                   inbxval( maxtests ), inbyval( maxtests ),
     $                   incxval( maxtests ), incyval( maxtests ),
     $                   ixval( maxtests ), iyval( maxtests ),
     $                   jxval( maxtests ), jyval( maxtests ),
     $                   kfail( nsubs ), kpass( nsubs ), kskip( nsubs ),
     $                   ktests( nsubs ), mbxval( maxtests ),
     $                   mbyval( maxtests ), mxval( maxtests ),
     $                   myval( maxtests ), nbxval( maxtests ),
     $                   nbyval( maxtests ), nval( maxtests ),
     $                   nxval( maxtests ), nyval( maxtests ),
     $                   pval( maxtests ), qval( maxtests ),
     $                   rscxval( maxtests ), rscyval( maxtests )
      COMPLEX            mem( memsiz )
*     ..
*     .. External Subroutines ..
      EXTERNAL           blacs_exit, blacs_get, blacs_gridexit,
     $                   blacs_gridinfo, blacs_gridinit, blacs_pinfo,
     $                   igsum2d, pb_cchekpad, pb_cfillpad, pb_descset2,
     $                   pb_pclaprnt, pcamax, pcaxpy, pcbla1tstinfo,
     $                   pcblas1tstchk, pcblas1tstchke, pcchkarg1,
     $                   pcchkvout, pccopy, pcdotc, pcdotu, pclagen,
     $                   pcmprnt, pcscal, pcsscal, pcswap, pcvprnt,
     $                   pscasum, pscnrm2, pvdescchk, pvdimchk
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, mod, real
*     ..
*     .. Common Blocks ..
      CHARACTER*7        snames( nsubs )
      LOGICAL            abrtflg
      INTEGER            info, nblog
      COMMON             /snamec/snames
      COMMON             /infoc/info, nblog
      COMMON             /pberrorc/nout, abrtflg
*     ..
*     .. Data Statements ..
*     YCHECK( K ) is true when routine K also takes the vector Y, i.e.
*     for PCSWAP, PCCOPY, PCAXPY, PCDOTU and PCDOTC.
      DATA               ycheck/.true., .false., .false., .true.,
     $                   .true., .true., .true., .false., .false.,
     $                   .false./
*     ..
*     .. Executable Statements ..
*
*     Initialization
*
*     Clear the abort flag shared through /PBERRORC/ (presumably read
*     by the PBLAS error handler) so that an error reported by a PBLAS
*     routine does not abort the run.  The driver inspects INFO after
*     each call and counts the routine as skipped instead.
*
      abrtflg = .false.
*
*     So far no error, will become true as soon as one error is found.
*
      errflg = .false.
*
*     Test counters
*
      tskip  = 0
      tstcnt = 0
*
*     Seeds for random matrix generations.
*
      ixseed = 100
      iyseed = 200
*
*     So far no tests have been performed.
*
      DO 10 i = 1, nsubs
         kpass( i )  = 0
         kskip( i )  = 0
         kfail( i )  = 0
         ktests( i ) = 0
   10 CONTINUE
*
*     Get starting information
*
      CALL blacs_pinfo( iam, nprocs )
      CALL pcbla1tstinfo( outfile, nout, ntests, nval, mxval, nxval,
     $                    imbxval, mbxval, inbxval, nbxval, rscxval,
     $                    cscxval, ixval, jxval, incxval, myval,
     $                    nyval, imbyval, mbyval, inbyval, nbyval,
     $                    rscyval, cscyval, iyval, jyval, incyval,
     $                    maxtests, ngrids, pval, maxgrids, qval,
     $                    maxgrids, ltest, sof, tee, iam, igap, iverb,
     $                    nprocs, alpha, mem )
*
      IF( iam.EQ.0 ) THEN
         WRITE( nout, fmt = 9979 )
         WRITE( nout, fmt = * )
      END IF
*
*     If TEE is set then Test Error Exits of routines.
*
      IF( tee )
     $   CALL pcblas1tstchke( ltest, nout, nprocs )
*
*     Loop over different process grids
*
      DO 60 i = 1, ngrids
*
         nprow = pval( i )
         npcol = qval( i )
*
*        Make sure grid information is correct
*
         ierr( 1 ) = 0
         IF( nprow.LT.1 ) THEN
            IF( iam.EQ.0 )
     $         WRITE( nout, fmt = 9999 ) 'GRID SIZE', 'NPROW', nprow
            ierr( 1 ) = 1
         ELSE IF( npcol.LT.1 ) THEN
            IF( iam.EQ.0 )
     $         WRITE( nout, fmt = 9999 ) 'GRID SIZE', 'NPCOL', npcol
            ierr( 1 ) = 1
         ELSE IF( nprow*npcol.GT.nprocs ) THEN
            IF( iam.EQ.0 )
     $         WRITE( nout, fmt = 9998 ) nprow*npcol, nprocs
            ierr( 1 ) = 1
         END IF
*
         IF( ierr( 1 ).GT.0 ) THEN
            IF( iam.EQ.0 )
     $         WRITE( nout, fmt = 9997 ) 'GRID'
            tskip = tskip + 1
            GO TO 60
         END IF
*
*        Define process grid
*
         CALL blacs_get( -1, 0, ictxt )
         CALL blacs_gridinit( ictxt, 'Row-major', nprow, npcol )
         CALL blacs_gridinfo( ictxt, nprow, npcol, myrow, mycol )
*
*        Go to bottom of process grid loop if this case doesn't use my
*        process
*
         IF( myrow.GE.nprow .OR. mycol.GE.npcol )
     $      GO TO 60
*
*        Loop over number of tests
*
         DO 50 j = 1, ntests
*
*           Get the test parameters
*
            n     = nval( j )
            mx    = mxval( j )
            nx    = nxval( j )
            imbx  = imbxval( j )
            mbx   = mbxval( j )
            inbx  = inbxval( j )
            nbx   = nbxval( j )
            rsrcx = rscxval( j )
            csrcx = cscxval( j )
            ix    = ixval( j )
            jx    = jxval( j )
            incx  = incxval( j )
            my    = myval( j )
            ny    = nyval( j )
            imby  = imbyval( j )
            mby   = mbyval( j )
            inby  = inbyval( j )
            nby   = nbyval( j )
            rsrcy = rscyval( j )
            csrcy = cscyval( j )
            iy    = iyval( j )
            jy    = jyval( j )
            incy  = incyval( j )
*
            IF( iam.EQ.0 ) THEN
               tstcnt = tstcnt + 1
               WRITE( nout, fmt = * )
               WRITE( nout, fmt = 9996 ) tstcnt, nprow, npcol
               WRITE( nout, fmt = * )
*
               WRITE( nout, fmt = 9995 )
               WRITE( nout, fmt = 9994 )
               WRITE( nout, fmt = 9995 )
               WRITE( nout, fmt = 9993 ) n, ix, jx, mx, nx, imbx, inbx,
     $                                   mbx, nbx, rsrcx, csrcx, incx
*
               WRITE( nout, fmt = 9995 )
               WRITE( nout, fmt = 9992 )
               WRITE( nout, fmt = 9995 )
               WRITE( nout, fmt = 9993 ) n, iy, jy, my, ny, imby, inby,
     $                                   mby, nby, rsrcy, csrcy, incy
               WRITE( nout, fmt = 9995 )
            END IF
*
*           Check the validity of the input and initialize DESC_
*
            CALL pvdescchk( ictxt, nout, 'X', descx,
     $                      block_cyclic_2d_inb, mx, nx, imbx, inbx,
     $                      mbx, nbx, rsrcx, csrcx, incx, mpx, nqx,
     $                      iprex, imidx, ipostx, igap, gapmul,
     $                      ierr( 1 ) )
            CALL pvdescchk( ictxt, nout, 'Y', descy,
     $                      block_cyclic_2d_inb, my, ny, imby, inby,
     $                      mby, nby, rsrcy, csrcy, incy, mpy, nqy,
     $                      iprey, imidy, iposty, igap, gapmul,
     $                      ierr( 2 ) )
*
            IF( ierr( 1 ).GT.0 .OR. ierr( 2 ).GT.0 ) THEN
               tskip = tskip + 1
               GO TO 40
            END IF
*
            ldx = max( 1, mx )
            ldy = max( 1, my )
*
*           Assign pointers into MEM for matrices corresponding to
*           vectors X and Y. Ex: IPX starts at position MEM( IPREX+1 ).
*
            ipx    = iprex + 1
            ipy    = ipx + descx( lld_ ) * nqx + ipostx + iprey
            ipmatx = ipy + descy( lld_ ) * nqy + iposty
            ipmaty = ipmatx + mx * nx
            ipw    = ipmaty + my * ny
*
*           Check if sufficient memory.
*           Requirement = mem for local part of parallel matrices +
*                         mem for whole matrices for comp. check +
*                         mem for recving comp. check error vals.
*
            memreqd = ipw - 1 +
     $                max( max( imbx, mbx ), max( imby, mby ) )
            ierr( 1 ) = 0
            IF( memreqd.GT.memsiz ) THEN
               IF( iam.EQ.0 )
     $            WRITE( nout, fmt = 9990 ) memreqd*cplxsz
               ierr( 1 ) = 1
            END IF
*
*           Check all processes for an error
*
            CALL igsum2d( ictxt, 'All', ' ', 1, 1, ierr, 1, -1, 0 )
*
            IF( ierr( 1 ).GT.0 ) THEN
               IF( iam.EQ.0 )
     $            WRITE( nout, fmt = 9991 )
               tskip = tskip + 1
               GO TO 40
            END IF
*
*           Loop over all PBLAS 1 routines
*
            DO 30 k = 1, nsubs
*
*              Continue only if this sub has to be tested.
*
               IF( .NOT.ltest( k ) )
     $            GO TO 30
*
               IF( iam.EQ.0 ) THEN
                  WRITE( nout, fmt = * )
                  WRITE( nout, fmt = 9989 ) snames( k )
               END IF
*
*              Check the validity of the operand sizes
*
               CALL pvdimchk( ictxt, nout, n, 'X', ix, jx, descx, incx,
     $                        ierr( 1 ) )
               CALL pvdimchk( ictxt, nout, n, 'Y', iy, jy, descy, incy,
     $                        ierr( 2 ) )
*
               IF( ierr( 1 ).NE.0 .OR. ierr( 2 ).NE.0 ) THEN
                  kskip( k ) = kskip( k ) + 1
                  GO TO 30
               END IF
*
*              Generate distributed matrices X and Y
*
               CALL pclagen( .false., 'None', 'No diag', 0, mx, nx, 1,
     $                       1, descx, ixseed, mem( ipx ),
     $                       descx( lld_ ) )
               IF( ycheck( k ) )
     $            CALL pclagen( .false., 'None', 'No diag', 0, my, ny,
     $                          1, 1, descy, iyseed, mem( ipy ),
     $                          descy( lld_ ) )
*
*              Generate entire matrices on each process.
*
               CALL pb_descset2( descxr, mx, nx, imbx, inbx, mbx, nbx,
     $                           -1, -1, ictxt, max( 1, mx ) )
               CALL pclagen( .false., 'None', 'No diag', 0, mx, nx, 1,
     $                       1, descxr, ixseed, mem( ipmatx ),
     $                       descxr( lld_ ) )
               IF( ycheck( k ) ) THEN
                  CALL pb_descset2( descyr, my, ny, imby, inby, mby,
     $                              nby, -1, -1, ictxt, max( 1, my ) )
                  CALL pclagen( .false., 'None', 'No diag', 0, my, ny,
     $                          1, 1, descyr, iyseed, mem( ipmaty ),
     $                          descyr( lld_ ) )
               END IF
*
*              Pad the guard zones of X, and Y
*
               CALL pb_cfillpad( ictxt, mpx, nqx, mem( ipx-iprex ),
     $                           descx( lld_ ), iprex, ipostx, padval )
*
               IF( ycheck( k ) ) THEN
                  CALL pb_cfillpad( ictxt, mpy, nqy, mem( ipy-iprey ),
     $                              descy( lld_ ), iprey, iposty,
     $                              padval )
               END IF
*
*              Initialize the check for INPUT only args.
*
               info = 0
               CALL pcchkarg1( ictxt, nout, snames( k ), n, alpha, ix,
     $                         jx, descx, incx, iy, jy, descy, incy,
     $                         info )
*
               info = 0
               psclr  = zero
               pusclr = rzero
               pisclr = 0
*
*              Print initial parallel data if IVERB >= 2.
*
               IF( iverb.EQ.2 ) THEN
                  IF( incx.EQ.descx( m_ ) ) THEN
                     CALL pb_pclaprnt( 1, n, mem( ipx ), ix, jx, descx,
     $                                 0, 0, 'PARALLEL_INITIAL_X', nout,
     $                                 mem( ipw ) )
                  ELSE
                     CALL pb_pclaprnt( n, 1, mem( ipx ), ix, jx, descx,
     $                                 0, 0, 'PARALLEL_INITIAL_X', nout,
     $                                 mem( ipw ) )
                  END IF
                  IF( ycheck( k ) ) THEN
                     IF( incy.EQ.descy( m_ ) ) THEN
                        CALL pb_pclaprnt( 1, n, mem( ipy ), iy, jy,
     $                                    descy, 0, 0,
     $                                    'PARALLEL_INITIAL_Y', nout,
     $                                    mem( ipw ) )
                     ELSE
                        CALL pb_pclaprnt( n, 1, mem( ipy ), iy, jy,
     $                                    descy, 0, 0,
     $                                    'PARALLEL_INITIAL_Y', nout,
     $                                    mem( ipw ) )
                     END IF
                  END IF
               ELSE IF( iverb.GE.3 ) THEN
                  CALL pb_pclaprnt( mx, nx, mem( ipx ), 1, 1, descx, 0,
     $                              0, 'PARALLEL_INITIAL_X', nout,
     $                              mem( ipw ) )
                  IF( ycheck( k ) )
     $               CALL pb_pclaprnt( my, ny, mem( ipy ), 1, 1, descy,
     $                                 0, 0, 'PARALLEL_INITIAL_Y', nout,
     $                                 mem( ipw ) )
               END IF
*
*              Call the PBLAS routine
*
               IF( k.EQ.1 ) THEN
*
*                 Test PCSWAP
*
                  CALL pcswap( n, mem( ipx ), ix, jx, descx, incx,
     $                         mem( ipy ), iy, jy, descy, incy )
*
               ELSE IF( k.EQ.2 ) THEN
*
*                 Test PCSCAL
*
                  psclr = alpha
                  CALL pcscal( n, alpha, mem( ipx ), ix, jx, descx,
     $                         incx )
*
               ELSE IF( k.EQ.3 ) THEN
*
*                 Test PCSSCAL
*
                  pusclr = real( alpha )
                  CALL pcsscal( n, real( alpha ), mem( ipx ), ix, jx,
     $                          descx, incx )
*
               ELSE IF( k.EQ.4 ) THEN
*
*                 Test PCCOPY
*
                  CALL pccopy( n, mem( ipx ), ix, jx, descx, incx,
     $                         mem( ipy ), iy, jy, descy, incy )
*
               ELSE IF( k.EQ.5 ) THEN
*
*                 Test PCAXPY
*
                  psclr = alpha
                  CALL pcaxpy( n, alpha, mem( ipx ), ix, jx, descx,
     $                         incx, mem( ipy ), iy, jy, descy, incy )
*
               ELSE IF( k.EQ.6 ) THEN
*
*                 Test PCDOTU
*
                  CALL pcdotu( n, psclr, mem( ipx ), ix, jx, descx,
     $                         incx, mem( ipy ), iy, jy, descy, incy )
*
               ELSE IF( k.EQ.7 ) THEN
*
*                 Test PCDOTC
*
                  CALL pcdotc( n, psclr, mem( ipx ), ix, jx, descx,
     $                         incx, mem( ipy ), iy, jy, descy, incy )
*
               ELSE IF( k.EQ.8 ) THEN
*
*                 Test PSCNRM2
*
                  CALL pscnrm2( n, pusclr, mem( ipx ), ix, jx, descx,
     $                          incx )
*
               ELSE IF( k.EQ.9 ) THEN
*
*                 Test PSCASUM
*
                  CALL pscasum( n, pusclr, mem( ipx ), ix, jx, descx,
     $                          incx )
*
               ELSE IF( k.EQ.10 ) THEN
*
*                 Test PCAMAX
*
                  CALL pcamax( n, psclr, pisclr, mem( ipx ), ix, jx,
     $                         descx, incx )
*
               END IF
*
*              Check if the operation has been performed.
*
               IF( info.NE.0 ) THEN
                  kskip( k ) = kskip( k ) + 1
                  IF( iam.EQ.0 )
     $               WRITE( nout, fmt = 9978 ) info
                  GO TO 30
               END IF
*
*              Check the computations
*
               CALL pcblas1tstchk( ictxt, nout, k, n, psclr, pusclr,
     $                             pisclr, mem( ipmatx ), mem( ipx ),
     $                             ix, jx, descx, incx, mem( ipmaty ),
     $                             mem( ipy ), iy, jy, descy, incy,
     $                             info )
*
*              Decode INFO into the X flag IERR( 1 ) and the Y flag
*              IERR( 2 ); both are zero here because of the operand
*              size check above.
*              NOTE(review): the branches are mutually exclusive, so an
*              INFO with both low bits set only flags X -- confirm
*              against the INFO encoding of PCBLAS1TSTCHK.
*
               IF( mod( info, 2 ).EQ.1 ) THEN
                  ierr( 1 ) = 1
               ELSE IF( mod( info / 2, 2 ).EQ.1 ) THEN
                  ierr( 2 ) = 1
               ELSE IF( info.NE.0 ) THEN
                  ierr( 1 ) = 1
                  ierr( 2 ) = 1
               END IF
*
*              Check padding
*
               CALL pb_cchekpad( ictxt, snames( k ), mpx, nqx,
     $                           mem( ipx-iprex ), descx( lld_ ),
     $                           iprex, ipostx, padval )
               IF( ycheck( k ) ) THEN
                  CALL pb_cchekpad( ictxt, snames( k ), mpy, nqy,
     $                              mem( ipy-iprey ), descy( lld_ ),
     $                              iprey, iposty, padval )
               END IF
*
*              Check input-only scalar arguments
*
               info = 1
               CALL pcchkarg1( ictxt, nout, snames( k ), n, alpha, ix,
     $                         jx, descx, incx, iy, jy, descy, incy,
     $                         info )
*
*              Check input-only array arguments
*
               CALL pcchkvout( n, mem( ipmatx ), mem( ipx ), ix, jx,
     $                         descx, incx, ierr( 3 ) )
*
               IF( ierr( 3 ).NE.0 ) THEN
                  IF( iam.EQ.0 )
     $               WRITE( nout, fmt = 9986 ) 'PARALLEL_X', snames( k )
               END IF
*
*              IERR( 4 ) is only assigned by the Y check below, which
*              runs only for routines that take Y.  Clear it first so
*              the pass/fail test never reads an undefined value or a
*              value left over from a previously tested routine.
*
               ierr( 4 ) = 0
               IF( ycheck( k ) ) THEN
                  CALL pcchkvout( n, mem( ipmaty ), mem( ipy ), iy, jy,
     $                            descy, incy, ierr( 4 ) )
                  IF( ierr( 4 ).NE.0 ) THEN
                     IF( iam.EQ.0 )
     $                  WRITE( nout, fmt = 9986 ) 'PARALLEL_Y',
     $                                       snames( k )
                  END IF
               END IF
*
*              Only node 0 prints computational test result
*
               IF( info.NE.0 .OR. ierr( 1 ).NE.0 .OR.
     $             ierr( 2 ).NE.0 .OR. ierr( 3 ).NE.0 .OR.
     $             ierr( 4 ).NE. 0 ) THEN
                  IF( iam.EQ.0 )
     $               WRITE( nout, fmt = 9988 ) snames( k )
                  kfail( k ) = kfail( k ) + 1
                  errflg = .true.
               ELSE
                  IF( iam.EQ.0 )
     $               WRITE( nout, fmt = 9987 ) snames( k )
                  kpass( k ) = kpass( k ) + 1
               END IF
*
*              Dump matrix if IVERB >= 1 and error.
*              ERRFLG is never reset, so once any test has failed this
*              section is also entered for every later routine.
*
               IF( iverb.GE.1 .AND. errflg ) THEN
                  IF( ierr( 3 ).NE.0 .OR. iverb.GE.3 ) THEN
                     CALL pcmprnt( ictxt, nout, mx, nx, mem( ipmatx ),
     $                             ldx, 0, 0, 'SERIAL_X' )
                     CALL pb_pclaprnt( mx, nx, mem( ipx ), 1, 1, descx,
     $                                 0, 0, 'PARALLEL_X', nout,
     $                                 mem( ipmatx ) )
                  ELSE IF( ierr( 1 ).NE.0 ) THEN
                     IF( n.GT.0 )
     $                  CALL pcvprnt( ictxt, nout, n,
     $                                mem( ipmatx+ix-1+(jx-1)*ldx ),
     $                                incx, 0, 0, 'SERIAL_X' )
                     IF( incx.EQ.descx( m_ ) ) THEN
                        CALL pb_pclaprnt( 1, n, mem( ipx ), ix, jx,
     $                                    descx, 0, 0, 'PARALLEL_X',
     $                                    nout, mem( ipmatx ) )
                     ELSE
                        CALL pb_pclaprnt( n, 1, mem( ipx ), ix, jx,
     $                                    descx, 0, 0, 'PARALLEL_X',
     $                                    nout, mem( ipmatx ) )
                     END IF
                  END IF
                  IF( ycheck( k ) ) THEN
                     IF( ierr( 4 ).NE.0 .OR. iverb.GE.3 ) THEN
                        CALL pcmprnt( ictxt, nout, my, ny,
     $                                mem( ipmaty ), ldy, 0, 0,
     $                                'SERIAL_Y' )
                        CALL pb_pclaprnt( my, ny, mem( ipy ), 1, 1,
     $                                    descy, 0, 0, 'PARALLEL_Y',
     $                                    nout, mem( ipmatx ) )
                     ELSE IF( ierr( 2 ).NE.0 ) THEN
                        IF( n.GT.0 )
     $                     CALL pcvprnt( ictxt, nout, n,
     $                                   mem( ipmaty+iy-1+(jy-1)*ldy ),
     $                                   incy, 0, 0, 'SERIAL_Y' )
                        IF( incy.EQ.descy( m_ ) ) THEN
                           CALL pb_pclaprnt( 1, n, mem( ipy ), iy, jy,
     $                                       descy, 0, 0, 'PARALLEL_Y',
     $                                       nout, mem( ipmatx ) )
                        ELSE
                           CALL pb_pclaprnt( n, 1, mem( ipy ), iy, jy,
     $                                       descy, 0, 0, 'PARALLEL_Y',
     $                                       nout, mem( ipmatx ) )
                        END IF
                     END IF
                  END IF
               END IF
*
*              Leave if error and "Stop On Failure"
*
               IF( sof.AND.errflg )
     $            GO TO 70
*
   30       CONTINUE
*
   40       IF( iam.EQ.0 ) THEN
               WRITE( nout, fmt = * )
               WRITE( nout, fmt = 9985 ) j
            END IF
*
   50   CONTINUE
*
        CALL blacs_gridexit( ictxt )
*
   60 CONTINUE
*
*     Come here, if error and "Stop On Failure"
*
   70 CONTINUE
*
*     Before printing out final stats, add TSKIP to all skips
*
      DO 80 i = 1, nsubs
         IF( ltest( i ) ) THEN
            kskip( i ) = kskip( i ) + tskip
            ktests( i ) = kskip( i ) + kfail( i ) + kpass( i )
         END IF
   80 CONTINUE
*
*     Print results
*
      IF( iam.EQ.0 ) THEN
         WRITE( nout, fmt = * )
         WRITE( nout, fmt = 9981 )
         WRITE( nout, fmt = * )
         WRITE( nout, fmt = 9983 )
         WRITE( nout, fmt = 9982 )
*
         DO 90 i = 1, nsubs
            WRITE( nout, fmt = 9984 ) '|', snames( i ), ktests( i ),
     $                                kpass( i ), kfail( i ), kskip( i )
   90    CONTINUE
         WRITE( nout, fmt = * )
         WRITE( nout, fmt = 9980 )
         WRITE( nout, fmt = * )
*
      END IF
*
      CALL blacs_exit( 0 )
*
 9999 FORMAT( 'ILLEGAL ', a, ': ', a, ' = ', i10,
     $        ' should be at least 1' )
 9998 FORMAT( 'ILLEGAL GRID: NPROW*NPCOL = ', i4,
     $        '. It can be at most', i4 )
 9997 FORMAT( 'Bad ', a, ' parameters: going on to next test case.' )
 9996 FORMAT( 2x, 'Test number ', i4 , ' started on a ', i6, ' x ',
     $        i6, ' process grid.' )
 9995 FORMAT( 2x, '---------------------------------------------------',
     $        '--------------------------' )
 9994 FORMAT( 2x, '     N     IX     JX     MX     NX  IMBX  INBX',
     $        '   MBX   NBX RSRCX CSRCX   INCX' )
 9993 FORMAT( 2x,i6,1x,i6,1x,i6,1x,i6,1x,i6,1x,i5,1x,i5,1x,i5,1x,i5,1x,
     $        i5,1x,i5,1x,i6 )
 9992 FORMAT( 2x, '     N     IY     JY     MY     NY  IMBY  INBY',
     $        '   MBY   NBY RSRCY CSRCY   INCY' )
 9991 FORMAT( 'Not enough memory for this test: going on to',
     $        ' next test case.' )
 9990 FORMAT( 'Not enough memory. Need: ', i12 )
 9989 FORMAT( 2x, '   Tested Subroutine: ', a )
 9988 FORMAT( 2x, '   ***** Computational check: ', a, '       ',
     $        ' FAILED ',' *****' )
 9987 FORMAT( 2x, '   ***** Computational check: ', a, '       ',
     $        ' PASSED ',' *****' )
 9986 FORMAT( 2x, '   ***** ERROR ***** Matrix operand ', a,
     $        ' modified by ', a, ' *****' )
 9985 FORMAT( 2x, 'Test number ', i4, ' completed.' )
 9984 FORMAT( 2x,a1,2x,a7,8x,i4,6x,i4,5x,i4,4x,i4 )
 9983 FORMAT( 2x, '   SUBROUTINE  TOTAL TESTS  PASSED   FAILED  ',
     $        'SKIPPED' )
 9982 FORMAT( 2x, '   ----------  -----------  ------   ------  ',
     $        '-------' )
 9981 FORMAT( 2x, 'Testing Summary')
 9980 FORMAT( 2x, 'End of Tests.' )
 9979 FORMAT( 2x, 'Tests started.' )
 9978 FORMAT( 2x, '   ***** Operation not supported, error code: ',
     $        i5, ' *****' )
*
      stop
*
*     End of PCBLA1TST
*
      END


      SUBROUTINE pcbla1tstinfo( SUMMRY, NOUT, NMAT, NVAL, MXVAL,
     $                          NXVAL, IMBXVAL, MBXVAL, INBXVAL,
     $                          NBXVAL, RSCXVAL, CSCXVAL, IXVAL,
     $                          JXVAL, INCXVAL, MYVAL, NYVAL, IMBYVAL,
     $                          MBYVAL, INBYVAL, NBYVAL, RSCYVAL,
     $                          CSCYVAL, IYVAL, JYVAL, INCYVAL,
     $                          LDVAL, NGRIDS, PVAL, LDPVAL, QVAL,
     $                          LDQVAL, LTEST, SOF, TEE, IAM, IGAP,
     $                          IVERB, NPROCS, ALPHA, WORK )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      LOGICAL            SOF, TEE
      INTEGER            IAM, IGAP, IVERB, LDPVAL, LDQVAL, LDVAL,
     $                   NGRIDS, NMAT, NOUT, NPROCS
      COMPLEX            ALPHA
*     ..
*     .. Array Arguments ..
      CHARACTER*( * )    SUMMRY
      LOGICAL            LTEST( * )
      INTEGER            CSCXVAL( LDVAL ), CSCYVAL( LDVAL ),
     $                   IMBXVAL( LDVAL ), IMBYVAL( LDVAL ),
     $                   INBXVAL( LDVAL ), INBYVAL( LDVAL ),
     $                   INCXVAL( LDVAL ), INCYVAL( LDVAL ),
     $                   IXVAL( LDVAL ), IYVAL( LDVAL ), JXVAL( LDVAL ),
     $                   JYVAL( LDVAL ), MBXVAL( LDVAL ),
     $                   MBYVAL( LDVAL ), MXVAL( LDVAL ),
     $                   MYVAL( LDVAL ), NBXVAL( LDVAL ),
     $                   NBYVAL( LDVAL ), NVAL( LDVAL ), NXVAL( LDVAL ),
     $                   NYVAL( LDVAL ), PVAL( LDPVAL ), QVAL( LDQVAL ),
     $                   RSCXVAL( LDVAL ), RSCYVAL( LDVAL ), WORK( * )
*     ..
*
*  Purpose
*  =======
*
*  PCBLA1TSTINFO  get the needed startup information for testing various
*  Level 1 PBLAS routines, and transmits it to all processes.
*
*  Process 0 reads the data file, validates the number of grids and the
*  number of test cases, broadcasts ALPHA, then NGRIDS and NMAT, then
*  one packed integer message holding every remaining parameter,  and
*  finally echoes the input on unit NOUT.  All other processes receive
*  the three messages in the same order and unpack them.
*
*  Notes
*  =====
*
*  For packing the information we assumed that the length in bytes of an
*  integer is equal to the length in bytes of a real single precision.
*
*  The packed message layout is, in order:  SOF, TEE, IVERB, IGAP,
*  PVAL(1:NGRIDS), QVAL(1:NGRIDS), the 23 per-test arrays (NMAT entries
*  each, in the order they are read from the file) and the NSUBS test
*  flags, i.e. 2*NGRIDS + 23*NMAT + NSUBS + 4 integers.  The sender and
*  the receiver sections below must be kept in the same order.
*
*  On illegal input  (bad number of grids or tests, unknown subprogram
*  name)  process 0  reports  the  problem  on  unit  NOUT  and  calls
*  BLACS_ABORT; the routine does not return in that case.
*
*  Arguments
*  =========
*
*  SUMMRY  (global output) CHARACTER*(*)
*          On  exit,  SUMMRY  is  the  name of output (summary) file (if
*          any). SUMMRY is only defined for process 0.
*
*  NOUT    (global output) INTEGER
*          On exit, NOUT  specifies the unit number for the output file.
*          When NOUT is 6, output to screen,  when  NOUT is 0, output to
*          stderr. NOUT is only defined for process 0.
*
*  NMAT    (global output) INTEGER
*          On exit,  NMAT  specifies the number of different test cases.
*
*  NVAL    (global output) INTEGER array
*          On entry, NVAL is an array of dimension LDVAL.  On exit, this
*          array contains the values of N to run the code with.
*
*  MXVAL   (global output) INTEGER array
*          On entry, MXVAL is an array of dimension LDVAL. On exit, this
*          array  contains  the values  of  DESCX( M_ )  to run the code
*          with.
*
*  NXVAL   (global output) INTEGER array
*          On entry, NXVAL is an array of dimension LDVAL. On exit, this
*          array  contains  the values  of  DESCX( N_ )  to run the code
*          with.
*
*  IMBXVAL (global output) INTEGER array
*          On entry,  IMBXVAL  is an array of  dimension LDVAL. On exit,
*          this  array  contains  the values of DESCX( IMB_ ) to run the
*          code with.
*
*  MBXVAL  (global output) INTEGER array
*          On entry,  MBXVAL  is an array of  dimension  LDVAL. On exit,
*          this  array  contains  the values of DESCX( MB_ ) to  run the
*          code with.
*
*  INBXVAL (global output) INTEGER array
*          On entry,  INBXVAL  is an array of  dimension LDVAL. On exit,
*          this  array  contains  the values of DESCX( INB_ ) to run the
*          code with.
*
*  NBXVAL  (global output) INTEGER array
*          On entry,  NBXVAL  is an array of  dimension  LDVAL. On exit,
*          this  array  contains  the values of DESCX( NB_ ) to  run the
*          code with.
*
*  RSCXVAL (global output) INTEGER array
*          On entry, RSCXVAL  is an array of  dimension  LDVAL. On exit,
*          this  array  contains the values of DESCX( RSRC_ ) to run the
*          code with.
*
*  CSCXVAL (global output) INTEGER array
*          On entry, CSCXVAL  is an array of  dimension  LDVAL. On exit,
*          this  array  contains the values of DESCX( CSRC_ ) to run the
*          code with.
*
*  IXVAL   (global output) INTEGER array
*          On entry, IXVAL is an array of dimension LDVAL. On exit, this
*          array  contains the values of IX to run the code with.
*
*  JXVAL   (global output) INTEGER array
*          On entry, JXVAL is an array of dimension LDVAL. On exit, this
*          array  contains the values of JX to run the code with.
*
*  INCXVAL (global output) INTEGER array
*          On entry,  INCXVAL  is  an array of dimension LDVAL. On exit,
*          this array  contains the values of INCX to run the code with.
*
*  MYVAL   (global output) INTEGER array
*          On entry, MYVAL is an array of dimension LDVAL. On exit, this
*          array  contains  the values  of  DESCY( M_ )  to run the code
*          with.
*
*  NYVAL   (global output) INTEGER array
*          On entry, NYVAL is an array of dimension LDVAL. On exit, this
*          array  contains  the values  of  DESCY( N_ )  to run the code
*          with.
*
*  IMBYVAL (global output) INTEGER array
*          On entry,  IMBYVAL  is an array of  dimension LDVAL. On exit,
*          this  array  contains  the values of DESCY( IMB_ ) to run the
*          code with.
*
*  MBYVAL  (global output) INTEGER array
*          On entry,  MBYVAL  is an array of  dimension  LDVAL. On exit,
*          this  array  contains  the values of DESCY( MB_ ) to  run the
*          code with.
*
*  INBYVAL (global output) INTEGER array
*          On entry,  INBYVAL  is an array of  dimension LDVAL. On exit,
*          this  array  contains  the values of DESCY( INB_ ) to run the
*          code with.
*
*  NBYVAL  (global output) INTEGER array
*          On entry,  NBYVAL  is an array of  dimension  LDVAL. On exit,
*          this  array  contains  the values of DESCY( NB_ ) to  run the
*          code with.
*
*  RSCYVAL (global output) INTEGER array
*          On entry, RSCYVAL  is an array of  dimension  LDVAL. On exit,
*          this  array  contains the values of DESCY( RSRC_ ) to run the
*          code with.
*
*  CSCYVAL (global output) INTEGER array
*          On entry, CSCYVAL  is an array of  dimension  LDVAL. On exit,
*          this  array  contains the values of DESCY( CSRC_ ) to run the
*          code with.
*
*  IYVAL   (global output) INTEGER array
*          On entry, IYVAL is an array of dimension LDVAL. On exit, this
*          array  contains the values of IY to run the code with.
*
*  JYVAL   (global output) INTEGER array
*          On entry, JYVAL is an array of dimension LDVAL. On exit, this
*          array  contains the values of JY to run the code with.
*
*  INCYVAL (global output) INTEGER array
*          On entry,  INCYVAL  is  an array of dimension LDVAL. On exit,
*          this array  contains the values of INCY to run the code with.
*
*  LDVAL   (global input) INTEGER
*          On entry, LDVAL specifies the maximum number of different va-
*          lues that can be used for  DESCX(:),  IX, JX, INCX, DESCY(:),
*          IY,  JY  and  INCY.  This  is also the maximum number of test
*          cases.
*
*  NGRIDS  (global output) INTEGER
*          On exit, NGRIDS specifies the number of different values that
*          can be used for P and Q.
*
*  PVAL    (global output) INTEGER array
*          On entry, PVAL is an array of dimension LDPVAL. On exit, this
*          array contains the values of P to run the code with.
*
*  LDPVAL  (global input) INTEGER
*          On entry,  LDPVAL  specifies  the maximum number of different
*          values that can be used for P.
*
*  QVAL    (global output) INTEGER array
*          On entry, QVAL is an array of dimension LDQVAL. On exit, this
*          array contains the values of Q to run the code with.
*
*  LDQVAL  (global input) INTEGER
*          On entry,  LDQVAL  specifies  the maximum number of different
*          values that can be used for Q.
*
*  LTEST   (global output) LOGICAL array
*          On entry, LTEST  is an array of dimension at  least  ten.  On
*          exit, if LTEST( i ) is .TRUE., the i-th Level 1 PBLAS routine
*          will be tested.  See  the  input file for the ordering of the
*          routines.
*
*  SOF     (global output) LOGICAL
*          On exit, if SOF is .TRUE., the tester will  stop on the first
*          detected failure. Otherwise, it won't.
*
*  TEE     (global output) LOGICAL
*          On exit, if TEE is .TRUE., the tester will  perform the error
*          exit tests. These tests won't be performed otherwise.
*
*  IAM     (local input) INTEGER
*          On entry,  IAM  specifies the number of the process executing
*          this routine.
*
*  IGAP    (global output) INTEGER
*          On exit, IGAP  specifies the user-specified gap used for pad-
*          ding. IGAP must be at least zero.
*
*  IVERB   (global output) INTEGER
*          On exit,  IVERB  specifies  the output verbosity level: 0 for
*          pass/fail, 1, 2 or 3 for matrix dump on errors.
*
*  NPROCS  (global input) INTEGER
*          On entry, NPROCS specifies the total number of processes.
*
*  ALPHA   (global output) COMPLEX
*          On exit, ALPHA specifies the value of alpha to be used in all
*          the test cases.
*
*  WORK    (local workspace) INTEGER array
*          On   entry,   WORK   is   an  array  of  dimension  at  least
*          MAX( 2, 2*NGRIDS+23*NMAT+NSUBS+4 )  with  NSUBS  equal to 10.
*          This array is used to pack all output arrays in order to send
*          the information in one message.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            NIN, NSUBS
      PARAMETER          ( NIN = 11, NSUBS = 10 )
*     Name of the input data file; shared by the OPEN statement and the
*     illegal-input message so that the two can never disagree.
      CHARACTER*( * )    FILNAM
      PARAMETER          ( FILNAM = 'PCBLAS1TST.dat' )
*     ..
*     .. Local Scalars ..
      LOGICAL            LTESTT
      INTEGER            I, ICTXT, J
      REAL               EPS
*     ..
*     .. Local Arrays ..
      CHARACTER*7        SNAMET
      CHARACTER*79       USRINFO
*     ..
*     .. External Subroutines ..
      EXTERNAL           BLACS_ABORT, BLACS_GET, BLACS_GRIDEXIT,
     $                   BLACS_GRIDINIT, BLACS_SETUP, CGEBR2D, CGEBS2D,
     $                   ICOPY, IGEBR2D, IGEBS2D, SGEBR2D, SGEBS2D
*     ..
*     .. External Functions ..
      REAL               PSLAMCH
      EXTERNAL           PSLAMCH
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX, MIN
*     ..
*     .. Common Blocks ..
      CHARACTER*7        SNAMES( NSUBS )
      COMMON             /SNAMEC/SNAMES
*     ..
*     .. Executable Statements ..
*
*     Process 0 reads the input data, broadcasts to other processes and
*     writes needed information to NOUT
*
      IF( IAM.EQ.0 ) THEN
*
*        Open file and skip data file header.  The header line is read
*        into SUMMRY only to consume it; SUMMRY is reset right after.
*
         OPEN( NIN, FILE = FILNAM, STATUS = 'OLD' )
         READ( NIN, FMT = * ) SUMMRY
         SUMMRY = ' '
*
*        Read in user-supplied info about machine type, compiler, etc.
*
         READ( NIN, FMT = 9999 ) USRINFO
*
*        Read name and unit number for summary output file
*
         READ( NIN, FMT = * ) SUMMRY
         READ( NIN, FMT = * ) NOUT
         IF( NOUT.NE.0 .AND. NOUT.NE.6 )
     $      OPEN( NOUT, FILE = SUMMRY, STATUS = 'UNKNOWN' )
*
*        Read and check the parameter values for the tests.
*
*        Read the flag that indicates if Stop on Failure
*
         READ( NIN, FMT = * ) SOF
*
*        Read the flag that indicates if Test Error Exits
*
         READ( NIN, FMT = * ) TEE
*
*        Read the verbosity level (out-of-range values fall back to 0)
*
         READ( NIN, FMT = * ) IVERB
         IF( IVERB.LT.0 .OR. IVERB.GT.3 )
     $      IVERB = 0
*
*        Read the leading dimension gap (negative values become 0)
*
         READ( NIN, FMT = * ) IGAP
         IF( IGAP.LT.0 )
     $      IGAP = 0
*
*        Get number of grids; it must fit in both PVAL and QVAL
*
         READ( NIN, FMT = * ) NGRIDS
         IF( NGRIDS.LT.1 .OR. NGRIDS.GT.LDPVAL ) THEN
            WRITE( NOUT, FMT = 9998 ) 'Grids', LDPVAL
            GO TO 100
         ELSE IF( NGRIDS.GT.LDQVAL ) THEN
            WRITE( NOUT, FMT = 9998 ) 'Grids', LDQVAL
            GO TO 100
         END IF
*
*        Get values of P and Q
*
         READ( NIN, FMT = * ) ( PVAL( I ), I = 1, NGRIDS )
         READ( NIN, FMT = * ) ( QVAL( I ), I = 1, NGRIDS )
*
*        Read ALPHA
*
         READ( NIN, FMT = * ) ALPHA
*
*        Read number of tests.
*
         READ( NIN, FMT = * ) NMAT
         IF( NMAT.LT.1 .OR. NMAT.GT.LDVAL ) THEN
            WRITE( NOUT, FMT = 9998 ) 'Tests', LDVAL
            GO TO 100
         END IF
*
*        Read in input data into arrays.
*
         READ( NIN, FMT = * ) ( NVAL( I ),     I = 1, NMAT )
         READ( NIN, FMT = * ) ( MXVAL( I ),    I = 1, NMAT )
         READ( NIN, FMT = * ) ( NXVAL( I ),    I = 1, NMAT )
         READ( NIN, FMT = * ) ( IMBXVAL( I ),  I = 1, NMAT )
         READ( NIN, FMT = * ) ( INBXVAL( I ),  I = 1, NMAT )
         READ( NIN, FMT = * ) ( MBXVAL( I ),   I = 1, NMAT )
         READ( NIN, FMT = * ) ( NBXVAL( I ),   I = 1, NMAT )
         READ( NIN, FMT = * ) ( RSCXVAL( I ),  I = 1, NMAT )
         READ( NIN, FMT = * ) ( CSCXVAL( I ),  I = 1, NMAT )
         READ( NIN, FMT = * ) ( IXVAL( I ),    I = 1, NMAT )
         READ( NIN, FMT = * ) ( JXVAL( I ),    I = 1, NMAT )
         READ( NIN, FMT = * ) ( INCXVAL( I ),  I = 1, NMAT )
         READ( NIN, FMT = * ) ( MYVAL( I ),    I = 1, NMAT )
         READ( NIN, FMT = * ) ( NYVAL( I ),    I = 1, NMAT )
         READ( NIN, FMT = * ) ( IMBYVAL( I ),  I = 1, NMAT )
         READ( NIN, FMT = * ) ( INBYVAL( I ),  I = 1, NMAT )
         READ( NIN, FMT = * ) ( MBYVAL( I ),   I = 1, NMAT )
         READ( NIN, FMT = * ) ( NBYVAL( I ),   I = 1, NMAT )
         READ( NIN, FMT = * ) ( RSCYVAL( I ),  I = 1, NMAT )
         READ( NIN, FMT = * ) ( CSCYVAL( I ),  I = 1, NMAT )
         READ( NIN, FMT = * ) ( IYVAL( I ),    I = 1, NMAT )
         READ( NIN, FMT = * ) ( JYVAL( I ),    I = 1, NMAT )
         READ( NIN, FMT = * ) ( INCYVAL( I ),  I = 1, NMAT )
*
*        Read names of subroutines and flags which indicate
*        whether they are to be tested.  Routines that are not
*        listed in the file stay disabled.
*
         DO 10 I = 1, NSUBS
            LTEST( I ) = .FALSE.
   10    CONTINUE
*
*        Loop over the remaining lines until end of file (label 50)
*
   20    CONTINUE
         READ( NIN, FMT = 9996, END = 50 ) SNAMET, LTESTT
         DO 30 I = 1, NSUBS
            IF( SNAMET.EQ.SNAMES( I ) )
     $         GO TO 40
   30    CONTINUE
*
*        Name not found in SNAMES: report it and abort the run
*
         WRITE( NOUT, FMT = 9995 ) SNAMET
         GO TO 100
*
*        Name found at position I: record its flag, read next line
*
   40    CONTINUE
         LTEST( I ) = LTESTT
         GO TO 20
*
   50    CONTINUE
*
*        Close input file
*
         CLOSE ( NIN )
*
*        For pvm only: if virtual machine not set up, allocate it and
*        spawn the correct number of processes.
*
         IF( NPROCS.LT.1 ) THEN
            NPROCS = 0
            DO 60 I = 1, NGRIDS
               NPROCS = MAX( NPROCS, PVAL( I )*QVAL( I ) )
   60       CONTINUE
            CALL BLACS_SETUP( IAM, NPROCS )
         END IF
*
*        Temporarily define blacs grid to include all processes so
*        information can be broadcast to all processes
*
         CALL BLACS_GET( -1, 0, ICTXT )
         CALL BLACS_GRIDINIT( ICTXT, 'Row-major', 1, NPROCS )
*
*        Compute machine epsilon
*
         EPS = PSLAMCH( ICTXT, 'eps' )
*
*        Pack information arrays and broadcast
*
         CALL CGEBS2D( ICTXT, 'All', ' ', 1, 1, ALPHA, 1 )
*
*        First integer message: the two sizes the receivers need to
*        compute the length of the packed message that follows.
*
         WORK( 1 ) = NGRIDS
         WORK( 2 ) = NMAT
         CALL IGEBS2D( ICTXT, 'All', ' ', 2, 1, WORK, 2 )
*
*        Second integer message: logical flags are sent as 0 / 1
*
         I = 1
         IF( SOF ) THEN
            WORK( I ) = 1
         ELSE
            WORK( I ) = 0
         END IF
         I = I + 1
         IF( TEE ) THEN
            WORK( I ) = 1
         ELSE
            WORK( I ) = 0
         END IF
         I = I + 1
         WORK( I ) = IVERB
         I = I + 1
         WORK( I ) = IGAP
         I = I + 1
         CALL ICOPY( NGRIDS, PVAL,     1, WORK( I ), 1 )
         I = I + NGRIDS
         CALL ICOPY( NGRIDS, QVAL,     1, WORK( I ), 1 )
         I = I + NGRIDS
         CALL ICOPY( NMAT,   NVAL,     1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   MXVAL,    1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   NXVAL,    1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   IMBXVAL,  1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   INBXVAL,  1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   MBXVAL,   1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   NBXVAL,   1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   RSCXVAL,  1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   CSCXVAL,  1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   IXVAL,    1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   JXVAL,    1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   INCXVAL,  1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   MYVAL,    1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   NYVAL,    1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   IMBYVAL,  1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   INBYVAL,  1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   MBYVAL,   1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   NBYVAL,   1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   RSCYVAL,  1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   CSCYVAL,  1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   IYVAL,    1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   JYVAL,    1, WORK( I ), 1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   INCYVAL,  1, WORK( I ), 1 )
         I = I + NMAT
*
         DO 70 J = 1, NSUBS
            IF( LTEST( J ) ) THEN
               WORK( I ) = 1
            ELSE
               WORK( I ) = 0
            END IF
            I = I + 1
   70    CONTINUE
*
*        I points one past the last packed entry; I-1 is the message
*        length, equal to 2*NGRIDS + 23*NMAT + NSUBS + 4.
*
         I = I - 1
         CALL IGEBS2D( ICTXT, 'All', ' ', I, 1, WORK, I )
*
*        regurgitate input
*
         WRITE( NOUT, FMT = 9999 ) 'Level 1 PBLAS testing program.'
         WRITE( NOUT, FMT = 9999 ) USRINFO
         WRITE( NOUT, FMT = * )
         WRITE( NOUT, FMT = 9999 )
     $               'Tests of the complex single precision '//
     $               'Level 1 PBLAS'
         WRITE( NOUT, FMT = * )
         WRITE( NOUT, FMT = 9999 )
     $               'The following parameter values will be used:'
         WRITE( NOUT, FMT = * )
         WRITE( NOUT, FMT = 9993 ) NMAT
         WRITE( NOUT, FMT = 9992 ) NGRIDS
*
*        P and Q values are listed five per line, at most four lines
*
         WRITE( NOUT, FMT = 9990 )
     $               'P', ( PVAL( I ), I = 1, MIN( NGRIDS, 5 ) )
         IF( NGRIDS.GT.5 )
     $      WRITE( NOUT, FMT = 9991 ) ( PVAL( I ), I = 6,
     $                                  MIN( 10, NGRIDS ) )
         IF( NGRIDS.GT.10 )
     $      WRITE( NOUT, FMT = 9991 ) ( PVAL( I ), I = 11,
     $                                  MIN( 15, NGRIDS ) )
         IF( NGRIDS.GT.15 )
     $      WRITE( NOUT, FMT = 9991 ) ( PVAL( I ), I = 16, NGRIDS )
         WRITE( NOUT, FMT = 9990 )
     $               'Q', ( QVAL( I ), I = 1, MIN( NGRIDS, 5 ) )
         IF( NGRIDS.GT.5 )
     $      WRITE( NOUT, FMT = 9991 ) ( QVAL( I ), I = 6,
     $                                  MIN( 10, NGRIDS ) )
         IF( NGRIDS.GT.10 )
     $      WRITE( NOUT, FMT = 9991 ) ( QVAL( I ), I = 11,
     $                                  MIN( 15, NGRIDS ) )
         IF( NGRIDS.GT.15 )
     $      WRITE( NOUT, FMT = 9991 ) ( QVAL( I ), I = 16, NGRIDS )
         WRITE( NOUT, FMT = 9988 ) SOF
         WRITE( NOUT, FMT = 9987 ) TEE
         WRITE( NOUT, FMT = 9983 ) IGAP
         WRITE( NOUT, FMT = 9986 ) IVERB
         WRITE( NOUT, FMT = 9982 ) ALPHA
*
*        The first routine carries the list title (format 9985), the
*        remaining ones are aligned underneath it (format 9984)
*
         IF( LTEST( 1 ) ) THEN
            WRITE( NOUT, FMT = 9985 ) SNAMES( 1 ), ' ... Yes'
         ELSE
            WRITE( NOUT, FMT = 9985 ) SNAMES( 1 ), ' ... No '
         END IF
         DO 80 I = 2, NSUBS
            IF( LTEST( I ) ) THEN
               WRITE( NOUT, FMT = 9984 ) SNAMES( I ), ' ... Yes'
            ELSE
               WRITE( NOUT, FMT = 9984 ) SNAMES( I ), ' ... No '
            END IF
   80    CONTINUE
         WRITE( NOUT, FMT = 9994 ) EPS
         WRITE( NOUT, FMT = * )
*
      ELSE
*
*        If in pvm, must participate setting up virtual machine
*
         IF( NPROCS.LT.1 )
     $      CALL BLACS_SETUP( IAM, NPROCS )
*
*        Temporarily define blacs grid to include all processes so
*        information can be broadcast to all processes
*
         CALL BLACS_GET( -1, 0, ICTXT )
         CALL BLACS_GRIDINIT( ICTXT, 'Row-major', 1, NPROCS )
*
*        Compute machine epsilon
*
         EPS = PSLAMCH( ICTXT, 'eps' )
*
*        Receive ALPHA, then the two sizes, then the packed message
*        (same order as the sends issued by process 0)
*
         CALL CGEBR2D( ICTXT, 'All', ' ', 1, 1, ALPHA, 1, 0, 0 )
*
         CALL IGEBR2D( ICTXT, 'All', ' ', 2, 1, WORK, 2, 0, 0 )
         NGRIDS = WORK( 1 )
         NMAT   = WORK( 2 )
*
         I = 2*NGRIDS + 23*NMAT + NSUBS + 4
         CALL IGEBR2D( ICTXT, 'All', ' ', I, 1, WORK, I, 0, 0 )
*
*        Unpack, mirroring the packing order used by process 0
*
         I = 1
         IF( WORK( I ).EQ.1 ) THEN
            SOF = .TRUE.
         ELSE
            SOF = .FALSE.
         END IF
         I = I + 1
         IF( WORK( I ).EQ.1 ) THEN
            TEE = .TRUE.
         ELSE
            TEE = .FALSE.
         END IF
         I = I + 1
         IVERB = WORK( I )
         I = I + 1
         IGAP = WORK( I )
         I = I + 1
         CALL ICOPY( NGRIDS, WORK( I ), 1, PVAL,     1 )
         I = I + NGRIDS
         CALL ICOPY( NGRIDS, WORK( I ), 1, QVAL,     1 )
         I = I + NGRIDS
         CALL ICOPY( NMAT,   WORK( I ), 1, NVAL,     1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, MXVAL,    1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, NXVAL,    1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, IMBXVAL,  1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, INBXVAL,  1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, MBXVAL,   1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, NBXVAL,   1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, RSCXVAL,  1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, CSCXVAL,  1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, IXVAL,    1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, JXVAL,    1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, INCXVAL,  1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, MYVAL,    1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, NYVAL,    1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, IMBYVAL,  1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, INBYVAL,  1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, MBYVAL,   1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, NBYVAL,   1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, RSCYVAL,  1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, CSCYVAL,  1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, IYVAL,    1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, JYVAL,    1 )
         I = I + NMAT
         CALL ICOPY( NMAT,   WORK( I ), 1, INCYVAL,  1 )
         I = I + NMAT
*
         DO 90 J = 1, NSUBS
            IF( WORK( I ).EQ.1 ) THEN
               LTEST( J ) = .TRUE.
            ELSE
               LTEST( J ) = .FALSE.
            END IF
            I = I + 1
   90    CONTINUE
*
      END IF
*
*     Release the temporary all-process grid
*
      CALL BLACS_GRIDEXIT( ICTXT )
*
      RETURN
*
*     Illegal input: only process 0 gets here, and always before the
*     temporary grid has been created.
*
  100 CONTINUE
      WRITE( NOUT, FMT = 9997 ) FILNAM
      CLOSE( NIN )
      IF( NOUT.NE.6 .AND. NOUT.NE.0 )
     $   CLOSE( NOUT )
*
*     Every jump to 100 precedes BLACS_GET, so ICTXT has no value yet.
*     Give it a defined one instead of passing an undefined variable.
*     NOTE(review): -1 is meant as a "no grid" handle; confirm that the
*     BLACS implementation in use accepts it in BLACS_ABORT.
*
      ICTXT = -1
      CALL BLACS_ABORT( ICTXT, 1 )
*
      STOP
*
 9999 FORMAT( A )
 9998 FORMAT( ' Number of values of ',A, ' is less than 1 or greater ',
     $        'than ', I2 )
 9997 FORMAT( ' Illegal input in file ',A,'.  Aborting run.' )
 9996 FORMAT( A7, L2 )
 9995 FORMAT( '  Subprogram name ', A7, ' not recognized',
     $        /' ******* TESTS ABANDONED *******' )
 9994 FORMAT( 2X, 'Relative machine precision (eps) is taken to be ',
     $        E18.6 )
 9993 FORMAT( 2X, 'Number of Tests           : ', I6 )
 9992 FORMAT( 2X, 'Number of process grids   : ', I6 )
 9991 FORMAT( 2X, '                          : ', 5I6 )
 9990 FORMAT( 2X, A1, '                         : ', 5I6 )
 9988 FORMAT( 2X, 'Stop on failure flag      : ', L6 )
 9987 FORMAT( 2X, 'Test for error exits flag : ', L6 )
 9986 FORMAT( 2X, 'Verbosity level           : ', I6 )
 9985 FORMAT( 2X, 'Routines to be tested     :      ', A, A8 )
 9984 FORMAT( 2X, '                                 ', A, A8 )
 9983 FORMAT( 2X, 'Leading dimension gap     : ', I6 )
 9982 FORMAT( 2X, 'Alpha                     :      (', G16.6,
     $        ',', G16.6, ')' )
*
*     End of PCBLA1TSTINFO
*
      END


      SUBROUTINE pcblas1tstchke( LTEST, INOUT, NPROCS )

*

*  -- PBLAS test routine (version 2.0) --

*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,

*     and University of California, Berkeley.

*     April 1, 1998

*

*     .. Scalar Arguments ..

      INTEGER            INOUT, NPROCS

*     ..

*     .. Array Arguments ..

      LOGICAL            LTEST( * )

*     ..

*

*  Purpose

*  =======

*

*  PCBLAS1TSTCHKE tests the error exits of the Level 1 PBLAS.

*

*  Notes

*  =====

*

*  A description  vector  is associated with each 2D block-cyclicly dis-

*  tributed matrix.  This  vector  stores  the  information  required to

*  establish the  mapping  between a  matrix entry and its corresponding

*  process and memory location.

*

*  In  the  following  comments,   the character _  should  be  read  as

*  "of  the  distributed  matrix".  Let  A  be a generic term for any 2D

*  block cyclicly distributed matrix.  Its description vector is DESCA:

*

*  NOTATION         STORED IN       EXPLANATION

*  ---------------- --------------- ------------------------------------

*  DTYPE_A (global) DESCA( DTYPE_ ) The descriptor type.

*  CTXT_A  (global) DESCA( CTXT_  ) The BLACS context handle, indicating

*                                   the NPROW x NPCOL BLACS process grid

*                                   A  is distributed over.  The context

*                                   itself  is  global,  but  the handle

*                                   (the integer value) may vary.

*  M_A     (global) DESCA( M_     ) The  number of rows in the distribu-

*                                   ted matrix A, M_A >= 0.

*  N_A     (global) DESCA( N_     ) The number of columns in the distri-

*                                   buted matrix A, N_A >= 0.

*  IMB_A   (global) DESCA( IMB_   ) The number of rows of the upper left

*                                   block of the matrix A, IMB_A > 0.

*  INB_A   (global) DESCA( INB_   ) The  number  of columns of the upper

*                                   left   block   of   the   matrix  A,

*                                   INB_A > 0.

*  MB_A    (global) DESCA( MB_    ) The blocking factor used to  distri-

*                                   bute the last  M_A-IMB_A rows of  A,

*                                   MB_A > 0.

*  NB_A    (global) DESCA( NB_    ) The blocking factor used to  distri-

*                                   bute the last  N_A-INB_A  columns of

*                                   A, NB_A > 0.

*  RSRC_A  (global) DESCA( RSRC_  ) The process row over which the first

*                                   row of the matrix  A is distributed,

*                                   NPROW > RSRC_A >= 0.

*  CSRC_A  (global) DESCA( CSRC_  ) The  process  column  over which the

*                                   first  column of  A  is distributed.

*                                   NPCOL > CSRC_A >= 0.

*  LLD_A   (local)  DESCA( LLD_   ) The  leading  dimension of the local

*                                   array  storing  the  local blocks of

*                                   the distributed matrix A,

*                                   IF( Lc( 1, N_A ) > 0 )

*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )

*                                   ELSE

*                                      LLD_A >= 1.

*

*  Let K be the number of  rows of a matrix A starting at the global in-

*  dex IA,i.e, A( IA:IA+K-1, : ). Lr( IA, K ) denotes the number of rows

*  that the process of row coordinate MYROW ( 0 <= MYROW < NPROW ) would

*  receive if these K rows were distributed over NPROW processes.  If  K

*  is the number of columns of a matrix  A  starting at the global index

*  JA, i.e, A( :, JA:JA+K-1, : ), Lc( JA, K ) denotes the number  of co-

*  lumns that the process MYCOL ( 0 <= MYCOL < NPCOL ) would  receive if

*  these K columns were distributed over NPCOL processes.

*

*  The values of Lr() and Lc() may be determined via a call to the func-

*  tion PB_NUMROC:

*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )

*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )

*

*  Arguments

*  =========

*

*  LTEST   (global input) LOGICAL array

*          On entry, LTEST is an array of dimension at least 10 (NSUBS).

*             If LTEST( 1 )  is .TRUE., PCSWAP  will be tested;

*             If LTEST( 2 )  is .TRUE., PCSCAL  will be tested;

*             If LTEST( 3 )  is .TRUE., PCSSCAL will be tested;

*             If LTEST( 4 )  is .TRUE., PCCOPY  will be tested;

*             If LTEST( 5 )  is .TRUE., PCAXPY  will be tested;

*             If LTEST( 6 )  is .TRUE., PCDOTU  will be tested;

*             If LTEST( 7 )  is .TRUE., PCDOTC  will be tested;

*             If LTEST( 8 )  is .TRUE., PSCNRM2 will be tested;

*             If LTEST( 9 )  is .TRUE., PSCASUM will be tested;

*             If LTEST( 10 ) is .TRUE., PCAMAX  will be tested.

*

*  INOUT   (global input) INTEGER

*          On entry,  INOUT  specifies  the unit number for output file.

*          When INOUT is 6, output to screen,  when INOUT = 0, output to

*          stderr. INOUT is only defined in process 0.

*

*  NPROCS  (global input) INTEGER

*          On entry, NPROCS specifies the total number of processes cal-

*          ling this routine.

*

*  Calling sequence encodings

*  ==========================

*

*  code Formal argument list                                Examples

*

*  11   (n,      v1,v2)                                     _SWAP, _COPY

*  12   (n,s1,   v1   )                                     _SCAL, _SCAL

*  13   (n,s1,   v1,v2)                                     _AXPY, _DOT_

*  14   (n,s1,i1,v1   )                                     _AMAX

*  15   (n,u1,   v1   )                                     _ASUM, _NRM2

*

*  21   (     trans,     m,n,s1,m1,v1,s2,v2)                _GEMV

*  22   (uplo,             n,s1,m1,v1,s2,v2)                _SYMV, _HEMV

*  23   (uplo,trans,diag,  n,   m1,v1      )                _TRMV, _TRSV

*  24   (                m,n,s1,v1,v2,m1)                   _GER_

*  25   (uplo,             n,s1,v1,   m1)                   _SYR

*  26   (uplo,             n,u1,v1,   m1)                   _HER

*  27   (uplo,             n,s1,v1,v2,m1)                   _SYR2, _HER2

*

*  31   (          transa,transb,     m,n,k,s1,m1,m2,s2,m3) _GEMM

*  32   (side,uplo,                   m,n,  s1,m1,m2,s2,m3) _SYMM, _HEMM

*  33   (     uplo,trans,               n,k,s1,m1,   s2,m3) _SYRK

*  34   (     uplo,trans,               n,k,u1,m1,   u2,m3) _HERK

*  35   (     uplo,trans,               n,k,s1,m1,m2,s2,m3) _SYR2K

*  36   (     uplo,trans,               n,k,s1,m1,m2,u2,m3) _HER2K

*  37   (                             m,n,  s1,m1,   s2,m3) _TRAN_

*  38   (side,uplo,transa,       diag,m,n,  s1,m1,m2      ) _TRMM, _TRSM

*  39   (          trans,             m,n,  s1,m1,   s2,m3) _GEADD

*  40   (     uplo,trans,             m,n,  s1,m1,   s2,m3) _TRADD

*

*  -- Written on April 1, 1998 by

*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.

*

*  =====================================================================

*

*     .. Parameters ..

      INTEGER            NSUBS

      PARAMETER          ( NSUBS = 10 )

*     ..

*     .. Local Scalars ..

      logical            abrtsav

      INTEGER            I, ICTXT, MYCOL, MYROW, NPCOL, NPROW

*     ..

*     .. Local Arrays ..

      INTEGER            SCODE( NSUBS )

*     ..

*     .. External Subroutines ..

      EXTERNAL           blacs_get, blacs_gridexit, blacs_gridinfo,

     $                   blacs_gridinit, pcamax, pcaxpy, pccopy,

     $                   pcdimee, pcdotc, pcdotu, pcscal, pcsscal,

     $                   pcswap, pcvecee, pscasum, pscnrm2

*     ..

*     .. Common Blocks ..

      LOGICAL            ABRTFLG

      INTEGER            NOUT

      CHARACTER*7        SNAMES( NSUBS )

      COMMON             /SNAMEC/SNAMES

      COMMON             /PBERRORC/NOUT, ABRTFLG

*     ..

*     .. Data Statements ..

      DATA               SCODE/11, 12, 12, 11, 13, 13, 13, 15, 15, 14/

*     ..

*     .. Executable Statements ..

*

*     Temporarily define blacs grid to include all processes so

*     information can be broadcast to all processes.

*

      CALL blacs_get( -1, 0, ictxt )

      CALL blacs_gridinit( ictxt, 'Row-major', 1, nprocs )

      CALL blacs_gridinfo( ictxt, nprow, npcol, myrow, mycol )

*

*     Set ABRTFLG to FALSE so that the PBLAS error handler won't abort

*     on errors during these tests and set the output device unit for

*     it.

*

      abrtsav = abrtflg

      abrtflg = .false.

      nout    = inout

*

*     Test PCSWAP

*

      i = 1

      IF( ltest( i ) ) THEN

         CALL pcdimee( ictxt, nout, pcswap, scode( i ), snames( i ) )

         CALL pcvecee( ictxt, nout, pcswap, scode( i ), snames( i ) )

      END IF

*

*     Test PCSCAL

*

      i = i + 1

      IF( ltest( i ) ) THEN

         CALL pcdimee( ictxt, nout, pcscal, scode( i ), snames( i ) )

         CALL pcvecee( ictxt, nout, pcscal, scode( i ), snames( i ) )

      END IF

*

*     Test PCSSCAL

*

      i = i + 1

      IF( ltest( i ) ) THEN

         CALL pcdimee( ictxt, nout, pcsscal, scode( i ), snames( i ) )

         CALL pcvecee( ictxt, nout, pcsscal, scode( i ), snames( i ) )

      END IF

*

*     Test PCCOPY

*

      i = i + 1

      IF( ltest( i ) ) THEN

         CALL pcdimee( ictxt, nout, pccopy, scode( i ), snames( i ) )

         CALL pcvecee( ictxt, nout, pccopy, scode( i ), snames( i ) )

      END IF

*

*     Test PCAXPY

*

      i = i + 1

      IF( ltest( i ) ) THEN

         CALL pcdimee( ictxt, nout, pcaxpy, scode( i ), snames( i ) )

         CALL pcvecee( ictxt, nout, pcaxpy, scode( i ), snames( i ) )

      END IF

*

*     Test PCDOTU

*

      i = i + 1

      IF( ltest( i ) ) THEN

         CALL pcdimee( ictxt, nout, pcdotu, scode( i ), snames( i ) )

         CALL pcvecee( ictxt, nout, pcdotu, scode( i ), snames( i ) )

      END IF

*

*     Test PCDOTC

*

      i = i + 1

      IF( ltest( i ) ) THEN

         CALL pcdimee( ictxt, nout, pcdotc, scode( i ), snames( i ) )

         CALL pcvecee( ictxt, nout, pcdotc, scode( i ), snames( i ) )

      END IF

*

*     Test PSCNRM2

*

      i = i + 1

      IF( ltest( i ) ) THEN

         CALL pcdimee( ictxt, nout, pscnrm2, scode( i ), snames( i ) )

         CALL pcvecee( ictxt, nout, pscnrm2, scode( i ), snames( i ) )

      END IF

*

*     Test PSCASUM

*

      i = i + 1

      IF( ltest( i ) ) THEN

         CALL pcdimee( ictxt, nout, pscasum, scode( i ), snames( i ) )

         CALL pcvecee( ictxt, nout, pscasum, scode( i ), snames( i ) )

      END IF

*

*     Test PCAMAX

*

      i = i + 1

      IF( ltest( i ) ) THEN

         CALL pcdimee( ictxt, nout, pcamax, scode( i ), snames( i ) )

         CALL pcvecee( ictxt, nout, pcamax, scode( i ), snames( i ) )

      END IF

*

      IF( myrow.EQ.0 .AND. mycol.EQ.0 )

     $   WRITE( nout, fmt = 9999 )

*

      CALL blacs_gridexit( ictxt )

*

*     Reset ABRTFLG to the value it had before calling this routine

*

      abrtflg = abrtsav

*

 9999 FORMAT( 2x, 'Error-exit tests completed.' )

*

      RETURN

*

*     End of PCBLAS1TSTCHKE

*


      END


      SUBROUTINE pcchkarg1( ICTXT, NOUT, SNAME, N, ALPHA, IX, JX,
     $                      DESCX, INCX, IY, JY, DESCY, INCY, INFO )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            ICTXT, INCX, INCY, INFO, IX, IY, JX, JY, N,
     $                   NOUT
      COMPLEX            ALPHA
*     ..
*     .. Array Arguments ..
      CHARACTER*(*)      SNAME
      INTEGER            DESCX( * ), DESCY( * )
*     ..
*
*  Purpose
*  =======
*
*  PCCHKARG1 checks the input-only arguments of the Level 1 PBLAS.  When
*  INFO = 0 on entry, this routine saves a copy of its arguments (which
*  are INPUT only arguments to PBLAS routines).  Otherwise, it verifies
*  the current values of these arguments against the saved copies,  and
*  process (0,0) of the grid reports the outcome on unit NOUT.
*
*  Method
*  ======
*
*  The reference copies live in local variables that are retained from
*  one call to the next by the blanket SAVE statement below.
*
*  In checking mode the comparison stops at the first mismatch, in this
*  order:  N, IX, JX, the entries of DESCX, INCX, IY, JY, the entries of
*  DESCY, INCY and finally ALPHA.  When nothing differs INFO is reset to
*  zero;  when something differs INFO keeps the non-zero value it had on
*  entry.  INFO is then combined over the whole grid by IGSUM2D  (BLACS
*  integer global sum, scope 'All'), so a mismatch seen by any process
*  is expected to be visible to process (0,0) -- see the BLACS reference
*  for the exact destination semantics of RDEST = -1.
*
*  The name of the offending argument is only recorded locally:  if the
*  mismatch was detected by other processes but not by process (0,0),
*  the argument name in the report is blank.
*
*  Notes
*  =====
*
*  A description  vector  is associated with each 2D block-cyclicly dis-
*  tributed matrix.  This  vector  stores  the  information  required to
*  establish the  mapping  between a  matrix entry and its corresponding
*  process and memory location.
*
*  In  the  following  comments,   the character _  should  be  read  as
*  "of  the  distributed  matrix".  Let  A  be a generic term for any 2D
*  block cyclicly distributed matrix.  Its description vector is DESCA:
*
*  NOTATION         STORED IN       EXPLANATION
*  ---------------- --------------- ------------------------------------
*  DTYPE_A (global) DESCA( DTYPE_ ) The descriptor type.
*  CTXT_A  (global) DESCA( CTXT_  ) The BLACS context handle, indicating
*                                   the NPROW x NPCOL BLACS process grid
*                                   A  is distributed over.  The context
*                                   itself  is  global,  but  the handle
*                                   (the integer value) may vary.
*  M_A     (global) DESCA( M_     ) The  number of rows in the distribu-
*                                   ted matrix A, M_A >= 0.
*  N_A     (global) DESCA( N_     ) The number of columns in the distri-
*                                   buted matrix A, N_A >= 0.
*  IMB_A   (global) DESCA( IMB_   ) The number of rows of the upper left
*                                   block of the matrix A, IMB_A > 0.
*  INB_A   (global) DESCA( INB_   ) The  number  of columns of the upper
*                                   left   block   of   the   matrix  A,
*                                   INB_A > 0.
*  MB_A    (global) DESCA( MB_    ) The blocking factor used to  distri-
*                                   bute the last  M_A-IMB_A rows of  A,
*                                   MB_A > 0.
*  NB_A    (global) DESCA( NB_    ) The blocking factor used to  distri-
*                                   bute the last  N_A-INB_A  columns of
*                                   A, NB_A > 0.
*  RSRC_A  (global) DESCA( RSRC_  ) The process row over which the first
*                                   row of the matrix  A is distributed,
*                                   NPROW > RSRC_A >= 0.
*  CSRC_A  (global) DESCA( CSRC_  ) The  process  column  over which the
*                                   first  column of  A  is distributed.
*                                   NPCOL > CSRC_A >= 0.
*  LLD_A   (local)  DESCA( LLD_   ) The  leading  dimension of the local
*                                   array  storing  the  local blocks of
*                                   the distributed matrix A,
*                                   IF( Lc( 1, N_A ) > 0 )
*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )
*                                   ELSE
*                                      LLD_A >= 1.
*
*  Let K be the number of rows of a matrix A starting at the global
*  index IA, i.e., A( IA:IA+K-1, : ).  Lr( IA, K ) denotes the number of
*  rows that the process of row coordinate MYROW ( 0 <= MYROW < NPROW )
*  would receive if these K rows were distributed over NPROW processes.
*  If K is the number of columns of a matrix A starting at the global
*  index JA, i.e., A( :, JA:JA+K-1 ),  Lc( JA, K ) denotes the number of
*  columns that the process MYCOL ( 0 <= MYCOL < NPCOL ) would receive
*  if these K columns were distributed over NPCOL processes.
*
*  The values of Lr() and Lc() may be determined via a call to the func-
*  tion PB_NUMROC:
*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )
*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )
*
*  Arguments
*  =========
*
*  ICTXT   (local input) INTEGER
*          On entry,  ICTXT  specifies the BLACS context handle, indica-
*          ting the global  context of the operation. The context itself
*          is global, but the value of ICTXT is local.
*
*  NOUT    (global input) INTEGER
*          On entry, NOUT specifies the unit number for the output file.
*          When NOUT is 6, output to screen,  when  NOUT is 0, output to
*          stderr. NOUT is only defined for process 0.
*
*  SNAME   (global input) CHARACTER*(*)
*          On entry, SNAME specifies the subroutine  name  calling  this
*          subprogram.
*
*  N       (global input) INTEGER
*          On entry, N specifies the length of the subvector operands.
*
*  ALPHA   (global input) COMPLEX
*          On entry, ALPHA specifies the scalar alpha.
*
*  IX      (global input) INTEGER
*          On entry, IX  specifies X's global row index, which points to
*          the beginning of the submatrix sub( X ).
*
*  JX      (global input) INTEGER
*          On entry, JX  specifies X's global column index, which points
*          to the beginning of the submatrix sub( X ).
*
*  DESCX   (global and local input) INTEGER array
*          On entry, DESCX  is an integer array of dimension DLEN_. This
*          is the array descriptor for the matrix X.
*
*  INCX    (global input) INTEGER
*          On entry,  INCX   specifies  the  global  increment  for  the
*          elements of  X.  Only two values of  INCX   are  supported in
*          this version, namely 1 and M_X. INCX  must not be zero.
*
*  IY      (global input) INTEGER
*          On entry, IY  specifies Y's global row index, which points to
*          the beginning of the submatrix sub( Y ).
*
*  JY      (global input) INTEGER
*          On entry, JY  specifies Y's global column index, which points
*          to the beginning of the submatrix sub( Y ).
*
*  DESCY   (global and local input) INTEGER array
*          On entry, DESCY  is an integer array of dimension DLEN_. This
*          is the array descriptor for the matrix Y.
*
*  INCY    (global input) INTEGER
*          On entry,  INCY   specifies  the  global  increment  for  the
*          elements of  Y.  Only two values of  INCY   are  supported in
*          this version, namely 1 and M_Y. INCY  must not be zero.
*
*  INFO    (global input/global output) INTEGER
*          When INFO = 0 on entry, the values of the arguments which are
*          INPUT only arguments to a PBLAS routine are copied into  sta-
*          tic variables and INFO is unchanged on exit.  Otherwise,  the
*          values  of  the  arguments are compared against the saved co-
*          pies. In case no error has been found INFO is zero on return,
*          otherwise it is non zero.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            BLOCK_CYCLIC_2D_INB, CSRC_, CTXT_, DLEN_,
     $                   DTYPE_, IMB_, INB_, LLD_, MB_, M_, NB_, N_,
     $                   RSRC_
      PARAMETER          ( BLOCK_CYCLIC_2D_INB = 2, dlen_ = 11,
     $                   dtype_ = 1, ctxt_ = 2, m_ = 3, n_ = 4,
     $                   imb_ = 5, inb_ = 6, mb_ = 7, nb_ = 8,
     $                   rsrc_ = 9, csrc_ = 10, lld_ = 11 )
*     ..
*     .. Local Scalars ..
      INTEGER            I, INCXREF, INCYREF, IXREF, IYREF, JXREF,
     $                   JYREF, MYCOL, MYROW, NPCOL, NPROW, NREF
      COMPLEX            ALPHAREF
*     ..
*     .. Local Arrays ..
      CHARACTER*15       ARGNAME
      INTEGER            DESCXREF( DLEN_ ), DESCYREF( DLEN_ )
*     ..
*     .. External Subroutines ..
      EXTERNAL           blacs_gridinfo, igsum2d
*     ..
*     .. Save Statements ..
*
*     The reference copies must survive between the saving call and the
*     checking call, hence the blanket SAVE.
*
      SAVE
*     ..
*     .. Executable Statements ..
*
*     Get grid parameters
*
      CALL blacs_gridinfo( ictxt, nprow, npcol, myrow, mycol )
*
      IF( info.EQ.0 ) THEN
*
*        Saving call: record every input-only argument.
*
         nref     = n
         ixref    = ix
         jxref    = jx
         incxref  = incx
         iyref    = iy
         jyref    = jy
         incyref  = incy
         alpharef = alpha
         DO 10 i = 1, dlen_
            descxref( i ) = descx( i )
            descyref( i ) = descy( i )
   10    CONTINUE
*
      ELSE
*
*        Checking call: compare with the saved copies and remember the
*        name of the first argument that differs.  INFO is left at its
*        (non-zero) entry value unless every argument matches.
*
         argname = ' '
         IF( n.NE.nref ) THEN
            argname = 'N'
         ELSE IF( ix.NE.ixref ) THEN
            argname = 'IX'
         ELSE IF( jx.NE.jxref ) THEN
            argname = 'JX'
         ELSE IF( descx( dtype_ ).NE.descxref( dtype_ ) ) THEN
            argname = 'DESCX( DTYPE_ )'
         ELSE IF( descx( m_ ).NE.descxref( m_ ) ) THEN
            argname = 'DESCX( M_ )'
         ELSE IF( descx( n_ ).NE.descxref( n_ ) ) THEN
            argname = 'DESCX( N_ )'
         ELSE IF( descx( imb_ ).NE.descxref( imb_ ) ) THEN
            argname = 'DESCX( IMB_ )'
         ELSE IF( descx( inb_ ).NE.descxref( inb_ ) ) THEN
            argname = 'DESCX( INB_ )'
         ELSE IF( descx( mb_ ).NE.descxref( mb_ ) ) THEN
            argname = 'DESCX( MB_ )'
         ELSE IF( descx( nb_ ).NE.descxref( nb_ ) ) THEN
            argname = 'DESCX( NB_ )'
         ELSE IF( descx( rsrc_ ).NE.descxref( rsrc_ ) ) THEN
            argname = 'DESCX( RSRC_ )'
         ELSE IF( descx( csrc_ ).NE.descxref( csrc_ ) ) THEN
            argname = 'DESCX( CSRC_ )'
         ELSE IF( descx( ctxt_ ).NE.descxref( ctxt_ ) ) THEN
            argname = 'DESCX( CTXT_ )'
         ELSE IF( descx( lld_ ).NE.descxref( lld_ ) ) THEN
            argname = 'DESCX( LLD_ )'
         ELSE IF( incx.NE.incxref ) THEN
            argname = 'INCX'
         ELSE IF( iy.NE.iyref ) THEN
            argname = 'IY'
         ELSE IF( jy.NE.jyref ) THEN
            argname = 'JY'
         ELSE IF( descy( dtype_ ).NE.descyref( dtype_ ) ) THEN
            argname = 'DESCY( DTYPE_ )'
         ELSE IF( descy( m_ ).NE.descyref( m_ ) ) THEN
            argname = 'DESCY( M_ )'
         ELSE IF( descy( n_ ).NE.descyref( n_ ) ) THEN
            argname = 'DESCY( N_ )'
         ELSE IF( descy( imb_ ).NE.descyref( imb_ ) ) THEN
            argname = 'DESCY( IMB_ )'
         ELSE IF( descy( inb_ ).NE.descyref( inb_ ) ) THEN
            argname = 'DESCY( INB_ )'
         ELSE IF( descy( mb_ ).NE.descyref( mb_ ) ) THEN
            argname = 'DESCY( MB_ )'
         ELSE IF( descy( nb_ ).NE.descyref( nb_ ) ) THEN
            argname = 'DESCY( NB_ )'
         ELSE IF( descy( rsrc_ ).NE.descyref( rsrc_ ) ) THEN
            argname = 'DESCY( RSRC_ )'
         ELSE IF( descy( csrc_ ).NE.descyref( csrc_ ) ) THEN
            argname = 'DESCY( CSRC_ )'
         ELSE IF( descy( ctxt_ ).NE.descyref( ctxt_ ) ) THEN
            argname = 'DESCY( CTXT_ )'
         ELSE IF( descy( lld_ ).NE.descyref( lld_ ) ) THEN
            argname = 'DESCY( LLD_ )'
         ELSE IF( incy.NE.incyref ) THEN
            argname = 'INCY'
         ELSE IF( alpha.NE.alpharef ) THEN
            argname = 'ALPHA'
         ELSE
            info = 0
         END IF
*
*        Combine the per-process verdicts over the whole grid.
*
         CALL igsum2d( ictxt, 'All', ' ', 1, 1, info, 1, -1, 0 )
*
*        Only process (0,0) writes the report.  The routine name comes
*        first and the offending argument second, so that the message
*        reads "<SNAME> FAILED  changed <ARGNAME>" and matches the
*        layout of the PASSED message.
*
         IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN
            IF( info.GT.0 ) THEN
               WRITE( nout, fmt = 9999 ) sname, argname
            ELSE
               WRITE( nout, fmt = 9998 ) sname
            END IF
         END IF
*
      END IF
*
 9999 FORMAT( 2x, '   ***** Input-only parameter check: ', a,
     $        ' FAILED  changed ', a, ' *****' )
 9998 FORMAT( 2x, '   ***** Input-only parameter check: ', a,
     $        ' PASSED  *****' )
*
      RETURN
*
*     End of PCCHKARG1
*
      END


      LOGICAL FUNCTION pisinscope( ICTXT, N, IX, JX, DESCX, INCX )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            ictxt, incx, ix, jx, n
*     ..
*     .. Array Arguments ..
      INTEGER            descx( * )
*     ..
*
*  Purpose
*  =======
*
*  PISINSCOPE returns  .TRUE.  if the calling process is in the scope of
*  sub( X ) = X( IX+(JX-1)*DESCX(M_)+(i-1)*INCX ) and  .FALSE.  if it is
*  not.  This  routine is used to determine which processes should check
*  the answer returned by some Level 1 PBLAS routines.
*
*  Method
*  ======
*
*  PB_INFOG2L supplies the process row and process column that own the
*  entry ( IX, JX ).  An owner coordinate equal to -1 is accepted as a
*  match for every process in that direction (the replicated case).
*
*  Three cases are then distinguished:
*
*     DESCX( M_ ) = 1 and N = 1   the process must match both the owner
*                                 row and the owner column;
*     INCX = DESCX( M_ )          row vector, only the owner row counts;
*     otherwise                   column vector,  only the owner column
*                                 counts.
*
*  Notes
*  =====
*
*  A description  vector  is associated with each 2D block-cyclicly dis-
*  tributed matrix.  This  vector  stores  the  information  required to
*  establish the  mapping  between a  matrix entry and its corresponding
*  process and memory location.
*
*  In  the  following  comments,   the character _  should  be  read  as
*  "of  the  distributed  matrix".  Let  A  be a generic term for any 2D
*  block cyclicly distributed matrix.  Its description vector is DESCA:
*
*  NOTATION         STORED IN       EXPLANATION
*  ---------------- --------------- ------------------------------------
*  DTYPE_A (global) DESCA( DTYPE_ ) The descriptor type.
*  CTXT_A  (global) DESCA( CTXT_  ) The BLACS context handle, indicating
*                                   the NPROW x NPCOL BLACS process grid
*                                   A  is distributed over.  The context
*                                   itself  is  global,  but  the handle
*                                   (the integer value) may vary.
*  M_A     (global) DESCA( M_     ) The  number of rows in the distribu-
*                                   ted matrix A, M_A >= 0.
*  N_A     (global) DESCA( N_     ) The number of columns in the distri-
*                                   buted matrix A, N_A >= 0.
*  IMB_A   (global) DESCA( IMB_   ) The number of rows of the upper left
*                                   block of the matrix A, IMB_A > 0.
*  INB_A   (global) DESCA( INB_   ) The  number  of columns of the upper
*                                   left   block   of   the   matrix  A,
*                                   INB_A > 0.
*  MB_A    (global) DESCA( MB_    ) The blocking factor used to  distri-
*                                   bute the last  M_A-IMB_A rows of  A,
*                                   MB_A > 0.
*  NB_A    (global) DESCA( NB_    ) The blocking factor used to  distri-
*                                   bute the last  N_A-INB_A  columns of
*                                   A, NB_A > 0.
*  RSRC_A  (global) DESCA( RSRC_  ) The process row over which the first
*                                   row of the matrix  A is distributed,
*                                   NPROW > RSRC_A >= 0.
*  CSRC_A  (global) DESCA( CSRC_  ) The  process  column  over which the
*                                   first  column of  A  is distributed.
*                                   NPCOL > CSRC_A >= 0.
*  LLD_A   (local)  DESCA( LLD_   ) The  leading  dimension of the local
*                                   array  storing  the  local blocks of
*                                   the distributed matrix A,
*                                   IF( Lc( 1, N_A ) > 0 )
*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )
*                                   ELSE
*                                      LLD_A >= 1.
*
*  Let K be the number of rows of a matrix A starting at the global
*  index IA, i.e., A( IA:IA+K-1, : ).  Lr( IA, K ) denotes the number of
*  rows that the process of row coordinate MYROW ( 0 <= MYROW < NPROW )
*  would receive if these K rows were distributed over NPROW processes.
*  If K is the number of columns of a matrix A starting at the global
*  index JA, i.e., A( :, JA:JA+K-1 ),  Lc( JA, K ) denotes the number of
*  columns that the process MYCOL ( 0 <= MYCOL < NPCOL ) would receive
*  if these K columns were distributed over NPCOL processes.
*
*  The values of Lr() and Lc() may be determined via a call to the func-
*  tion PB_NUMROC:
*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )
*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )
*
*  Arguments
*  =========
*
*  ICTXT   (local input) INTEGER
*          On entry,  ICTXT  specifies the BLACS context handle, indica-
*          ting the global  context of the operation. The context itself
*          is global, but the value of ICTXT is local.
*
*  N       (global input) INTEGER
*          The length of the subvector sub( X ).
*
*  IX      (global input) INTEGER
*          On entry, IX  specifies X's global row index, which points to
*          the beginning of the submatrix sub( X ).
*
*  JX      (global input) INTEGER
*          On entry, JX  specifies X's global column index, which points
*          to the beginning of the submatrix sub( X ).
*
*  DESCX   (global and local input) INTEGER array
*          On entry, DESCX  is an integer array of dimension DLEN_. This
*          is the array descriptor for the matrix X.
*
*  INCX    (global input) INTEGER
*          On entry,  INCX   specifies  the  global  increment  for  the
*          elements of  X.  Only two values of  INCX   are  supported in
*          this version, namely 1 and M_X. INCX  must not be zero.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            block_cyclic_2d_inb, csrc_, ctxt_, dlen_,
     $                   dtype_, imb_, inb_, lld_, mb_, m_, nb_, n_,
     $                   rsrc_
      PARAMETER          ( block_cyclic_2d_inb = 2, dlen_ = 11,
     $                   dtype_ = 1, ctxt_ = 2, m_ = 3, n_ = 4,
     $                   imb_ = 5, inb_ = 6, mb_ = 7, nb_ = 8,
     $                   rsrc_ = 9, csrc_ = 10, lld_ = 11 )
*     ..
*     .. Local Scalars ..
      LOGICAL            incol, inrow
      INTEGER            iloc, jloc, mycol, myrow, npcol, nprow,
     $                   owncol, ownrow
*     ..
*     .. External Subroutines ..
      EXTERNAL           blacs_gridinfo, pb_infog2l
*     ..
*     .. Executable Statements ..
*
*     Grid shape and the coordinates of the calling process.
*
      CALL blacs_gridinfo( ictxt, nprow, npcol, myrow, mycol )
*
*     Owner of the first entry ( IX, JX ) of sub( X ).  The local
*     indices returned in ILOC and JLOC are not needed here.
*
      CALL pb_infog2l( ix, jx, descx, nprow, npcol, myrow, mycol,
     $                 iloc, jloc, ownrow, owncol )
*
*     Membership in each direction; -1 matches every process.
*
      inrow = ( ownrow.EQ.-1 .OR. ownrow.EQ.myrow )
      incol = ( owncol.EQ.-1 .OR. owncol.EQ.mycol )
*
      IF( n.EQ.1 .AND. descx( m_ ).EQ.1 ) THEN
*
*        Special case: only the owner of ( IX, JX ) is in scope.
*
         pisinscope = ( inrow .AND. incol )
*
      ELSE IF( incx.EQ.descx( m_ ) ) THEN
*
*        Row vector
*
         pisinscope = inrow
*
      ELSE
*
*        Column vector
*
         pisinscope = incol
*
      END IF
*
      RETURN
*
*     End of PISINSCOPE
*
      END


      SUBROUTINE pcblas1tstchk( ICTXT, NOUT, NROUT, N, PSCLR, PUSCLR,

     $                          PISCLR, X, PX, IX, JX, DESCX, INCX, Y,

     $                          PY, IY, JY, DESCY, INCY, INFO )

*

*  -- PBLAS test routine (version 2.0) --

*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,

*     and University of California, Berkeley.

*     April 1, 1998

*

*     .. Scalar Arguments ..

      INTEGER            ICTXT, INCX, INCY, INFO, IX, IY, JX, JY, N,

     $                   nout, nrout, pisclr

      REAL               PUSCLR

      COMPLEX            PSCLR

*     ..

*     .. Array Arguments ..

      INTEGER            DESCX( * ), DESCY( * )

      COMPLEX            PX( * ), PY( * ), X( * ), Y( * )

*     ..

*

*  Purpose

*  =======

*

*  PCBLAS1TSTCHK performs the computational tests of the Level 1 PBLAS.

*

*  Notes

*  =====

*

*  A description  vector  is associated with each 2D block-cyclicly dis-

*  tributed matrix.  This  vector  stores  the  information  required to

*  establish the  mapping  between a  matrix entry and its corresponding

*  process and memory location.

*

*  In  the  following  comments,   the character _  should  be  read  as

*  "of  the  distributed  matrix".  Let  A  be a generic term for any 2D

*  block cyclicly distributed matrix.  Its description vector is DESCA:

*

*  NOTATION         STORED IN       EXPLANATION

*  ---------------- --------------- ------------------------------------

*  DTYPE_A (global) DESCA( DTYPE_ ) The descriptor type.

*  CTXT_A  (global) DESCA( CTXT_  ) The BLACS context handle, indicating

*                                   the NPROW x NPCOL BLACS process grid

*                                   A  is distributed over.  The context

*                                   itself  is  global,  but  the handle

*                                   (the integer value) may vary.

*  M_A     (global) DESCA( M_     ) The  number of rows in the distribu-

*                                   ted matrix A, M_A >= 0.

*  N_A     (global) DESCA( N_     ) The number of columns in the distri-

*                                   buted matrix A, N_A >= 0.

*  IMB_A   (global) DESCA( IMB_   ) The number of rows of the upper left

*                                   block of the matrix A, IMB_A > 0.

*  INB_A   (global) DESCA( INB_   ) The  number  of columns of the upper

*                                   left   block   of   the   matrix  A,

*                                   INB_A > 0.

*  MB_A    (global) DESCA( MB_    ) The blocking factor used to  distri-

*                                   bute the last  M_A-IMB_A rows of  A,

*                                   MB_A > 0.

*  NB_A    (global) DESCA( NB_    ) The blocking factor used to  distri-

*                                   bute the last  N_A-INB_A  columns of

*                                   A, NB_A > 0.

*  RSRC_A  (global) DESCA( RSRC_  ) The process row over which the first

*                                   row of the matrix  A is distributed,

*                                   NPROW > RSRC_A >= 0.

*  CSRC_A  (global) DESCA( CSRC_  ) The  process  column  over which the

*                                   first  column of  A  is distributed.

*                                   NPCOL > CSRC_A >= 0.

*  LLD_A   (local)  DESCA( LLD_   ) The  leading  dimension of the local

*                                   array  storing  the  local blocks of

*                                   the distributed matrix A,

*                                   IF( Lc( 1, N_A ) > 0 )

*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )

*                                   ELSE

*                                      LLD_A >= 1.

*

*  Let K be the number of  rows of a matrix A starting at the global in-

*  dex IA,i.e, A( IA:IA+K-1, : ). Lr( IA, K ) denotes the number of rows

*  that the process of row coordinate MYROW ( 0 <= MYROW < NPROW ) would

*  receive if these K rows were distributed over NPROW processes.  If  K

*  is the number of columns of a matrix  A  starting at the global index

*  JA, i.e, A( :, JA:JA+K-1, : ), Lc( JA, K ) denotes the number  of co-

*  lumns that the process MYCOL ( 0 <= MYCOL < NPCOL ) would  receive if

*  these K columns were distributed over NPCOL processes.

*

*  The values of Lr() and Lc() may be determined via a call to the func-

*  tion PB_NUMROC:

*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )

*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )

*

*  Arguments

*  =========

*

*  ICTXT   (local input) INTEGER

*          On entry,  ICTXT  specifies the BLACS context handle, indica-

*          ting the global  context of the operation. The context itself

*          is global, but the value of ICTXT is local.

*

*  NOUT    (global input) INTEGER

*          On entry, NOUT specifies the unit number for the output file.

*          When NOUT is 6, output to screen,  when  NOUT is 0, output to

*          stderr. NOUT is only defined for process 0.

*

*  NROUT   (global input) INTEGER

*          On entry,  NROUT  specifies  which  routine will be tested as

*          follows:

*             If NROUT = 1,       PCSWAP  will be tested;

*             else if NROUT = 2,  PCSCAL  will be tested;

*             else if NROUT = 3,  PCSSCAL will be tested;

*             else if NROUT = 4,  PCCOPY  will be tested;

*             else if NROUT = 5,  PCAXPY  will be tested;

*             else if NROUT = 6,  PCDOTU  will be tested;

*             else if NROUT = 7,  PCDOTC  will be tested;

*             else if NROUT = 8,  PSCNRM2 will be tested;

*             else if NROUT = 9,  PSCASUM will be tested;

*             else if NROUT = 10, PCAMAX  will be tested.

*

*  N       (global input) INTEGER

*          On entry, N specifies the length of the subvector operands.

*

*  PSCLR   (global input) COMPLEX

*          On entry, depending on the value of  NROUT,  PSCLR  specifies

*          the scalar ALPHA, or the output scalar returned by the PBLAS,

*          i.e., the dot product, the 2-norm,  the  absolute sum  or the

*          value of AMAX.

*

*  PUSCLR  (global input) REAL

*          On entry, PUSCLR specifies the real part of the  scalar ALPHA

*          used  by  the  real  scaling, the 2-norm, or the absolute sum

*          routines.  PUSCLR  is  not  used in the real versions of this

*          routine.

*

*  PISCLR  (global input) INTEGER

*          On entry, PISCLR  specifies the value of the global index re-

*          turned by PCAMAX, otherwise PISCLR is not used.

*

*  X       (local input/local output) COMPLEX array

*          On entry, X is an array of  dimension  (DESCX( M_ ),*).  This

*          array contains a local copy of the initial entire matrix PX.

*

*  PX      (local input) COMPLEX array

*          On entry, PX is an array of dimension (DESCX( LLD_ ),*). This

*          array contains the local entries of the matrix PX.

*

*  IX      (global input) INTEGER

*          On entry, IX  specifies X's global row index, which points to

*          the beginning of the submatrix sub( X ).

*

*  JX      (global input) INTEGER

*          On entry, JX  specifies X's global column index, which points

*          to the beginning of the submatrix sub( X ).

*

*  DESCX   (global and local input) INTEGER array

*          On entry, DESCX  is an integer array of dimension DLEN_. This

*          is the array descriptor for the matrix X.

*

*  INCX    (global input) INTEGER

*          On entry,  INCX   specifies  the  global  increment  for  the

*          elements of  X.  Only two values of  INCX   are  supported in

*          this version, namely 1 and M_X. INCX  must not be zero.

*

*  Y       (local input/local output) COMPLEX array

*          On entry, Y is an array of  dimension  (DESCY( M_ ),*).  This

*          array contains a local copy of the initial entire matrix PY.

*

*  PY      (local input) COMPLEX array

*          On entry, PY is an array of dimension (DESCY( LLD_ ),*). This

*          array contains the local entries of the matrix PY.

*

*  IY      (global input) INTEGER

*          On entry, IY  specifies Y's global row index, which points to

*          the beginning of the submatrix sub( Y ).

*

*  JY      (global input) INTEGER

*          On entry, JY  specifies Y's global column index, which points

*          to the beginning of the submatrix sub( Y ).

*

*  DESCY   (global and local input) INTEGER array

*          On entry, DESCY  is an integer array of dimension DLEN_. This

*          is the array descriptor for the matrix Y.

*

*  INCY    (global input) INTEGER

*          On entry,  INCY   specifies  the  global  increment  for  the

*          elements of  Y.  Only two values of  INCY   are  supported in

*          this version, namely 1 and M_Y. INCY  must not be zero.

*

*  INFO    (global output) INTEGER

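*          On exit, if INFO = 0,  no  error  has  been  found, otherwise

*          if( MOD( INFO,    2 ) = 1 ) then an error on X has been found,

*          if( MOD( INFO/2,  2 ) = 1 ) then an error on Y has been found,

*          if( MOD( INFO/4,  2 ) = 1 ) then the scalar result is  wrong

*                                      in scope,

*          if( MOD( INFO/8,  2 ) = 1 ) then the scalar result is  wrong

*                                      out of scope,

*          if( MOD( INFO/16, 2 ) = 1 ) then the index result  is  wrong

*                                      in scope,

*          if( MOD( INFO/32, 2 ) = 1 ) then the index result  is  wrong

*                                      out of scope.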

*

*  -- Written on April 1, 1998 by

*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.

*

*  =====================================================================

*

*     .. Parameters ..

      REAL               RZERO

      COMPLEX            ZERO

      PARAMETER          ( ZERO = ( 0.0e+0, 0.0e+0 ),

     $                   rzero = 0.0e+0 )

      INTEGER            BLOCK_CYCLIC_2D_INB, CSRC_, CTXT_, DLEN_,

     $                   DTYPE_, IMB_, INB_, LLD_, MB_, M_, NB_, N_,

     $                   RSRC_

      PARAMETER          ( BLOCK_CYCLIC_2D_INB = 2, dlen_ = 11,

     $                   dtype_ = 1, ctxt_ = 2, m_ = 3, n_ = 4,

     $                   imb_ = 5, inb_ = 6, mb_ = 7, nb_ = 8,

     $                   rsrc_ = 9, csrc_ = 10, lld_ = 11 )

*     ..

*     .. Local Scalars ..

      LOGICAL            COLREP, INXSCOPE, INYSCOPE, ROWREP

      INTEGER            I, IB, ICURCOL, ICURROW, IDUMM, IIX, IIY, IN,

     $                   ioffx, ioffy, isclr, ixcol, ixrow, iycol,

     $                   iyrow, j, jb, jjx, jjy, jn, kk, ldx, ldy,

     $                   mycol, myrow, npcol, nprow

      REAL               ERR, ERRMAX, PREC, USCLR

      COMPLEX            SCLR

*     ..

*     .. Local Arrays ..

      INTEGER            IERR( 6 )

      CHARACTER*5        ARGIN1, ARGIN2, ARGOUT1, ARGOUT2

*     ..

*     .. External Subroutines ..

      EXTERNAL           blacs_gridinfo, ccopy, cswap, igamx2d,

     $                   pb_infog2l, pcchkvin, pcerrasum, pcerraxpy,

     $                   pcerrdotc, pcerrdotu, pcerrnrm2, pcerrscal,

     $                   pcserrscal

*     ..

*     .. External Functions ..

      LOGICAL            PISINSCOPE

      INTEGER            ICAMAX

      REAL               PSLAMCH

      EXTERNAL           ICAMAX, PISINSCOPE, PSLAMCH

*     ..

*     .. Intrinsic Functions ..

      INTRINSIC          min

*     ..

*     .. Executable Statements ..

*

      info    = 0

*

*     Quick return if possible

*

      IF( n.LE.0 )

     $   RETURN

*

      CALL blacs_gridinfo( ictxt, nprow, npcol, myrow, mycol )

*

      argin1  = '     '

      argin2  = '     '

      argout1 = '     '

      argout2 = '     '

      DO 10 i = 1, 6

         ierr( i ) = 0

   10 CONTINUE

*

      prec = pslamch( ictxt, 'precision' )

*

      IF( nrout.EQ.1 ) THEN

*

*        Test PCSWAP

*

         ioffx = ix + ( jx - 1 ) * descx( m_ )

         ioffy = iy + ( jy - 1 ) * descy( m_ )

         CALL cswap( n, x( ioffx ), incx, y( ioffy ), incy )

         CALL pcchkvin( errmax, n, x, px, ix, jx, descx, incx,

     $                    ierr( 1 ) )

         CALL pcchkvin( errmax, n, y, py, iy, jy, descy, incy,

     $                    ierr( 2 ) )

*

      ELSE IF( nrout.EQ.2 ) THEN

*

*        Test PCSCAL

*

         ldx   = descx( lld_ )

         ioffx = ix + ( jx - 1 ) * descx( m_ )

         CALL pb_infog2l( ix, jx, descx, nprow, npcol, myrow, mycol,

     $                    iix, jjx, ixrow, ixcol )

         icurrow = ixrow

         icurcol = ixcol

         rowrep = ( ixrow.EQ.-1 )

         colrep = ( ixcol.EQ.-1 )

*

         IF( incx.EQ.descx( m_ ) ) THEN

*

*           sub( X ) is a row vector

*

            jb = descx( inb_ ) - jx + 1

            IF( jb.LE.0 )

     $         jb = ( (-jb ) / descx( nb_ ) + 1 ) * descx( nb_ ) + jb

            jb = min( jb, n )

            jn = jx + jb - 1

*

            DO 20 j = jx, jn

*

               CALL pcerrscal( err, psclr, x( ioffx ), prec )

*

               IF( ( myrow.EQ.icurrow .OR. rowrep ) .AND.

     $             ( mycol.EQ.icurcol .OR. colrep ) ) THEN

                  IF( abs( px( iix+(jjx-1)*ldx ) - x( ioffx ) ).GT.

     $                err )

     $             ierr( 1 ) = 1

                  jjx = jjx + 1

               END IF

*

               ioffx = ioffx + incx

*

   20       CONTINUE

*

            icurcol = mod( icurcol+1, npcol )

*

            DO 40 j = jn+1, jx+n-1, descx( nb_ )

               jb = min( jx+n-j, descx( nb_ ) )

*

               DO 30 kk = 0, jb-1

*

                  CALL pcerrscal( err, psclr, x( ioffx ), prec )

*

                  IF( ( myrow.EQ.icurrow .OR. rowrep ) .AND.

     $                ( mycol.EQ.icurcol .OR. colrep ) ) THEN

                     IF( abs( px( iix+(jjx-1)*ldx ) - x( ioffx ) ).GT.

     $                   err )

     $                  ierr( 1 ) = 1

                     jjx = jjx + 1

                  END IF

*

                  ioffx = ioffx + incx

*

   30          CONTINUE

*

               icurcol = mod( icurcol+1, npcol )

*

   40       CONTINUE

*

         ELSE

*

*           sub( X ) is a column vector

*

            ib = descx( imb_ ) - ix + 1

            IF( ib.LE.0 )

     $         ib = ( (-ib ) / descx( mb_ ) + 1 ) * descx( mb_ ) + ib

            ib = min( ib, n )

            in = ix + ib - 1

*

            DO 50 i = ix, in

*

               CALL pcerrscal( err, psclr, x( ioffx ), prec )

*

               IF( ( myrow.EQ.icurrow .OR. rowrep ) .AND.

     $             ( mycol.EQ.icurcol .OR. colrep ) ) THEN

                  IF( abs( px( iix+(jjx-1)*ldx ) - x( ioffx ) ).GT.

     $                err )

     $               ierr( 1 ) = 1

                  iix = iix + 1

               END IF

*

               ioffx = ioffx + incx

*

   50       CONTINUE

*

            icurrow = mod( icurrow+1, nprow )

*

            DO 70 i = in+1, ix+n-1, descx( mb_ )

               ib = min( ix+n-i, descx( mb_ ) )

*

               DO 60 kk = 0, ib-1

*

                  CALL pcerrscal( err, psclr, x( ioffx ), prec )

*

                  IF( ( myrow.EQ.icurrow .OR. rowrep ) .AND.

     $                ( mycol.EQ.icurcol .OR. colrep ) ) THEN

                     IF( abs( px( iix+(jjx-1)*ldx ) - x( ioffx ) ).GT.

     $                   err )

     $                  ierr( 1 ) = 1

                     iix = iix + 1

                  END IF

*

                  ioffx = ioffx + incx

   60          CONTINUE

*

               icurrow = mod( icurrow+1, nprow )

*

   70       CONTINUE

*

         END IF

*

      ELSE IF( nrout.EQ.3 ) THEN

*

*        Test PCSSCAL

*

         ldx   = descx( lld_ )

         ioffx = ix + ( jx - 1 ) * descx( m_ )

         CALL pb_infog2l( ix, jx, descx, nprow, npcol, myrow, mycol,

     $                    iix, jjx, ixrow, ixcol )

         icurrow = ixrow

         icurcol = ixcol

         rowrep  = ( ixrow.EQ.-1 )

         colrep  = ( ixcol.EQ.-1 )

*

         IF( incx.EQ.descx( m_ ) ) THEN

*

*           sub( X ) is a row vector

*

            jb = descx( inb_ ) - jx + 1

            IF( jb.LE.0 )

     $         jb = ( (-jb ) / descx( nb_ ) + 1 ) * descx( nb_ ) + jb

            jb = min( jb, n )

            jn = jx + jb - 1

*

            DO 80 j = jx, jn

*

               CALL pcserrscal( err, pusclr, x( ioffx ), prec )

*

               IF( ( myrow.EQ.icurrow .OR. rowrep ) .AND.

     $             ( mycol.EQ.icurcol .OR. colrep ) ) THEN

                  IF( abs( px( iix+(jjx-1)*ldx ) - x( ioffx ) ).GT.

     $                err )

     $             ierr( 1 ) = 1

                  jjx = jjx + 1

               END IF

*

               ioffx = ioffx + incx

*

   80       CONTINUE

*

            icurcol = mod( icurcol+1, npcol )

*

            DO 100 j = jn+1, jx+n-1, descx( nb_ )

               jb = min( jx+n-j, descx( nb_ ) )

*

               DO 90 kk = 0, jb-1

*

                  CALL pcserrscal( err, pusclr, x( ioffx ), prec )

*

                  IF( ( myrow.EQ.icurrow .OR. rowrep ) .AND.

     $                ( mycol.EQ.icurcol .OR. colrep ) ) THEN

                     IF( abs( px( iix+(jjx-1)*ldx ) - x( ioffx ) ).GT.

     $                   err )

     $                  ierr( 1 ) = 1

                     jjx = jjx + 1

                  END IF

*

                  ioffx = ioffx + incx

*

   90          CONTINUE

*

               icurcol = mod( icurcol+1, npcol )

*

  100       CONTINUE

*

         ELSE

*

*           sub( X ) is a column vector

*

            ib = descx( imb_ ) - ix + 1

            IF( ib.LE.0 )

     $         ib = ( (-ib ) / descx( mb_ ) + 1 ) * descx( mb_ ) + ib

            ib = min( ib, n )

            in = ix + ib - 1

*

            DO 110 i = ix, in

*

               CALL pcserrscal( err, pusclr, x( ioffx ), prec )

*

               IF( ( myrow.EQ.icurrow .OR. rowrep ) .AND.

     $             ( mycol.EQ.icurcol .OR. colrep ) ) THEN

                  IF( abs( px( iix+(jjx-1)*ldx ) - x( ioffx ) ).GT.

     $                err )

     $               ierr( 1 ) = 1

                  iix = iix + 1

               END IF

*

               ioffx = ioffx + incx

*

  110       CONTINUE

*

            icurrow = mod( icurrow+1, nprow )

*

            DO 130 i = in+1, ix+n-1, descx( mb_ )

               ib = min( ix+n-i, descx( mb_ ) )

*

               DO 120 kk = 0, ib-1

*

                  CALL pcserrscal( err, pusclr, x( ioffx ), prec )

*

                  IF( ( myrow.EQ.icurrow .OR. rowrep ) .AND.

     $                ( mycol.EQ.icurcol .OR. colrep ) ) THEN

                     IF( abs( px( iix+(jjx-1)*ldx ) - x( ioffx ) ).GT.

     $                   err )

     $                  ierr( 1 ) = 1

                     iix = iix + 1

                  END IF

*

                  ioffx = ioffx + incx

  120          CONTINUE

*

               icurrow = mod( icurrow+1, nprow )

*

  130       CONTINUE

*

         END IF

*

      ELSE IF( nrout.EQ.4 ) THEN

*

*        Test PCCOPY

*

         ioffx = ix + ( jx - 1 ) * descx( m_ )

         ioffy = iy + ( jy - 1 ) * descy( m_ )

         CALL ccopy( n, x( ioffx ), incx, y( ioffy ), incy )

         CALL pcchkvin( errmax, n, x, px, ix, jx, descx, incx,

     $                  ierr( 1 ) )

         CALL pcchkvin( errmax, n, y, py, iy, jy, descy, incy,

     $                  ierr( 2 ) )

*

      ELSE IF( nrout.EQ.5 ) THEN

*

*        Test PCAXPY

*

         CALL pcchkvin( errmax, n, x, px, ix, jx, descx, incx,

     $                  ierr( 1 ) )

         ldy = descy( lld_ )

         ioffx = ix + ( jx - 1 ) * descx( m_ )

         ioffy = iy + ( jy - 1 ) * descy( m_ )

         CALL pb_infog2l( iy, jy, descy, nprow, npcol, myrow, mycol,

     $                    iiy, jjy, iyrow, iycol )

         icurrow = iyrow

         icurcol = iycol

         rowrep  = ( iyrow.EQ.-1 )

         colrep  = ( iycol.EQ.-1 )

*

         IF( incy.EQ.descy( m_ ) ) THEN

*

*           sub( Y ) is a row vector

*

            jb = descy( inb_ ) - jy + 1

            IF( jb.LE.0 )

     $         jb = ( (-jb ) / descy( nb_ ) + 1 ) * descy( nb_ ) + jb

            jb = min( jb, n )

            jn = jy + jb - 1

*

            DO 140 j = jy, jn

*

               CALL pcerraxpy( err, psclr, x( ioffx ), y( ioffy ),

     $                         prec )

*

               IF( ( myrow.EQ.icurrow .OR. rowrep ) .AND.

     $             ( mycol.EQ.icurcol .OR. colrep ) ) THEN

                  IF( abs( py( iiy+(jjy-1)*ldy ) - y( ioffy ) ).GT.

     $                err ) THEN

                     ierr( 2 ) = 1

                  END IF

                  jjy = jjy + 1

               END IF

*

               ioffx = ioffx + incx

               ioffy = ioffy + incy

*

  140       CONTINUE

*

            icurcol = mod( icurcol+1, npcol )

*

            DO 160 j = jn+1, jy+n-1, descy( nb_ )

               jb = min( jy+n-j, descy( nb_ ) )

*

               DO 150 kk = 0, jb-1

*

                  CALL pcerraxpy( err, psclr, x( ioffx ), y( ioffy ),

     $                            prec )

*

                  IF( ( myrow.EQ.icurrow .OR. rowrep ) .AND.

     $                ( mycol.EQ.icurcol .OR. colrep ) ) THEN

                     IF( abs( py( iiy+(jjy-1)*ldy ) - y( ioffy ) ).GT.

     $                   err ) THEN

                        ierr( 2 ) = 1

                     END IF

                     jjy = jjy + 1

                  END IF

*

                  ioffx = ioffx + incx

                  ioffy = ioffy + incy

*

  150          CONTINUE

*

               icurcol = mod( icurcol+1, npcol )

*

  160       CONTINUE

*

         ELSE

*

*           sub( Y ) is a column vector

*

            ib = descy( imb_ ) - iy + 1

            IF( ib.LE.0 )

     $         ib = ( (-ib ) / descy( mb_ ) + 1 ) * descy( mb_ ) + ib

            ib = min( ib, n )

            in = iy + ib - 1

*

            DO 170 i = iy, in

*

               CALL pcerraxpy( err, psclr, x( ioffx ), y( ioffy ),

     $                         prec )

*

               IF( ( myrow.EQ.icurrow .OR. rowrep ) .AND.

     $             ( mycol.EQ.icurcol .OR. colrep ) ) THEN

                  IF( abs( py( iiy+(jjy-1)*ldy ) - y( ioffy ) ).GT.

     $                err ) THEN

                     ierr( 2 ) = 1

                  END IF

                  iiy = iiy + 1

               END IF

*

               ioffx = ioffx + incx

               ioffy = ioffy + incy

*

  170       CONTINUE

*

            icurrow = mod( icurrow+1, nprow )

*

            DO 190 i = in+1, iy+n-1, descy( mb_ )

               ib = min( iy+n-i, descy( mb_ ) )

*

               DO 180 kk = 0, ib-1

*

                  CALL pcerraxpy( err, psclr, x( ioffx ), y( ioffy ),

     $                            prec )

*

                  IF( ( myrow.EQ.icurrow .OR. rowrep ) .AND.

     $                ( mycol.EQ.icurcol .OR. colrep ) ) THEN

                     IF( abs( py( iiy+(jjy-1)*ldy ) - y( ioffy ) ).GT.

     $                   err ) THEN

                        ierr( 2 ) = 1

                     END IF

                     iiy = iiy + 1

                  END IF

*

                  ioffx = ioffx + incx

                  ioffy = ioffy + incy

*

  180          CONTINUE

*

               icurrow = mod( icurrow+1, nprow )

*

  190       CONTINUE

*

         END IF

*

      ELSE IF( nrout.EQ.6 ) THEN

*

*        Test PCDOTU

*

         CALL pcchkvin( errmax, n, x, px, ix, jx, descx, incx,

     $                  ierr( 1 ) )

         CALL pcchkvin( errmax, n, y, py, iy, jy, descy, incy,

     $                  ierr( 2 ) )

         ioffx = ix + ( jx - 1 ) * descx( m_ )

         ioffy = iy + ( jy - 1 ) * descy( m_ )

         CALL pcerrdotu( err, n, sclr, x( ioffx ), incx, y( ioffy ),

     $                   incy, prec )

         inxscope = pisinscope( ictxt, n, ix, jx, descx, incx )

         inyscope = pisinscope( ictxt, n, iy, jy, descy, incy )

         IF( inxscope.OR.inyscope ) THEN

            IF( abs( psclr - sclr ).GT.err ) THEN

               ierr( 3 ) = 1

               WRITE( argin1, fmt = '(A)' ) 'DOTU'

               IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN

                  WRITE( nout, fmt = 9998 ) argin1

                  WRITE( nout, fmt = 9996 ) sclr, psclr

               END IF

            END IF

         ELSE

            sclr = zero

            IF( psclr.NE.sclr ) THEN

               ierr( 4 ) = 1

               WRITE( argout1, fmt = '(A)' ) 'DOTU'

               IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN

                  WRITE( nout, fmt = 9997 ) argout1

                  WRITE( nout, fmt = 9996 ) sclr, psclr

               END IF

            END IF

         END IF

*

      ELSE IF( nrout.EQ.7 ) THEN

*

*        Test PCDOTC

*

         CALL pcchkvin( errmax, n, x, px, ix, jx, descx, incx,

     $                  ierr( 1 ) )

         CALL pcchkvin( errmax, n, y, py, iy, jy, descy, incy,

     $                  ierr( 2 ) )

         ioffx = ix + ( jx - 1 ) * descx( m_ )

         ioffy = iy + ( jy - 1 ) * descy( m_ )

         CALL pcerrdotc( err, n, sclr, x( ioffx ), incx, y( ioffy ),

     $                   incy, prec )

         inxscope = pisinscope( ictxt, n, ix, jx, descx, incx )

         inyscope = pisinscope( ictxt, n, iy, jy, descy, incy )

         IF( inxscope.OR.inyscope ) THEN

            IF( abs( psclr - sclr ).GT.err ) THEN

               ierr( 3 ) = 1

               WRITE( argin1, fmt = '(A)' ) 'DOTC'

               IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN

                  WRITE( nout, fmt = 9998 ) argin1

                  WRITE( nout, fmt = 9996 ) sclr, psclr

               END IF

            END IF

         ELSE

            sclr = zero

            IF( psclr.NE.sclr ) THEN

               ierr( 4 ) = 1

               WRITE( argout1, fmt = '(A)' ) 'DOTC'

               IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN

                  WRITE( nout, fmt = 9997 ) argout1

                  WRITE( nout, fmt = 9996 ) sclr, psclr

               END IF

            END IF

         END IF

*

      ELSE IF( nrout.EQ.8 ) THEN

*

*        Test PSCNRM2

*

         CALL pcchkvin( errmax, n, x, px, ix, jx, descx, incx,

     $                  ierr( 1 ) )

         ioffx = ix + ( jx - 1 ) * descx( m_ )

         CALL pcerrnrm2( err, n, usclr, x( ioffx ), incx, prec )

         IF( pisinscope( ictxt, n, ix, jx, descx, incx ) ) THEN

            IF( abs( pusclr - usclr ).GT.err ) THEN

               ierr( 3 ) = 1

               WRITE( argin1, fmt = '(A)' ) 'NRM2'

               IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN

                  WRITE( nout, fmt = 9998 ) argin1

                  WRITE( nout, fmt = 9994 ) usclr, pusclr

               END IF

            END IF

         ELSE

            usclr = rzero

            IF( pusclr.NE.usclr ) THEN

               ierr( 4 ) = 1

               WRITE( argout1, fmt = '(A)' ) 'NRM2'

               IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN

                  WRITE( nout, fmt = 9997 ) argout1

                  WRITE( nout, fmt = 9994 ) usclr, pusclr

               END IF

            END IF

         END IF

*

      ELSE IF( nrout.EQ.9 ) THEN

*

*        Test PSCASUM

*

         CALL pcchkvin( errmax, n, x, px, ix, jx, descx, incx,

     $                  ierr( 1 ) )

         ioffx = ix + ( jx - 1 ) * descx( m_ )

         CALL pcerrasum( err, n, usclr, x( ioffx ), incx, prec )

         IF( pisinscope( ictxt, n, ix, jx, descx, incx ) ) THEN

            IF( abs( pusclr - usclr ) .GT. err ) THEN

               ierr( 3 ) = 1

               WRITE( argin1, fmt = '(A)' ) 'ASUM'

               IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN

                  WRITE( nout, fmt = 9998 ) argin1

                  WRITE( nout, fmt = 9994 ) usclr, pusclr

               END IF

            END IF

         ELSE

            usclr = rzero

            IF( pusclr.NE.usclr ) THEN

               ierr( 4 ) = 1

               WRITE( argout1, fmt = '(A)' ) 'ASUM'

               IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN

                  WRITE( nout, fmt = 9997 ) argout1

                  WRITE( nout, fmt = 9994 ) usclr, pusclr

               END IF

            END IF

         END IF

*

      ELSE IF( nrout.EQ.10 ) THEN

*

*        Test PCAMAX

*

         CALL pcchkvin( errmax, n, x, px, ix, jx, descx, incx,

     $                  ierr( 1 ) )

         ioffx = ix + ( jx - 1 ) * descx( m_ )

         IF( pisinscope( ictxt, n, ix, jx, descx, incx ) ) THEN

            isclr = icamax( n, x( ioffx ), incx )

            IF( n.LT.1 ) THEN

               sclr = zero

            ELSE IF( ( incx.EQ.1 ).AND.( descx( m_ ).EQ.1 ).AND.

     $               ( n.EQ.1 ) ) THEN

               isclr = jx

               sclr = x( ioffx )

            ELSE IF( incx.EQ.descx( m_ ) ) THEN

               isclr = jx + isclr - 1

               sclr = x( ix + ( isclr - 1 ) * descx( m_ ) )

            ELSE

               isclr = ix + isclr - 1

               sclr = x( isclr + ( jx - 1 ) * descx( m_ ) )

            END IF

*

            IF( psclr.NE.sclr ) THEN

               ierr( 3 ) = 1

               WRITE( argin1, fmt = '(A)' ) 'AMAX'

               IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN

                  WRITE( nout, fmt = 9998 ) argin1

                  WRITE( nout, fmt = 9996 ) sclr, psclr

               END IF

            END IF

*

            IF( pisclr.NE.isclr ) THEN

               ierr( 5 ) = 1

               WRITE( argin2, fmt = '(A)' ) 'INDX'

               IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN

                  WRITE( nout, fmt = 9998 ) argin2

                  WRITE( nout, fmt = 9995 ) isclr, pisclr

               END IF

            END IF

         ELSE

            isclr = 0

            sclr  = zero

            IF( psclr.NE.sclr ) THEN

               ierr( 4 ) = 1

               WRITE( argout1, fmt = '(A)' ) 'AMAX'

               IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN

                  WRITE( nout, fmt = 9997 ) argout1

                  WRITE( nout, fmt = 9996 ) sclr, psclr

               END IF

            END IF

            IF( pisclr.NE.isclr ) THEN

               ierr( 6 ) = 1

               WRITE( argout2, fmt = '(A)' ) 'INDX'

               IF( myrow.EQ.0 .AND. mycol.EQ.0 ) THEN

                  WRITE( nout, fmt = 9997 ) argout2

                  WRITE( nout, fmt = 9995 ) isclr, pisclr

               END IF

            END IF

         END IF

*

      END IF

*

*     Find IERR across all processes

*

      CALL igamx2d( ictxt, 'All', ' ', 6, 1, ierr, 6, idumm, idumm, -1,

     $              -1, 0 )

*

*     Encode the errors found in INFO

*

      IF( ierr( 1 ).NE.0 ) THEN

         info = info + 1

         IF( myrow.EQ.0 .AND. mycol.EQ.0 )

     $      WRITE( nout, fmt = 9999 ) 'X'

      END IF

*

      IF( ierr( 2 ).NE.0 ) THEN

         info = info + 2

         IF( myrow.EQ.0 .AND. mycol.EQ.0 )

     $      WRITE( nout, fmt = 9999 ) 'Y'

      END IF

*

      IF( ierr( 3 ).NE.0 )

     $   info = info + 4

*

      IF( ierr( 4 ).NE.0 )

     $   info = info + 8

*

      IF( ierr( 5 ).NE.0 )

     $   info = info + 16

*

      IF( ierr( 6 ).NE.0 )

     $   info = info + 32

*

 9999 FORMAT( 2x, '   ***** ERROR: Vector operand ', a,

     $        ' is incorrect.' )

 9998 FORMAT( 2x, '   ***** ERROR: Output scalar result ', a,

     $        ' in scope is incorrect.' )

 9997 FORMAT( 2x, '   ***** ERROR: Output scalar result ', a,

     $        ' out of scope is incorrect.' )

 9996 FORMAT( 2x, '   ***** Expected value is: ', e16.8, '+i*(',

     $        e16.8, '),', /2x, '         Obtained value is: ',

     $        e16.8, '+i*(', e16.8, ')' )

 9995 FORMAT( 2x, '   ***** Expected value is: ', i6, /2x,

     $        '         Obtained value is: ', i6 )

 9994 FORMAT( 2x, '   ***** Expected value is: ', e16.8, /2x,

     $        '         Obtained value is: ', e16.8 )

*

      RETURN

*

*     End of PCBLAS1TSTCHK

*


      END


      SUBROUTINE pcerrdotu( ERRBND, N, SCLR, X, INCX, Y, INCY, PREC )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            INCX, INCY, N
      REAL               ERRBND, PREC
      COMPLEX            SCLR
*     ..
*     .. Array Arguments ..
      COMPLEX            X( * ), Y( * )
*     ..
*
*  Purpose
*  =======
*
*  PCERRDOTU serially computes the unconjugated dot product  X**T * Y
*  and returns an acceptable error bound on the result.
*
*  Notes
*  =====
*
*  The real part of the product is the sum of the terms  Re(x)*Re(y)
*  and  -Im(x)*Im(y),  its imaginary part is the sum  of  the  terms
*  Im(x)*Re(y) and Re(x)*Im(y).  For each part, the magnitudes of the
*  non-negative terms and of the negative terms are accumulated  se-
*  parately, every term being scaled by  2 * ( 1 + PREC ).
*
*  ERRBND is  8 * PREC  times the largest of these four partial sums.
*  If dot1 = SCLR and dot2 are two different computed  results,  and
*  dot1 is being assumed to be correct, we require
*
*     abs( dot1 - dot2 ) <= ERRBND.
*
*  A negative increment traverses the corresponding vector backward,
*  starting from element  1 + ( 1 - N ) * INC  as the reference BLAS
*  does, so that no element below index 1 is referenced.
*
*  Arguments
*  =========
*
*  ERRBND  (global output) REAL
*          On exit, ERRBND  specifies the acceptable error bound.  It
*          is zero when N is not positive.
*
*  N       (global input) INTEGER
*          On entry, N specifies the length of the vector operands.
*          When N is not positive, X and Y are not referenced.
*
*  SCLR    (global output) COMPLEX
*          On exit,  SCLR  specifies  the dot product of the two vec-
*          tors X and Y. It is zero when N is not positive.
*
*  X       (global input) COMPLEX array
*          On   entry,   X   is   an   array   of   dimension  at  least
*          ( 1 + ( n - 1 )*abs( INCX ) ).  Before  entry,  the incremen-
*          ted array X must contain the vector x.
*
*  INCX    (global input) INTEGER.
*          On entry, INCX specifies the increment for the elements of X.
*          INCX must not be zero.
*
*  Y       (global input) COMPLEX array
*          On   entry,   Y   is   an   array   of   dimension  at  least
*          ( 1 + ( n - 1 )*abs( INCY ) ).  Before  entry,  the incremen-
*          ted array Y must contain the vector y.
*
*  INCY    (global input) INTEGER.
*          On entry, INCY specifies the increment for the elements of Y.
*          INCY must not be zero.
*
*  PREC    (global input) REAL
*          On entry, PREC specifies the machine precision.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, TWO, ZERO
      PARAMETER          ( ONE = 1.0e+0, two = 2.0e+0,
     $                   zero = 0.0e+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            I, IX, IY
      REAL               ADDBND, FACT, SUMINEG, SUMIPOS, SUMRNEG,
     $                   SUMRPOS, TMP, XIM, XRE, YIM, YRE
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          AIMAG, MAX, REAL
*     ..
*     .. Executable Statements ..
*
      sclr    = zero
      sumrpos = zero
      sumrneg = zero
      sumipos = zero
      sumineg = zero
      fact    = two * ( one + prec )
      addbnd  = two * two * two * prec
*
*     Starting indexes: a vector with a negative increment  is  read
*     from its far end so that every reference stays within 1..size
*
      ix = 1
      IF( incx.LT.0 )
     $   ix = 1 + ( 1 - n ) * incx
      iy = 1
      IF( incy.LT.0 )
     $   iy = 1 + ( 1 - n ) * incy
*
      DO 10 i = 1, n
*
         sclr = sclr + x( ix ) * y( iy )
*
         xre = real( x( ix ) )
         xim = aimag( x( ix ) )
         yre = real( y( iy ) )
         yim = aimag( y( iy ) )
*
*        Contributions to the real part of the product
*
         tmp = xre * yre
         IF( tmp.GE.zero ) THEN
            sumrpos = sumrpos + tmp * fact
         ELSE
            sumrneg = sumrneg - tmp * fact
         END IF
*
         tmp = - xim * yim
         IF( tmp.GE.zero ) THEN
            sumrpos = sumrpos + tmp * fact
         ELSE
            sumrneg = sumrneg - tmp * fact
         END IF
*
*        Contributions to the imaginary part of the product
*
         tmp = xim * yre
         IF( tmp.GE.zero ) THEN
            sumipos = sumipos + tmp * fact
         ELSE
            sumineg = sumineg - tmp * fact
         END IF
*
         tmp = xre * yim
         IF( tmp.GE.zero ) THEN
            sumipos = sumipos + tmp * fact
         ELSE
            sumineg = sumineg - tmp * fact
         END IF
*
         ix = ix + incx
         iy = iy + incy
*
   10 CONTINUE
*
*     The bound is driven by the largest of the four partial sums
*
      errbnd = addbnd * max( max( sumrpos, sumrneg ),
     $                       max( sumipos, sumineg ) )
*
      RETURN
*
*     End of PCERRDOTU
*
      END


      SUBROUTINE pcerrdotc( ERRBND, N, SCLR, X, INCX, Y, INCY, PREC )

*

*  -- PBLAS test routine (version 2.0) --

*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,

*     and University of California, Berkeley.

*     April 1, 1998

*

*     .. Scalar Arguments ..

      INTEGER            INCX, INCY, N

      REAL               ERRBND, PREC

      COMPLEX            SCLR

*     ..

*     .. Array Arguments ..

      COMPLEX            X( * ), Y( * )

*     ..

*

*  Purpose

*  =======

*

*  PCERRDOTC serially  computes  the  dot product X**H * Y and returns a

*  scaled relative acceptable error bound on the result.

*

*  Notes

*  =====

*

*  If dot1 = SCLR and  dot2 are two different computed results, and dot1

*  is being assumed to be correct, we require

*

*     abs( dot1 - dot2 ) <= ERRBND = ERRFACT * abs( dot1 ),

*

*  where ERRFACT is computed as the maximum of the positive and negative

*  partial  sums  multiplied  by  a constant proportional to the machine

*  precision.

*

*  Arguments

*  =========

*

*  ERRBND  (global output) REAL

*          On exit, ERRBND  specifies the scaled relative acceptable er-

*          ror bound.

*

*  N       (global input) INTEGER

*          On entry, N specifies the length of the vector operands.

*

*  SCLR    (global output) COMPLEX

*          On exit,  SCLR  specifies  the dot product of the two vectors

*          X and Y.

*

*  X       (global input) COMPLEX array

*          On   entry,   X   is   an   array   of   dimension  at  least

*          ( 1 + ( n - 1 )*abs( INCX ) ).  Before  entry,  the incremen-

*          ted array X must contain the vector x.

*

*  INCX    (global input) INTEGER.

*          On entry, INCX specifies the increment for the elements of X.

*          INCX must not be zero.

*

*  Y       (global input) COMPLEX array

*          On   entry,   Y   is   an   array   of   dimension  at  least

*          ( 1 + ( n - 1 )*abs( INCY ) ).  Before  entry,  the incremen-

*          ted array Y must contain the vector y.

*

*  INCY    (global input) INTEGER.

*          On entry, INCY specifies the increment for the elements of Y.

*          INCY must not be zero.

*

*  PREC    (global input) REAL

*          On entry, PREC specifies the machine precision.

*

*  -- Written on April 1, 1998 by

*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.

*

*  =====================================================================

*

*     .. Parameters ..

      REAL               ONE, TWO, ZERO

      PARAMETER          ( ONE = 1.0e+0, two = 2.0e+0,

     $                   zero = 0.0e+0 )

*     ..

*     .. Local Scalars ..

      INTEGER            I, IX, IY

      REAL               ADDBND, FACT, SUMINEG, SUMIPOS, SUMRNEG,

     $                   SUMRPOS, TMP

*     ..

*     .. Intrinsic Functions ..

      INTRINSIC          ABS, AIMAG, CONJG, MAX, REAL

*     ..

*     .. Executable Statements ..

*

      ix = 1

      iy = 1

      sclr = zero

      sumipos = zero

      sumineg = zero

      sumrpos = zero

      sumrneg = zero

      fact = two * ( one + prec )

      addbnd = two * two * two * prec

*

      DO 10 i = 1, n

*

         sclr = sclr + conjg( x( ix ) ) * y( iy )

*

         tmp = real( x( ix ) ) * real( y( iy ) )

         IF( tmp.GE.zero ) THEN

            sumrpos = sumrpos + tmp * fact

         ELSE

            sumrneg = sumrneg - tmp * fact

         END IF

*

         tmp = aimag( x( ix ) ) * aimag( y( iy ) )

         IF( tmp.GE.zero ) THEN

            sumrpos = sumrpos + tmp * fact

         ELSE

            sumrneg = sumrneg - tmp * fact

         END IF

*

         tmp = - aimag( x( ix ) ) * real( y( iy ) )

         IF( tmp.GE.zero ) THEN

            sumipos = sumipos + tmp * fact

         ELSE

            sumineg = sumineg - tmp * fact

         END IF

*

         tmp = real( x( ix ) ) * aimag( y( iy ) )

         IF( tmp.GE.zero ) THEN

            sumipos = sumipos + tmp * fact

         ELSE

            sumineg = sumineg - tmp * fact

         END IF

*

         ix = ix + incx

         iy = iy + incy

*

   10 CONTINUE

*

      errbnd = addbnd * max( max( sumrpos, sumrneg ),

     $                       max( sumipos, sumineg ) )

*

      RETURN

*

*     End of PCERRDOTC

*


      END


      SUBROUTINE pcerrnrm2( ERRBND, N, USCLR, X, INCX, PREC )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            INCX, N
      REAL               ERRBND, PREC, USCLR
*     ..
*     .. Array Arguments ..
      COMPLEX            X( * )
*     ..
*
*  Purpose
*  =======
*
*  PCERRNRM2  serially computes the 2-norm of the vector X and returns
*  an acceptable error bound on the result.
*
*  Notes
*  =====
*
*  If  norm1 = USCLR  and  norm2 are two different computed results, and
*  norm1 is assumed to be correct, we require
*
*     abs( norm1 - norm2 ) <= ERRBND.
*
*  The norm is accumulated as  SCALE * sqrt( SSQ ), where  SCALE is the
*  largest absolute value met so far among the real and imaginary parts
*  of the entries and SSQ is the sum of the squares of those parts  di-
*  vided by SCALE. Parts that are exactly zero are skipped.
*
*  At every update of SSQ an inflated counterpart SUMSSQ is  recomputed
*  from  the current  SSQ: the term  involving a quotient is multiplied
*  by  FACT = 1 + 2*( (1+PREC)**3 - 1 ),  and the sum is then increased
*  by ADDBND = 8*PREC times itself. On exit,
*
*     ERRBND = SUMSCA*sqrt( SUMSSQ )*( 1 + 2*1.00001*PREC ) - USCLR,
*
*  where SUMSCA equals the final value of SCALE.  When no non-zero part
*  is met (in particular when N <= 0), USCLR and ERRBND are both zero.
*
*  Arguments
*  =========
*
*  ERRBND  (global output) REAL
*          On exit, ERRBND  specifies the acceptable error bound.
*
*  N       (global input) INTEGER
*          On entry, N specifies the length of the vector operand.
*
*  USCLR   (global output) REAL
*          On exit, USCLR specifies the 2-norm of the vector X.
*
*  X       (global input) COMPLEX array
*          On   entry,   X   is   an   array   of   dimension  at  least
*          ( 1 + ( n - 1 )*abs( INCX ) ).  Before  entry,  the incremen-
*          ted array X must contain the vector x.
*
*  INCX    (global input) INTEGER.
*          On entry, INCX specifies the increment for the elements of X.
*          INCX must not be zero.  Only abs( INCX )  is used to step
*          through X, so that a negative increment  stays  within the
*          documented dimension of X.
*
*  PREC    (global input) REAL
*          On entry, PREC specifies the machine precision.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, TWO, ZERO, SQRSLK
      PARAMETER          ( ONE = 1.0E+0, TWO = 2.0E+0,
     $                   ZERO = 0.0E+0, SQRSLK = 1.00001E+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            IX, K, STRIDE
      REAL               ABSXI, ADDBND, FACT, SCALE, SSQ, SUMSCA,
     $                   SUMSSQ
*     ..
*     .. Local Arrays ..
      REAL               PART( 2 )
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          ABS, AIMAG, REAL, SQRT
*     ..
*     .. Executable Statements ..
*
      SUMSSQ = ONE
      SUMSCA = ZERO
      ADDBND = TWO * TWO * TWO * PREC
      FACT = ONE + TWO * ( ( ONE + PREC )**3 - ONE )
*
      SCALE = ZERO
      SSQ = ONE
*
*     Step with the magnitude of INCX: the same N entries are visited
*     whatever the sign of the increment.
*
      STRIDE = ABS( INCX )
*
      DO 20 IX = 1, 1 + ( N - 1 )*STRIDE, STRIDE
*
*        The real and imaginary parts go through the same update, real
*        part first.
*
         PART( 1 ) = REAL( X( IX ) )
         PART( 2 ) = AIMAG( X( IX ) )
*
         DO 10 K = 1, 2
            IF( PART( K ).NE.ZERO ) THEN
               ABSXI = ABS( PART( K ) )
               IF( SCALE.LT.ABSXI ) THEN
*
*                 New largest magnitude: rescale the running sum.
*
                  SUMSSQ = ONE + ( SSQ*( SCALE/ABSXI )**2 ) * FACT
                  ERRBND = ADDBND * SUMSSQ
                  SUMSSQ = SUMSSQ + ERRBND
                  SSQ    = ONE + SSQ*( SCALE/ABSXI )**2
                  SUMSCA = ABSXI
                  SCALE  = ABSXI
               ELSE
                  SUMSSQ = SSQ + ( ( ABSXI/SCALE )**2 ) * FACT
                  ERRBND = ADDBND * SUMSSQ
                  SUMSSQ = SUMSSQ + ERRBND
                  SSQ    = SSQ + ( ABSXI/SCALE )**2
               END IF
            END IF
   10    CONTINUE
*
   20 CONTINUE
*
      USCLR = SCALE * SQRT( SSQ )
*
*     Error on square root
*
      ERRBND = SQRT( SUMSSQ ) * ( ONE + TWO * ( SQRSLK * PREC ) )
*
      ERRBND = ( SUMSCA * ERRBND ) - USCLR
*
      RETURN
*
*     End of PCERRNRM2
*
      END


      SUBROUTINE pcerrasum( ERRBND, N, USCLR, X, INCX, PREC )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            INCX, N
      REAL               ERRBND, PREC, USCLR
*     ..
*     .. Array Arguments ..
      COMPLEX            X( * )
*     ..
*
*  Purpose
*  =======
*
*  PCERRASUM  serially computes the sum of absolute values of the vector
*  X and returns a scaled relative acceptable error bound on the result.
*  The absolute value of an entry is taken as  abs( real part ) +
*  abs( imaginary part ).
*
*  Arguments
*  =========
*
*  ERRBND  (global output) REAL
*          On exit, ERRBND  specifies a scaled relative acceptable error
*          bound. In this case the error bound is just the absolute  sum
*          multiplied by 8*PREC.
*
*  N       (global input) INTEGER
*          On entry, N specifies the length of the vector operand.  When
*          N <= 0, USCLR and ERRBND are both zero on exit.
*
*  USCLR   (global output) REAL
*          On exit, USCLR  specifies  the  sum of absolute values of the
*          vector X.
*
*  X       (global input) COMPLEX array
*          On   entry,   X   is   an   array   of   dimension  at  least
*          ( 1 + ( n - 1 )*abs( INCX ) ).  Before  entry,  the incremen-
*          ted array X must contain the vector x.
*
*  INCX    (global input) INTEGER.
*          On entry, INCX specifies the increment for the elements of X.
*          INCX must not be zero.  Only abs( INCX )  is used to step
*          through X, so that a negative increment  stays  within the
*          documented dimension of X.
*
*  PREC    (global input) REAL
*          On entry, PREC specifies the machine precision.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               TWO, ZERO
      PARAMETER          ( TWO = 2.0E+0, ZERO = 0.0E+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            IX, STRIDE
      REAL               ADDBND
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          ABS, AIMAG, REAL
*     ..
*     .. Executable Statements ..
*
      USCLR = ZERO
      ADDBND = TWO * TWO * TWO * PREC
*
*     Step with the magnitude of INCX: the same N entries are visited
*     whatever the sign of the increment.
*
      STRIDE = ABS( INCX )
*
      DO 10 IX = 1, 1 + ( N - 1 )*STRIDE, STRIDE
         USCLR = USCLR + ABS( REAL( X( IX ) ) ) +
     $                   ABS( AIMAG( X( IX ) ) )
   10 CONTINUE
*
      ERRBND = ADDBND * USCLR
*
      RETURN
*
*     End of PCERRASUM
*
      END


      SUBROUTINE pcerrscal( ERRBND, PSCLR, X, PREC )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      REAL               ERRBND, PREC
      COMPLEX            PSCLR, X
*     ..
*
*  Purpose
*  =======
*
*  PCERRSCAL  overwrites the complex scalar  X  with  PSCLR * X,  and
*  returns in  ERRBND  the tolerance  2 * PREC * abs( X )  evaluated on
*  the scaled value.
*
*  Notes
*  =====
*
*  Let s1 = PSCLR*X be the value computed here and  s2  a value obtained
*  some other way. With s1 taken as the reference, s2 is accepted when
*
*        abs( s1 - s2 ) <= ERRBND = ( 2 * PREC ) * abs( s1 ).
*
*  Arguments
*  =========
*
*  ERRBND  (global output) REAL
*          On exit, the acceptable error bound described above.
*
*  PSCLR   (global input) COMPLEX
*          On entry, the complex scale factor.
*
*  X       (global input/global output) COMPLEX
*          On entry, the scalar to be scaled. On exit, the product
*          PSCLR * X.
*
*  PREC    (global input) REAL
*          On entry, the machine precision.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               TWO
      PARAMETER          ( TWO = 2.0E+0 )
*     ..
*     .. Local Scalars ..
      REAL               RELTOL
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          ABS
*     ..
*     .. Executable Statements ..
*
*     Relative tolerance, independent of the operands.
*
      RELTOL = TWO * PREC
*
*     Scale in place, then size the bound on the scaled value.
*
      X = PSCLR * X
      ERRBND = RELTOL * ABS( X )
*
      RETURN
*
*     End of PCERRSCAL
*
      END


      SUBROUTINE pcserrscal( ERRBND, PUSCLR, X, PREC )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      REAL               ERRBND, PREC, PUSCLR
      COMPLEX            X
*     ..
*
*  Purpose
*  =======
*
*  PCSERRSCAL  overwrites the complex scalar  X  with  PUSCLR * X, where
*  PUSCLR is real, and returns in ERRBND the tolerance
*  2 * PREC * abs( X )  evaluated on the scaled value.  The real and
*  imaginary parts of X are each multiplied by PUSCLR.
*
*  Notes
*  =====
*
*  Let s1 = PUSCLR*X be the value computed here and s2 a value  obtained
*  some other way. With s1 taken as the reference, s2 is accepted when
*
*        abs( s1 - s2 ) <= ERRBND = ( 2 * PREC ) * abs( s1 ).
*
*  Arguments
*  =========
*
*  ERRBND  (global output) REAL
*          On exit, the acceptable error bound described above.
*
*  PUSCLR  (global input) REAL
*          On entry, the real scale factor.
*
*  X       (global input/global output) COMPLEX
*          On entry, the scalar to be scaled. On exit, the product
*          PUSCLR * X.
*
*  PREC    (global input) REAL
*          On entry, the machine precision.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               TWO
      PARAMETER          ( TWO = 2.0E+0 )
*     ..
*     .. Local Scalars ..
      REAL               RELTOL, XIM, XRE
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          ABS, AIMAG, CMPLX, REAL
*     ..
*     .. Executable Statements ..
*
*     Scale each part separately and reassemble the complex value.
*
      XRE = PUSCLR * REAL( X )
      XIM = PUSCLR * AIMAG( X )
      X = CMPLX( XRE, XIM )
*
*     The bound is sized on the scaled value.
*
      RELTOL = TWO * PREC
      ERRBND = RELTOL * ABS( X )
*
      RETURN
*
*     End of PCSERRSCAL
*
      END


      SUBROUTINE pcerraxpy( ERRBND, PSCLR, X, Y, PREC )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      REAL               ERRBND, PREC
      COMPLEX            PSCLR, X, Y
*     ..
*
*  Purpose
*  =======
*
*  PCERRAXPY  overwrites the complex scalar Y with  Y + PSCLR * X  and
*  returns an acceptable error bound on the result.
*
*  Notes
*  =====
*
*  The two terms of the sum, PSCLR * X and the entry value of Y,  are
*  split  by  sign:  the magnitudes of the non-negative and of the ne-
*  gative real parts are gathered in two separate sums,  and likewise
*  for the imaginary parts.  The contributions of the product PSCLR * X
*  are multiplied by  1 + 2*PREC,  those of Y are taken as they are.
*  ERRBND is 8*PREC times the largest of the four sums.
*
*  Arguments
*  =========
*
*  ERRBND  (global output) REAL
*          On exit, the acceptable error bound described above.
*
*  PSCLR   (global input) COMPLEX
*          On entry, the complex scale factor.
*
*  X       (global input) COMPLEX
*          On entry, the scalar to be scaled.
*
*  Y       (global input/global output) COMPLEX
*          On entry, the scalar to be added. On exit,  Y  contains
*          Y + PSCLR * X.
*
*  PREC    (global input) REAL
*          On entry, the machine precision.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ONE, TWO, ZERO
      PARAMETER          ( ONE = 1.0E+0, TWO = 2.0E+0,
     $                   ZERO = 0.0E+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            K
      REAL               ADDBND, INEG, IPOS, RNEG, RPOS, TIM, TRE,
     $                   WORSTI, WORSTR
*     ..
*     .. Local Arrays ..
      REAL               WGT( 2 )
      COMPLEX            TERM( 2 )
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          AIMAG, MAX, REAL
*     ..
*     .. Executable Statements ..
*
      ADDBND = TWO * TWO * TWO * PREC
*
*     The product carries the weight 1 + 2*PREC, the entry value of Y
*     the weight one.
*
      TERM( 1 ) = PSCLR * X
      WGT( 1 ) = ONE + TWO * PREC
      TERM( 2 ) = Y
      WGT( 2 ) = ONE
*
      RPOS = ZERO
      RNEG = ZERO
      IPOS = ZERO
      INEG = ZERO
*
      DO 10 K = 1, 2
         TRE = REAL( TERM( K ) )
         TIM = AIMAG( TERM( K ) )
*
         IF( TRE.GE.ZERO ) THEN
            RPOS = RPOS + TRE * WGT( K )
         ELSE
            RNEG = RNEG - TRE * WGT( K )
         END IF
*
         IF( TIM.GE.ZERO ) THEN
            IPOS = IPOS + TIM * WGT( K )
         ELSE
            INEG = INEG - TIM * WGT( K )
         END IF
   10 CONTINUE
*
*     Update Y only once its entry value has been accounted for.
*
      Y = Y + ( PSCLR * X )
*
      WORSTR = MAX( RPOS, RNEG )
      WORSTI = MAX( IPOS, INEG )
      ERRBND = ADDBND * MAX( WORSTR, WORSTI )
*
      RETURN
*
*     End of PCERRAXPY
*
      END

cmplx
float cmplx[2]
Definition pblas.h:136

pvdimchk
subroutine pvdimchk(ictxt, nout, n, matrix, ix, jx, descx, incx, info)
Definition pblastst.f:3

icopy
subroutine icopy(n, sx, incx, sy, incy)
Definition pblastst.f:1525

pb_descset2
subroutine pb_descset2(desc, m, n, imb, inb, mb, nb, rsrc, csrc, ctxt, lld)
Definition pblastst.f:3172

pb_infog2l
subroutine pb_infog2l(i, j, desc, nprow, npcol, myrow, mycol, ii, jj, prow, pcol)
Definition pblastst.f:1673

pvdescchk
subroutine pvdescchk(ictxt, nout, matrix, descx, dtx, mx, nx, imbx, inbx, mbx, nbx, rsrcx, csrcx, incx, mpx, nqx, iprex, imidx, ipostx, igap, gapmul, info)
Definition pblastst.f:388

pcerrnrm2
subroutine pcerrnrm2(errbnd, n, usclr, x, incx, prec)
Definition pcblas1tst.f:3426

pcbla1tstinfo
subroutine pcbla1tstinfo(summry, nout, nmat, nval, mxval, nxval, imbxval, mbxval, inbxval, nbxval, rscxval, cscxval, ixval, jxval, incxval, myval, nyval, imbyval, mbyval, inbyval, nbyval, rscyval, cscyval, iyval, jyval, incyval, ldval, ngrids, pval, ldpval, qval, ldqval, ltest, sof, tee, iam, igap, iverb, nprocs, alpha, work)
Definition pcblas1tst.f:802

pcserrscal
subroutine pcserrscal(errbnd, pusclr, x, prec)
Definition pcblas1tst.f:3710

pcerrdotu
subroutine pcerrdotu(errbnd, n, sclr, x, incx, y, incy, prec)
Definition pcblas1tst.f:3138

pcerrscal
subroutine pcerrscal(errbnd, psclr, x, prec)
Definition pcblas1tst.f:3642

pcbla1tst
program pcbla1tst
Definition pcblas1tst.f:12

pcerrdotc
subroutine pcerrdotc(errbnd, n, sclr, x, incx, y, incy, prec)
Definition pcblas1tst.f:3282

pcblas1tstchke
subroutine pcblas1tstchke(ltest, inout, nprocs)
Definition pcblas1tst.f:1495

pcchkarg1
subroutine pcchkarg1(ictxt, nout, sname, n, alpha, ix, jx, descx, incx, iy, jy, descy, incy, info)
Definition pcblas1tst.f:1778

pcblas1tstchk
subroutine pcblas1tstchk(ictxt, nout, nrout, n, psclr, pusclr, pisclr, x, px, ix, jx, descx, incx, y, py, iy, jy, descy, incy, info)
Definition pcblas1tst.f:2255

pisinscope
logical function pisinscope(ictxt, n, ix, jx, descx, incx)
Definition pcblas1tst.f:2078

pcerraxpy
subroutine pcerraxpy(errbnd, psclr, x, y, prec)
Definition pcblas1tst.f:3778

pcerrasum
subroutine pcerrasum(errbnd, n, usclr, x, incx, prec)
Definition pcblas1tst.f:3559

pclagen
subroutine pclagen(inplace, aform, diag, offa, m, n, ia, ja, desca, iaseed, a, lda)
Definition pcblastst.f:8491

pcchkvout
subroutine pcchkvout(n, x, px, ix, jx, descx, incx, info)
Definition pcblastst.f:2876

pcchkvin
subroutine pcchkvin(errmax, n, x, px, ix, jx, descx, incx, info)
Definition pcblastst.f:2582

pb_cchekpad
subroutine pb_cchekpad(ictxt, mess, m, n, a, lda, ipre, ipost, chkval)
Definition pcblastst.f:9873

pcvecee
subroutine pcvecee(ictxt, nout, subptr, scode, sname)
Definition pcblastst.f:936

pb_pclaprnt
subroutine pb_pclaprnt(m, n, a, ia, ja, desca, irprnt, icprnt, cmatnm, nout, work)
Definition pcblastst.f:9302

pcmprnt
subroutine pcmprnt(ictxt, nout, m, n, a, lda, irprnt, icprnt, cmatnm)
Definition pcblastst.f:3955

pcdimee
subroutine pcdimee(ictxt, nout, subptr, scode, sname)
Definition pcblastst.f:455

pb_cfillpad
subroutine pb_cfillpad(ictxt, m, n, a, lda, ipre, ipost, chkval)
Definition pcblastst.f:9760

pcvprnt
subroutine pcvprnt(ictxt, nout, n, x, incx, irprnt, icprnt, cvecnm)
Definition pcblastst.f:4067

pslamch
real function pslamch(ictxt, cmach)
Definition pcblastst.f:7455

max
#define max(A, B)
Definition pcgemr.c:180

min
#define min(A, B)
Definition pcgemr.c:181