program example2 implicit none * * simple example to show how to generate a scalapack matrix * contribution from Ed d'Azevedo, ORNL, 2005 * integer BLOCK_CYCLIC_2D, CSRC_, CTXT_, DLEN_, DTYPE_, $ LLD_, MB_, M_, NB_, N_, RSRC_ parameter ( BLOCK_CYCLIC_2D = 1, DLEN_ = 9, DTYPE_ = 1, $ CTXT_ = 2, M_ = 3, N_ = 4, MB_ = 5, NB_ = 6, $ RSRC_ = 7, CSRC_ = 8, LLD_ = 9 ) * * integer descA(DLEN_) * integer lwork parameter(lwork=10*1000) double precision work(lwork) * integer Asize parameter(Asize=32*1000*1000) * integer nout parameter(nout=16) * double precision aij double precision A(Asize) * integer m,n,mb,nb integer info, ierr(1) integer iam,nprocs integer icontext, myprow,mypcol,nprow,npcol integer rsrc,csrc,lld,Locp,Locq,Aneed * integer ia,ja,irprnt,icprnt logical isroot, isok * integer lrindx,lcindx,ipos logical do_print * integer lroffset,lcoffset integer ia_first, ja_first integer iastart,iaend, jastart,jaend * double precision t1,t2 double precision MPI_Wtime external MPI_Wtime * integer numroc, indxg2p external numroc, indxg2p external infog2l, descinit * mb = 50 nb = 50 m = 400 n = 400 * * ----------------------- * setup blacs environment * ----------------------- call blacs_pinfo( iam,nprocs) * do nprow=int( sqrt(real(nprocs)) )+1,1,-1 npcol = nprocs/nprow if (nprow*npcol.eq.nprocs) goto 11 enddo 11 continue * call blacs_get(-1,0,icontext) call blacs_gridinit( icontext, 'Col-major', nprow,npcol) call blacs_gridinfo( icontext, nprow,npcol, myprow,mypcol) isroot = (myprow.eq.0).and.(mypcol.eq.0) * if (isroot) then write(*,*) 'nprow,npcol ', nprow,npcol write(*,*) 'm,n ', m,n write(*,*) 'mb,nb ', mb,nb endif * * --------------------------------------------------------- * compute local extent and allocate storage for local piece * --------------------------------------------------------- * csrc = 0 rsrc = 0 * Locq = numroc(n,nb,mypcol,csrc,npcol) Locq = max(1,Locq) Locp = numroc(m,mb,myprow,rsrc,nprow) * lld = max(Locp,1) Aneed = lld*Locq isok = (Aneed.le.Asize) if (.not.isok) then if (isroot) then write(*,*) 'increase Asize to ',Aneed + 1 endif goto 999 endif * * ---------------- * setup descriptor * ---------------- * call descinit(descA,m,n,mb,nb,rsrc,csrc,icontext,lld,info) ierr(1) = info call igsum2d( icontext, 'All', ' ',1,1,ierr,1,-1,-1) isok = (info.eq.0) if (.not.isok) then if (isroot) then write(*,*) 'descinit returns info = ',info endif goto 999 endif * * ------------------------------ * better method to setup matrix * take advantage of the block 2D cyclic format * * (ia,ja) are global indices * ------------------------------ * call blacs_barrier( icontext, 'All') t1 = MPI_Wtime() * * ------------------------------------------------- * compute the first array index on local processor * ------------------------------------------------- * if (myprow.ge.descA(RSRC_)) then ia_first = (myprow-descA(RSRC_))*descA(MB_) + 1 else ia_first = (myprow + (nprow-descA(RSRC_)))*descA(MB_)+1 endif * if (mypcol.ge.descA(CSRC_)) then ja_first = (mypcol-descA(CSRC_))*descA(NB_) + 1 else ja_first = (mypcol + (npcol-descA(CSRC_)))*descA(NB_)+1 endif * * ---------------------------------- * Note skip by npcol*nb and nprow*mb * ---------------------------------- * do jastart=ja_first,descA(N_), npcol*descA(NB_) do iastart=ia_first,descA(M_), nprow*descA(MB_) * iaend = min( descA(M_), iastart + descA(MB_)-1) jaend = min( descA(N_), jastart + descA(NB_)-1) * * --------------------------------------------- * block (iastart:iaend, jastart:jaend) is * within the same block on the local processor * * Need to compute local array index for 1st entry * in the local block * --------------------------------------------- * ia = iastart ja = jastart call infog2l(ia,ja,descA,nprow,npcol,myprow,mypcol, & lroffset,lcoffset, rsrc,csrc) * do ja=jastart,jaend do ia=iastart,iaend * call generate_Aij( m,n, ia,ja, aij ) * lrindx = lroffset + (ia-iastart) lcindx = lcoffset + (ja-jastart) * ipos = lrindx + (lcindx-1)*descA(LLD_) A(ipos) = aij * enddo enddo * enddo enddo * call blacs_barrier( icontext, 'All') t2 = MPI_Wtime() if (isroot) then write(*,*) 'time to build matrix is ',t2-t1,' sec' endif * * -------------------------------------------- * if matrix is not too big, print out content * for debugging * -------------------------------------------- * do_print = ((m*n.le.200*1000).and.(lwork.ge.mb)) if (do_print) then * ia = 1 ja = 1 irprnt = 0 icprnt = 0 call pdlaprnt(m,n,A,ia,ja,descA,irprnt,icprnt,'A',nout,work) * endif * 999 continue * * --------------- * prepare to exit * --------------- * call blacs_barrier(icontext, 'All') call blacs_gridexit( icontext ) call blacs_exit(0) stop end * subroutine generate_Aij( m,n, ia,ja, aij ) implicit none integer m,n, ia,ja double precision aij aij = dble(ia) + dble(ja-1)*dble(m) return end *