pdblastim_8f_source.html

      SUBROUTINE pdlascal( TYPE, M, N, ALPHA, A, IA, JA, DESCA )

*

*  -- PBLAS test routine (version 2.0) --

*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,

*     and University of California, Berkeley.

*     April 1, 1998

*

*     .. Scalar Arguments ..

      CHARACTER*1        TYPE

      INTEGER            IA, JA, M, N

      DOUBLE PRECISION   ALPHA

*     ..

*     .. Array Arguments ..

      INTEGER            DESCA( * )

      DOUBLE PRECISION   A( * )

*     ..

*

*  Purpose

*  =======

*

*  PDLASCAL  scales the  m by n submatrix A(IA:IA+M-1,JA:JA+N-1) denoted

*  by sub( A ) by the scalar alpha. TYPE  specifies if sub( A ) is full,

*  upper triangular, lower triangular or upper Hessenberg.

*

*  Notes

*  =====

*

*  A description  vector  is associated with each 2D block-cyclicly dis-

*  tributed matrix.  This  vector  stores  the  information  required to

*  establish the  mapping  between a  matrix entry and its corresponding

*  process and memory location.

*

*  In  the  following  comments,   the character _  should  be  read  as

*  "of  the  distributed  matrix".  Let  A  be a generic term for any 2D

*  block cyclicly distributed matrix.  Its description vector is DESCA:

*

*  NOTATION         STORED IN       EXPLANATION

*  ---------------- --------------- ------------------------------------

*  DTYPE_A (global) DESCA( DTYPE_ ) The descriptor type.

*  CTXT_A  (global) DESCA( CTXT_  ) The BLACS context handle, indicating

*                                   the NPROW x NPCOL BLACS process grid

*                                   A  is distributed over.  The context

*                                   itself  is  global,  but  the handle

*                                   (the integer value) may vary.

*  M_A     (global) DESCA( M_     ) The  number of rows in the distribu-

*                                   ted matrix A, M_A >= 0.

*  N_A     (global) DESCA( N_     ) The number of columns in the distri-

*                                   buted matrix A, N_A >= 0.

*  IMB_A   (global) DESCA( IMB_   ) The number of rows of the upper left

*                                   block of the matrix A, IMB_A > 0.

*  INB_A   (global) DESCA( INB_   ) The  number  of columns of the upper

*                                   left   block   of   the   matrix  A,

*                                   INB_A > 0.

*  MB_A    (global) DESCA( MB_    ) The blocking factor used to  distri-

*                                   bute the last  M_A-IMB_A rows of  A,

*                                   MB_A > 0.

*  NB_A    (global) DESCA( NB_    ) The blocking factor used to  distri-

*                                   bute the last  N_A-INB_A  columns of

*                                   A, NB_A > 0.

*  RSRC_A  (global) DESCA( RSRC_  ) The process row over which the first

*                                   row of the matrix  A is distributed,

*                                   NPROW > RSRC_A >= 0.

*  CSRC_A  (global) DESCA( CSRC_  ) The  process  column  over which the

*                                   first  column of  A  is distributed.

*                                   NPCOL > CSRC_A >= 0.

*  LLD_A   (local)  DESCA( LLD_   ) The  leading  dimension of the local

*                                   array  storing  the  local blocks of

*                                   the distributed matrix A,

*                                   IF( Lc( 1, N_A ) > 0 )

*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )

*                                   ELSE

*                                      LLD_A >= 1.

*

*  Let K be the number of  rows of a matrix A starting at the global in-

*  dex IA, i.e., A( IA:IA+K-1, : ). Lr( IA, K ) denotes the number of rows

*  that the process of row coordinate MYROW ( 0 <= MYROW < NPROW ) would

*  receive if these K rows were distributed over NPROW processes.  If  K

*  is the number of columns of a matrix  A  starting at the global index

*  JA, i.e., A( :, JA:JA+K-1 ),  Lc( JA, K )  denotes the number  of co-

*  lumns that the process MYCOL ( 0 <= MYCOL < NPCOL ) would  receive if

*  these K columns were distributed over NPCOL processes.

*

*  The values of Lr() and Lc() may be determined via a call to the func-

*  tion PB_NUMROC:

*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )

*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )

*

*  Arguments

*  =========

*

*  TYPE    (global input) CHARACTER*1

*          On entry,  TYPE  specifies the type of the input submatrix as

*          follows:

*             = 'L' or 'l':  sub( A ) is a lower triangular matrix,

*             = 'U' or 'u':  sub( A ) is an upper triangular matrix,

*             = 'H' or 'h':  sub( A ) is an upper Hessenberg matrix,

*             otherwise sub( A ) is a  full matrix.

*

*  M       (global input) INTEGER

*          On entry,  M  specifies the number of rows of  the  submatrix

*          sub( A ). M  must be at least zero.

*

*  N       (global input) INTEGER

*          On entry, N  specifies the number of columns of the submatrix

*          sub( A ). N  must be at least zero.

*

*  ALPHA   (global input) DOUBLE PRECISION

*          On entry, ALPHA specifies the scalar alpha.

*

*  A       (local input/local output) DOUBLE PRECISION array

*          On entry, A is an array of dimension (LLD_A, Ka), where Ka is

*          at least Lc( 1, JA+N-1 ).  Before  entry, this array contains

*          the local entries of the matrix  A.

*          On exit,  the local entries of this array  corresponding  to

*          the  entries of the submatrix  sub( A )  are  overwritten  by

*          the local entries of the m by n scaled submatrix.

*

*  IA      (global input) INTEGER

*          On entry, IA  specifies A's global row index, which points to

*          the beginning of the submatrix sub( A ).

*

*  JA      (global input) INTEGER

*          On entry, JA  specifies A's global column index, which points

*          to the beginning of the submatrix sub( A ).

*

*  DESCA   (global and local input) INTEGER array

*          On entry, DESCA  is an integer array of dimension DLEN_. This

*          is the array descriptor for the matrix A.

*

*  Implementation notes
*  ====================
*
*  DESCA is first converted into the local work descriptor DESCA2 by
*  PB_DESCTRANS;  every later descriptor read uses DESCA2.
*
*  When TYPE selects a full matrix,  the local piece of sub( A ) is
*  scaled with a single call to PB_DLASCAL.  Otherwise the routine walks
*  over the local blocks described by the values PB_BINFO returns,  and
*  calls PB_DLASCAL  with UPLO  on the blocks selected by the LCMT00 /
*  LCMT tests and with 'All' on the remaining blocks that the UPPER or
*  LOWER flag enables.
*
*  The routine returns without touching A when M or N is zero, or when
*  MP <= 0 or NQ <= 0  ( no local rows or columns of sub( A ) ).
*
*  NOTE(review): only M = 0 or N = 0 triggers the quick return; negative
*  M or N  are not rejected here, and no error is reported for an inva-
*  lid descriptor or BLACS context.
*

*  -- Written on April 1, 1998 by

*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.

*

*  =====================================================================

*

*     .. Parameters ..

*     Positions of the entries inside the converted descriptor DESCA2,
*     and its length DLEN_.
*     NOTE(review): BLOCK_CYCLIC_2D_INB, DTYPE_, M_ and N_ are declared
*     but not referenced by the executable part of this routine.

      INTEGER            BLOCK_CYCLIC_2D_INB, CSRC_, CTXT_, DLEN_,

     $                   DTYPE_, IMB_, INB_, LLD_, MB_, M_, NB_, N_,

     $                   RSRC_

      parameter( block_cyclic_2d_inb = 2, dlen_ = 11,

     $                   dtype_ = 1, ctxt_ = 2, m_ = 3, n_ = 4,

     $                   imb_ = 5, inb_ = 6, mb_ = 7, nb_ = 8,

     $                   rsrc_ = 9, csrc_ = 10, lld_ = 11 )

*     ..

*     .. Local Scalars ..

*     IACOL and IAROW are only received from PB_INFOG2L / PB_AINFOG2L;
*     they are never read afterwards in this routine.

      CHARACTER*1        UPLO

      LOGICAL            GODOWN, GOLEFT, LOWER, UPPER

      INTEGER            IACOL, IAROW, ICTXT, IIA, IIMAX, ILOW, IMB1,

     $                   IMBLOC, INB1, INBLOC, IOFFA, IOFFD, ITYPE,

     $                   IUPP, JJA, JJMAX, JOFFA, JOFFD, LCMT, LCMT00,

     $                   LDA, LMBLOC, LNBLOC, LOW, M1, MB, MBLKD, MBLKS,

     $                   MBLOC, MP, MRCOL, MRROW, MYCOL, MYROW, N1, NB,

     $                   NBLKD, NBLKS, NBLOC, NPCOL, NPROW, NQ, PMB,

     $                   QNB, TMP1, UPP

*     ..

*     .. Local Arrays ..

      INTEGER            DESCA2( DLEN_ )

*     ..

*     .. External Subroutines ..

      EXTERNAL           blacs_gridinfo, pb_ainfog2l, pb_binfo,

     $                   pb_desctrans, pb_dlascal, pb_infog2l

*     ..

*     .. External Functions ..

      LOGICAL            LSAME

      INTEGER            PB_NUMROC

      EXTERNAL           lsame, pb_numroc

*     ..

*     .. Intrinsic Functions ..

      INTRINSIC          min

*     ..

*     .. Executable Statements ..

*

*     Convert descriptor

*

      CALL pb_desctrans( desca, desca2 )

*

*     Get grid parameters

*

      ictxt = desca2( ctxt_ )

      CALL blacs_gridinfo( ictxt, nprow, npcol, myrow, mycol )

*

*     Quick return if possible

*

      IF( m.EQ.0 .OR. n.EQ.0 )

     $   RETURN

*

*     Decode TYPE.  ITYPE = 0 selects the full-matrix path below,  any
*     other value the trapezoidal path.  UPLO is forwarded to PB_DLASCAL
*     for the blocks selected by the LCMT00 / LCMT tests;  UPPER and
*     LOWER enable the 'All' scaling of the remaining blocks;  IOFFD is
*     the first argument handed to PB_BINFO ( 1 for 'H', 0 otherwise ).
*

      IF( lsame( TYPE, 'L' ) ) then

         itype = 1

         uplo  = TYPE

         upper = .false.

         lower = .true.

         ioffd = 0

      ELSE IF( lsame( TYPE, 'U' ) ) then

         itype = 2

         uplo  = TYPE

         upper = .true.

         lower = .false.

         ioffd = 0

      ELSE IF( lsame( TYPE, 'H' ) ) then

         itype = 3

         uplo  = 'U'

         upper = .true.

         lower = .false.

         ioffd = 1

      ELSE

         itype = 0

         uplo  = 'A'

         upper = .true.

         lower = .true.

         ioffd = 0

      END IF

*

*     Compute local indexes

*

      IF( itype.EQ.0 ) THEN

*

*        Full matrix

*

         CALL pb_infog2l( ia, ja, desca2, nprow, npcol, myrow, mycol,

     $                    iia, jja, iarow, iacol )

         mp = pb_numroc( m, ia, desca2( imb_ ), desca2( mb_ ), myrow,

     $                   desca2( rsrc_ ), nprow )

         nq = pb_numroc( n, ja, desca2( inb_ ), desca2( nb_ ), mycol,

     $                   desca2( csrc_ ), npcol )

*

*        Nothing to scale in this process

*

         IF( mp.LE.0 .OR. nq.LE.0 )

     $      RETURN

*

*        IOFFA is the one-based position, inside the one-dimensional
*        array A with leading dimension LDA, of the entry ( IIA, JJA )
*        returned by PB_INFOG2L.
*

         lda   = desca2( lld_ )

         ioffa = iia + ( jja - 1 ) * lda

*

         CALL pb_dlascal( 'All', mp, nq, 0, alpha, a( ioffa ), lda )

*

      ELSE

*

*        Trapezoidal matrix

*

         CALL pb_ainfog2l( m, n, ia, ja, desca2, nprow, npcol, myrow,

     $                     mycol, imb1, inb1, mp, nq, iia, jja, iarow,

     $                     iacol, mrrow, mrcol )

*

*        Nothing to scale in this process

*

         IF( mp.LE.0 .OR. nq.LE.0 )

     $      RETURN

*

*        Initialize LCMT00, MBLKS, NBLKS, IMBLOC, INBLOC, LMBLOC,

*        LNBLOC, ILOW, LOW, IUPP, and UPP.

*

         mb  = desca2( mb_ )

         nb  = desca2( nb_ )

         lda = desca2( lld_ )

*

         CALL pb_binfo( ioffd, mp, nq, imb1, inb1, mb, nb, mrrow,

     $                  mrcol, lcmt00, mblks, nblks, imbloc, inbloc,

     $                  lmbloc, lnbloc, ilow, low, iupp, upp )

*

*        M1 and N1 start as the local row and column counts and are
*        decreased as rows and columns are dealt with.  IOFFA and JOFFA
*        are zero-based local row and column offsets ( A is addressed
*        as A( row + JOFFA*LDA ) below ).  IIMAX = IIA-1+MP and
*        JJMAX = JJA-1+NQ are used to cap those offsets.
*

         m1    = mp

         n1    = nq

         ioffa = iia - 1

         joffa = jja - 1

         iimax = ioffa + mp

         jjmax = joffa + nq

*

*        PMB ( QNB ) is the amount subtracted from ( added to ) LCMT00
*        or LCMT whenever the walk moves down by MB rows ( right by NB
*        columns ).  A negative RSRC_ ( CSRC_ ) entry gives MB ( NB )
*        instead of NPROW*MB ( NPCOL*NB );  presumably this marks a
*        dimension that is not distributed -- TODO confirm.
*

         IF( desca2( rsrc_ ).LT.0 ) THEN

            pmb = mb

         ELSE

            pmb = nprow * mb

         END IF

         IF( desca2( csrc_ ).LT.0 ) THEN

            qnb = nb

         ELSE

            qnb = npcol * nb

         END IF

*

*        Handle the first block of rows or columns separately, and

*        update LCMT00, MBLKS and NBLKS.

*

*        GODOWN selects the branch that advances the row offset first,
*        GOLEFT the branch that advances the column offset first.
*

         godown = ( lcmt00.GT.iupp )

         goleft = ( lcmt00.LT.ilow )

*

         IF( .NOT.godown .AND. .NOT.goleft ) THEN

*

*           LCMT00 >= ILOW && LCMT00 <= IUPP

*

*           The first local block ( IMBLOC by INBLOC ) is scaled with
*           UPLO.  The direction is chosen by testing whether LCMT00,
*           once shifted by the same amount the GODOWN branch applies,
*           would fall below ILOW.
*

            goleft = ( ( lcmt00 - ( iupp - upp + pmb ) ).LT.ilow )

            godown = .NOT.goleft

*

            CALL pb_dlascal( uplo, imbloc, inbloc, lcmt00, alpha,

     $                       a( iia+joffa*lda ), lda )

            IF( godown ) THEN

*
*              Rest of the first block of rows ( columns to the right
*              of the first INBLOC ones ), only when UPPER is set.
*

               IF( upper .AND. nq.GT.inbloc )

     $            CALL pb_dlascal( 'All', imbloc, nq-inbloc, 0, alpha,

     $                             a( iia+(joffa+inbloc)*lda ), lda )

               iia = iia + imbloc

               m1  = m1 - imbloc

            ELSE

*
*              Rest of the first block of columns ( rows below the
*              first IMBLOC ones ), only when LOWER is set.
*

               IF( lower .AND. mp.GT.imbloc )

     $            CALL pb_dlascal( 'All', mp-imbloc, inbloc, 0, alpha,

     $                             a( iia+imbloc+joffa*lda ), lda )

               jja = jja + inbloc

               n1  = n1 - inbloc

            END IF

*

         END IF

*

         IF( godown ) THEN

*

*           Step past the first block of rows.
*

            lcmt00 = lcmt00 - ( iupp - upp + pmb )

            mblks  = mblks - 1

            ioffa  = ioffa + imbloc

*

*           Loop 10: skip the blocks of rows for which LCMT00 > UPP,
*           accumulating their MB rows in IOFFA.
*

   10       CONTINUE

            IF( mblks.GT.0 .AND. lcmt00.GT.upp ) THEN

               lcmt00 = lcmt00 - pmb

               mblks  = mblks - 1

               ioffa  = ioffa + mb

               GO TO 10

            END IF

*

*           TMP1 = number of rows between IIA and the offset reached
*           ( capped at IIMAX ).  When UPPER is set they are scaled in
*           full over the N1 remaining columns.
*

            tmp1 = min( ioffa, iimax ) - iia + 1

            IF( upper .AND. tmp1.GT.0 ) THEN

               CALL pb_dlascal( 'All', tmp1, n1, 0, alpha,

     $                          a( iia+joffa*lda ), lda )

               iia = iia + tmp1

               m1  = m1 - tmp1

            END IF

*

*           No block of rows left: done.
*

            IF( mblks.LE.0 )

     $         RETURN

*

*           From here on IOFFD no longer holds the value passed to
*           PB_BINFO; it is reused as a running row offset.
*

            lcmt  = lcmt00

            mblkd = mblks

            ioffd = ioffa

*

*           Loop 20: walk down the first block of columns ( INBLOC
*           columns ) while LCMT >= ILOW, scaling each block with UPLO.
*           The last block of rows has LMBLOC rows instead of MB.
*           LCMT00, MBLKS and IOFFA are overwritten with the state of
*           the block just handled, so after the loop they describe the
*           last block that was scaled here.
*

            mbloc = mb

   20       CONTINUE

            IF( mblkd.GT.0 .AND. lcmt.GE.ilow ) THEN

               IF( mblkd.EQ.1 )

     $            mbloc = lmbloc

               CALL pb_dlascal( uplo, mbloc, inbloc, lcmt, alpha,

     $                          a( ioffd+1+joffa*lda ), lda )

               lcmt00 = lcmt

               lcmt   = lcmt - pmb

               mblks  = mblkd

               mblkd  = mblkd - 1

               ioffa  = ioffd

               ioffd  = ioffd + mbloc

               GO TO 20

            END IF

*

*           Rows left below the blocks handled by loop 20: scaled in
*           full when LOWER is set.
*

            tmp1 = m1 - ioffd + iia - 1

            IF( lower .AND. tmp1.GT.0 )

     $         CALL pb_dlascal( 'All', tmp1, inbloc, 0, alpha,

     $                          a( ioffd+1+joffa*lda ), lda )

*

*           Move to the next block of columns.
*

            tmp1   = ioffa - iia + 1

            m1     = m1 - tmp1

            n1     = n1 - inbloc

            lcmt00 = lcmt00 + low - ilow + qnb

            nblks  = nblks - 1

            joffa  = joffa + inbloc

*

*           The TMP1 rows starting at IIA are scaled in full over the
*           N1 remaining columns when UPPER is set.
*

            IF( upper .AND. tmp1.GT.0 .AND. n1.GT.0 )

     $         CALL pb_dlascal( 'All', tmp1, n1, 0, alpha,

     $                          a( iia+joffa*lda ), lda )

*

            iia = ioffa + 1

            jja = joffa + 1

*

         ELSE IF( goleft ) THEN

*

*           Step past the first block of columns.
*

            lcmt00 = lcmt00 + low - ilow + qnb

            nblks  = nblks - 1

            joffa  = joffa + inbloc

*

*           Loop 30: skip the blocks of columns for which LCMT00 < LOW,
*           accumulating their NB columns in JOFFA.
*

   30       CONTINUE

            IF( nblks.GT.0 .AND. lcmt00.LT.low ) THEN

               lcmt00 = lcmt00 + qnb

               nblks  = nblks - 1

               joffa  = joffa + nb

               GO TO 30

            END IF

*

*           TMP1 = number of columns between JJA and the offset reached
*           ( capped at JJMAX ).  When LOWER is set they are scaled in
*           full over the M1 remaining rows.
*

            tmp1 = min( joffa, jjmax ) - jja + 1

            IF( lower .AND. tmp1.GT.0 ) THEN

               CALL pb_dlascal( 'All', m1, tmp1, 0, alpha,

     $                          a( iia+(jja-1)*lda ), lda )

               jja = jja + tmp1

               n1  = n1 - tmp1

            END IF

*

*           No block of columns left: done.
*

            IF( nblks.LE.0 )

     $         RETURN

*

            lcmt  = lcmt00

            nblkd = nblks

            joffd = joffa

*

*           Loop 40: walk right along the first block of rows ( IMBLOC
*           rows ) while LCMT <= IUPP, scaling each block with UPLO.
*           The last block of columns has LNBLOC columns instead of NB.
*           LCMT00, NBLKS and JOFFA are overwritten with the state of
*           the block just handled.
*

            nbloc = nb

   40       CONTINUE

            IF( nblkd.GT.0 .AND. lcmt.LE.iupp ) THEN

               IF( nblkd.EQ.1 )

     $            nbloc = lnbloc

               CALL pb_dlascal( uplo, imbloc, nbloc, lcmt, alpha,

     $                          a( iia+joffd*lda ), lda )

               lcmt00 = lcmt

               lcmt   = lcmt + qnb

               nblks  = nblkd

               nblkd  = nblkd - 1

               joffa  = joffd

               joffd  = joffd + nbloc

               GO TO 40

            END IF

*

*           Columns left to the right of the blocks handled by loop 40:
*           scaled in full when UPPER is set.
*

            tmp1 = n1 - joffd + jja - 1

            IF( upper .AND. tmp1.GT.0 )

     $         CALL pb_dlascal( 'All', imbloc, tmp1, 0, alpha,

     $                          a( iia+joffd*lda ), lda )

*

*           Move to the next block of rows.
*

            tmp1   = joffa - jja + 1

            m1     = m1 - imbloc

            n1     = n1 - tmp1

            lcmt00 = lcmt00 - ( iupp - upp + pmb )

            mblks  = mblks - 1

            ioffa  = ioffa + imbloc

*

*           The TMP1 columns starting at JJA are scaled in full over
*           the M1 remaining rows when LOWER is set.
*

            IF( lower .AND. m1.GT.0 .AND. tmp1.GT.0 )

     $         CALL pb_dlascal( 'All', m1, tmp1, 0, alpha,

     $                          a( ioffa+1+(jja-1)*lda ), lda )

*

            iia = ioffa + 1

            jja = joffa + 1

*

         END IF

*

*        Loop 50: one pass per remaining block of columns.  NBLOC is NB
*        except for the last block, which has LNBLOC columns.
*

         nbloc = nb

   50    CONTINUE

         IF( nblks.GT.0 ) THEN

            IF( nblks.EQ.1 )

     $         nbloc = lnbloc

*
*           Loop 60: skip the blocks of rows for which LCMT00 > UPP.
*

   60       CONTINUE

            IF( mblks.GT.0 .AND. lcmt00.GT.upp ) THEN

               lcmt00 = lcmt00 - pmb

               mblks  = mblks - 1

               ioffa  = ioffa + mb

               GO TO 60

            END IF

*

*           Rows between IIA and the offset reached ( capped at IIMAX )
*           are scaled in full over the N1 remaining columns when UPPER
*           is set.
*

            tmp1 = min( ioffa, iimax ) - iia + 1

            IF( upper .AND. tmp1.GT.0 ) THEN

               CALL pb_dlascal( 'All', tmp1, n1, 0, alpha,

     $                          a( iia+joffa*lda ), lda )

               iia = iia + tmp1

               m1  = m1 - tmp1

            END IF

*

*           No block of rows left: done.
*

            IF( mblks.LE.0 )

     $         RETURN

*

            lcmt  = lcmt00

            mblkd = mblks

            ioffd = ioffa

*

*           Loop 70: walk down the current block of columns while
*           LCMT >= LOW ( loop 20 tests against ILOW instead ), scaling
*           each block with UPLO and recording the state of the block
*           just handled in LCMT00, MBLKS and IOFFA.
*

            mbloc = mb

   70       CONTINUE

            IF( mblkd.GT.0 .AND. lcmt.GE.low ) THEN

               IF( mblkd.EQ.1 )

     $            mbloc = lmbloc

               CALL pb_dlascal( uplo, mbloc, nbloc, lcmt, alpha,

     $                          a( ioffd+1+joffa*lda ), lda )

               lcmt00 = lcmt

               lcmt   = lcmt - pmb

               mblks  = mblkd

               mblkd  = mblkd - 1

               ioffa  = ioffd

               ioffd  = ioffd + mbloc

               GO TO 70

            END IF

*

*           Rows left below the blocks handled by loop 70: scaled in
*           full when LOWER is set.
*

            tmp1 = m1 - ioffd + iia - 1

            IF( lower .AND. tmp1.GT.0 )

     $         CALL pb_dlascal( 'All', tmp1, nbloc, 0, alpha,

     $                          a( ioffd+1+joffa*lda ), lda )

*

*           Move to the next block of columns.
*

            tmp1   = min( ioffa, iimax )  - iia + 1

            m1     = m1 - tmp1

            n1     = n1 - nbloc

            lcmt00 = lcmt00 + qnb

            nblks  = nblks - 1

            joffa  = joffa + nbloc

*

*           The TMP1 rows starting at IIA are scaled in full over the
*           N1 remaining columns when UPPER is set.
*

            IF( upper .AND. tmp1.GT.0 .AND. n1.GT.0 )

     $         CALL pb_dlascal( 'All', tmp1, n1, 0, alpha,

     $                          a( iia+joffa*lda ), lda )

*

            iia = ioffa + 1

            jja = joffa + 1

*

            GO TO 50

*

         END IF

*

      END IF

*

      RETURN

*

*     End of PDLASCAL

*


      END


      SUBROUTINE pdlagen( INPLACE, AFORM, DIAG, OFFA, M, N, IA, JA,

     $                    DESCA, IASEED, A, LDA )

*

*  -- PBLAS test routine (version 2.0) --

*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,

*     and University of California, Berkeley.

*     April 1, 1998

*

*     .. Scalar Arguments ..

      LOGICAL            inplace

      CHARACTER*1        aform, diag

      INTEGER            ia, iaseed, ja, lda, m, n, offa

*     ..

*     .. Array Arguments ..

      INTEGER            desca( * )

      DOUBLE PRECISION   A( LDA, * )

*     ..

*

*  Purpose

*  =======

*

*  PDLAGEN  generates  (or regenerates)  a  submatrix  sub( A ) denoting

*  A(IA:IA+M-1,JA:JA+N-1).

*

*  Notes

*  =====

*

*  A description  vector  is associated with each 2D block-cyclicly dis-

*  tributed matrix.  This  vector  stores  the  information  required to

*  establish the  mapping  between a  matrix entry and its corresponding

*  process and memory location.

*

*  In  the  following  comments,   the character _  should  be  read  as

*  "of  the  distributed  matrix".  Let  A  be a generic term for any 2D

*  block cyclicly distributed matrix.  Its description vector is DESCA:

*

*  NOTATION         STORED IN       EXPLANATION

*  ---------------- --------------- ------------------------------------

*  DTYPE_A (global) DESCA( DTYPE_ ) The descriptor type.

*  CTXT_A  (global) DESCA( CTXT_  ) The BLACS context handle, indicating

*                                   the NPROW x NPCOL BLACS process grid

*                                   A  is distributed over.  The context

*                                   itself  is  global,  but  the handle

*                                   (the integer value) may vary.

*  M_A     (global) DESCA( M_     ) The  number of rows in the distribu-

*                                   ted matrix A, M_A >= 0.

*  N_A     (global) DESCA( N_     ) The number of columns in the distri-

*                                   buted matrix A, N_A >= 0.

*  IMB_A   (global) DESCA( IMB_   ) The number of rows of the upper left

*                                   block of the matrix A, IMB_A > 0.

*  INB_A   (global) DESCA( INB_   ) The  number  of columns of the upper

*                                   left   block   of   the   matrix  A,

*                                   INB_A > 0.

*  MB_A    (global) DESCA( MB_    ) The blocking factor used to  distri-

*                                   bute the last  M_A-IMB_A rows of  A,

*                                   MB_A > 0.

*  NB_A    (global) DESCA( NB_    ) The blocking factor used to  distri-

*                                   bute the last  N_A-INB_A  columns of

*                                   A, NB_A > 0.

*  RSRC_A  (global) DESCA( RSRC_  ) The process row over which the first

*                                   row of the matrix  A is distributed,

*                                   NPROW > RSRC_A >= 0.

*  CSRC_A  (global) DESCA( CSRC_  ) The  process  column  over which the

*                                   first  column of  A  is distributed.

*                                   NPCOL > CSRC_A >= 0.

*  LLD_A   (local)  DESCA( LLD_   ) The  leading  dimension of the local

*                                   array  storing  the  local blocks of

*                                   the distributed matrix A,

*                                   IF( Lc( 1, N_A ) > 0 )

*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )

*                                   ELSE

*                                      LLD_A >= 1.

*

*  Let K be the number of  rows of a matrix A starting at the global in-

*  dex IA,i.e, A( IA:IA+K-1, : ). Lr( IA, K ) denotes the number of rows

*  that the process of row coordinate MYROW ( 0 <= MYROW < NPROW ) would

*  receive if these K rows were distributed over NPROW processes.  If  K

*  is the number of columns of a matrix  A  starting at the global index

*  JA, i.e, A( :, JA:JA+K-1, : ), Lc( JA, K ) denotes the number  of co-

*  lumns that the process MYCOL ( 0 <= MYCOL < NPCOL ) would  receive if

*  these K columns were distributed over NPCOL processes.

*

*  The values of Lr() and Lc() may be determined via a call to the func-

*  tion PB_NUMROC:

*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )

*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )

*

*  Arguments

*  =========

*

*  INPLACE (global input) LOGICAL

*          On entry, INPLACE specifies if the matrix should be generated

*          in place or not. If INPLACE is .TRUE., the local random array

*          to be generated  will start in memory at the local memory lo-

*          cation A( 1, 1 ),  otherwise it will start at the local posi-

*          tion induced by IA and JA.

*

*  AFORM   (global input) CHARACTER*1

*          On entry, AFORM specifies the type of submatrix to be genera-

*          ted as follows:

*             AFORM = 'S', sub( A ) is a symmetric matrix,

*             AFORM = 'H', sub( A ) is a Hermitian matrix,

*             AFORM = 'T', sub( A ) is overwritten  with  the  transpose

*                          of what would normally be generated,

*             AFORM = 'C', sub( A ) is overwritten  with  the  conjugate

*                          transpose  of  what would normally be genera-

*                          ted.

*             AFORM = 'N', a random submatrix is generated.

*

*  DIAG    (global input) CHARACTER*1

*          On entry, DIAG specifies if the generated submatrix is diago-

*          nally dominant or not as follows:

*             DIAG = 'D' : sub( A ) is diagonally dominant,

*             DIAG = 'N' : sub( A ) is not diagonally dominant.

*

*  OFFA    (global input) INTEGER

*          On entry, OFFA  specifies  the  offdiagonal of the underlying

*          matrix A(1:DESCA(M_),1:DESCA(N_)) of interest when the subma-

*          trix is symmetric, Hermitian or diagonally dominant. OFFA = 0

*          specifies the main diagonal,  OFFA > 0  specifies a subdiago-

*          nal,  and OFFA < 0 specifies a superdiagonal (see further de-

*          tails).

*

*  M       (global input) INTEGER

*          On entry, M specifies the global number of matrix rows of the

*          submatrix sub( A ) to be generated. M must be at least zero.

*

*  N       (global input) INTEGER

*          On entry,  N specifies the global number of matrix columns of

*          the  submatrix  sub( A )  to be generated. N must be at least

*          zero.

*

*  IA      (global input) INTEGER

*          On entry, IA  specifies A's global row index, which points to

*          the beginning of the submatrix sub( A ).

*

*  JA      (global input) INTEGER

*          On entry, JA  specifies A's global column index, which points

*          to the beginning of the submatrix sub( A ).

*

*  DESCA   (global and local input) INTEGER array

*          On entry, DESCA  is an integer array of dimension DLEN_. This

*          is the array descriptor for the matrix A.

*

*  IASEED  (global input) INTEGER

*          On entry, IASEED  specifies  the  seed number to generate the

*          matrix A. IASEED must be at least zero.

*

*  A       (local output) DOUBLE PRECISION array

*          On entry, A is an array of dimension (LLD_A, Ka), where Ka is

*          at least Lc( 1, JA+N-1 ).  On  exit, this array  contains the

*          local entries of the randomly generated submatrix sub( A ).

*

*  LDA     (local input) INTEGER

*          On entry,  LDA  specifies  the local leading dimension of the

*          array A. When INPLACE is .FALSE., LDA is usually DESCA(LLD_).

*          This restriction is however not enforced, and this subroutine

*          requires only that LDA >= MAX( 1, Mp ) where

*

*          Mp = PB_NUMROC( M, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW ).

*

*          PB_NUMROC  is  a ScaLAPACK tool function; MYROW, MYCOL, NPROW

*          and NPCOL  can  be determined by calling the BLACS subroutine

*          BLACS_GRIDINFO.

*

*  Further Details

*  ===============

*

*  OFFD  is  tied  to  the matrix described by  DESCA, as opposed to the

*  piece that is currently  (re)generated.  This is a global information

*  independent from the distribution  parameters.  Below are examples of

*  the meaning of OFFD for a global 7 by 5 matrix:

*

*  ---------------------------------------------------------------------

*  OFFD   |  0 -1 -2 -3 -4         0 -1 -2 -3 -4          0 -1 -2 -3 -4

*  -------|-------------------------------------------------------------

*         |     | OFFD=-1          |   OFFD=0                 OFFD=2

*         |     V                  V

*  0      |  .  d  .  .  .      -> d  .  .  .  .          .  .  .  .  .

*  1      |  .  .  d  .  .         .  d  .  .  .          .  .  .  .  .

*  2      |  .  .  .  d  .         .  .  d  .  .       -> d  .  .  .  .

*  3      |  .  .  .  .  d         .  .  .  d  .          .  d  .  .  .

*  4      |  .  .  .  .  .         .  .  .  .  d          .  .  d  .  .

*  5      |  .  .  .  .  .         .  .  .  .  .          .  .  .  d  .

*  6      |  .  .  .  .  .         .  .  .  .  .          .  .  .  .  d

*  ---------------------------------------------------------------------

*

*  -- Written on April 1, 1998 by

*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.

*

*  =====================================================================

*

*     .. Parameters ..

      INTEGER            BLOCK_CYCLIC_2D_INB, CSRC_, CTXT_, DLEN_,

     $                   dtype_, imb_, inb_, lld_, mb_, m_, nb_, n_,

     $                   rsrc_

      parameter( block_cyclic_2d_inb = 2, dlen_ = 11,

     $                   dtype_ = 1, ctxt_ = 2, m_ = 3, n_ = 4,

     $                   imb_ = 5, inb_ = 6, mb_ = 7, nb_ = 8,

     $                   rsrc_ = 9, csrc_ = 10, lld_ = 11 )

      INTEGER            JMP_1, JMP_COL, JMP_IMBV, JMP_INBV, JMP_LEN,

     $                   jmp_mb, jmp_nb, jmp_npimbloc, jmp_npmb,

     $                   jmp_nqinbloc, jmp_nqnb, jmp_row

      parameter( jmp_1 = 1, jmp_row = 2, jmp_col = 3,

     $                   jmp_mb = 4, jmp_imbv = 5, jmp_npmb = 6,

     $                   jmp_npimbloc = 7, jmp_nb = 8, jmp_inbv = 9,

     $                   jmp_nqnb = 10, jmp_nqinbloc = 11,

     $                   jmp_len = 11 )

*     ..

*     .. Local Scalars ..

      LOGICAL            DIAGDO, SYMM, HERM, NOTRAN

      INTEGER            CSRC, I, IACOL, IAROW, ICTXT, IIA, ILOCBLK,

     $                   ilocoff, ilow, imb, imb1, imbloc, imbvir, inb,

     $                   inb1, inbloc, inbvir, info, ioffda, itmp, iupp,

     $                   ivir, jja, jlocblk, jlocoff, jvir, lcmt00,

     $                   lmbloc, lnbloc, low, maxmn, mb, mblks, mp,

     $                   mrcol, mrrow, mycdist, mycol, myrdist, myrow,

     $                   nb, nblks, npcol, nprow, nq, nvir, rsrc, upp

      DOUBLE PRECISION   ALPHA

*     ..

*     .. Local Arrays ..

      INTEGER            DESCA2( DLEN_ ), IMULADD( 4, JMP_LEN ),

     $                   iran( 2 ), jmp( jmp_len ), muladd0( 4 )

*     ..

*     .. External Subroutines ..

      EXTERNAL           blacs_gridinfo, pb_ainfog2l, pb_binfo,

     $                   pb_chkmat, pb_desctrans, pb_dlagen, pb_initjmp,

     $                   pb_initmuladd, pb_jump, pb_jumpit, pb_locinfo,

     $                   pb_setlocran, pb_setran, pdladom, pxerbla

*     ..

*     .. External Functions ..

      LOGICAL            LSAME

      EXTERNAL           lsame

*     ..

*     .. Intrinsic Functions ..

      INTRINSIC          dble, max, min

*     ..

*     .. Data Statements ..

      DATA               ( muladd0( i ), i = 1, 4 ) / 20077, 16838,

     $                   12345, 0 /

*     ..

*     .. Executable Statements ..

*

*     Convert descriptor

*

      CALL pb_desctrans( desca, desca2 )

*

*     Test the input arguments

*

      ictxt = desca2( ctxt_ )

      CALL blacs_gridinfo( ictxt, nprow, npcol, myrow, mycol )

*

*     Test the input parameters

*

      info = 0

      IF( nprow.EQ.-1 ) THEN

         info = -( 1000 + ctxt_ )

      ELSE

         symm   = lsame( aform, 'S' )

         herm   = lsame( aform, 'H' )

         notran = lsame( aform, 'N' )

         diagdo = lsame( diag, 'D' )

         IF( .NOT.( symm.OR.herm.OR.notran ) .AND.

     $       .NOT.( lsame( aform, 'T' )    ) .AND.

     $       .NOT.( lsame( aform, 'C' )    ) ) THEN

            info = -2

         ELSE IF( ( .NOT.diagdo ) .AND.

     $            ( .NOT.lsame( diag, 'N' ) ) ) THEN

            info = -3

         END IF

         CALL pb_chkmat( ictxt, m, 5, n, 6, ia, ja, desca2, 10, info )

      END IF

*

      IF( info.NE.0 ) THEN

         CALL pxerbla( ictxt, 'PDLAGEN', -info )

         RETURN

      END IF

*

*     Quick return if possible

*

      IF( ( m.LE.0 ).OR.( n.LE.0 ) )

     $   RETURN

*

*     Start the operations

*

      mb   = desca2( mb_   )

      nb   = desca2( nb_   )

      imb  = desca2( imb_  )

      inb  = desca2( inb_  )

      rsrc = desca2( rsrc_ )

      csrc = desca2( csrc_ )

*

*     Figure out local information about the distributed matrix operand

*

      CALL pb_ainfog2l( m, n, ia, ja, desca2, nprow, npcol, myrow,

     $                  mycol, imb1, inb1, mp, nq, iia, jja, iarow,

     $                  iacol, mrrow, mrcol )

*

*     Decide where the entries shall be stored in memory

*

      IF( inplace ) THEN

         iia = 1

         jja = 1

      END IF

*

*     Initialize LCMT00, MBLKS, NBLKS, IMBLOC, INBLOC, LMBLOC, LNBLOC,

*     ILOW, LOW, IUPP, and UPP.

*

      ioffda = ja + offa - ia

      CALL pb_binfo( ioffda, mp, nq, imb1, inb1, mb, nb, mrrow,

     $               mrcol, lcmt00, mblks, nblks, imbloc, inbloc,

     $               lmbloc, lnbloc, ilow, low, iupp, upp )

*

*     Initialize ILOCBLK, ILOCOFF, MYRDIST, JLOCBLK, JLOCOFF, MYCDIST

*     These values correspond to the square virtual underlying matrix

*     of size MAX( M_ + MAX( 0, -OFFA ), N_ + MAX( 0, OFFA ) ) used

*     to set up the random sequence. For practical purposes, the size

*     of this virtual matrix is upper bounded by M_ + N_ - 1.

*

      itmp   = max( 0, -offa )

      ivir   = ia  + itmp

      imbvir = imb + itmp

      nvir   = desca2( m_ ) + itmp

*

      CALL pb_locinfo( ivir, imbvir, mb, myrow, rsrc, nprow, ilocblk,

     $                 ilocoff, myrdist )

*

      itmp   = max( 0, offa )

      jvir   = ja  + itmp

      inbvir = inb + itmp

      nvir   = max( max( nvir, desca2( n_ ) + itmp ),

     $              desca2( m_ ) + desca2( n_ ) - 1 )

*

      CALL pb_locinfo( jvir, inbvir, nb, mycol, csrc, npcol, jlocblk,

     $                 jlocoff, mycdist )

*

      IF( symm .OR. herm .OR. notran ) THEN

*

         CALL pb_initjmp( .true., nvir, imbvir, inbvir, imbloc, inbloc,

     $                    mb, nb, rsrc, csrc, nprow, npcol, 1, jmp )

*

*        Compute constants to jump JMP( * ) numbers in the sequence

*

         CALL pb_initmuladd( muladd0, jmp, imuladd )

*

*        Compute and set the random value corresponding to A( IA, JA )

*

         CALL pb_setlocran( iaseed, ilocblk, jlocblk, ilocoff, jlocoff,

     $                      myrdist, mycdist, nprow, npcol, jmp,

     $                      imuladd, iran )

*

         CALL pb_dlagen( 'Lower', aform, a( iia, jja ), lda, lcmt00,

     $                   iran, mblks, imbloc, mb, lmbloc, nblks, inbloc,

     $                   nb, lnbloc, jmp, imuladd )

*

      END IF

*

      IF( symm .OR. herm .OR. ( .NOT. notran ) ) THEN

*

         CALL pb_initjmp( .false., nvir, imbvir, inbvir, imbloc, inbloc,

     $                    mb, nb, rsrc, csrc, nprow, npcol, 1, jmp )

*

*        Compute constants to jump JMP( * ) numbers in the sequence

*

         CALL pb_initmuladd( muladd0, jmp, imuladd )

*

*        Compute and set the random value corresponding to A( IA, JA )

*

         CALL pb_setlocran( iaseed, ilocblk, jlocblk, ilocoff, jlocoff,

     $                      myrdist, mycdist, nprow, npcol, jmp,

     $                      imuladd, iran )

*

         CALL pb_dlagen( 'Upper', aform, a( iia, jja ), lda, lcmt00,

     $                   iran, mblks, imbloc, mb, lmbloc, nblks, inbloc,

     $                   nb, lnbloc, jmp, imuladd )

*

      END IF

*

      IF( diagdo ) THEN

*

         maxmn = max( desca2( m_ ), desca2( n_ ) )

         alpha = dble( maxmn )

*

         IF( ioffda.GE.0 ) THEN

            CALL pdladom( inplace, min( max( 0, m-ioffda ), n ), alpha,

     $                    a, min( ia+ioffda, ia+m-1 ), ja, desca )

         ELSE

            CALL pdladom( inplace, min( m, max( 0, n+ioffda ) ), alpha,

     $                    a, ia, min( ja-ioffda, ja+n-1 ), desca )

         END IF

*

      END IF

*

      RETURN

*

*     End of PDLAGEN

*


      END


      SUBROUTINE pdladom( INPLACE, N, ALPHA, A, IA, JA, DESCA )

*

*  -- PBLAS test routine (version 2.0) --

*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,

*     and University of California, Berkeley.

*     April 1, 1998

*

*     .. Scalar Arguments ..

      LOGICAL            INPLACE

      INTEGER            IA, JA, N

      DOUBLE PRECISION   ALPHA

*     ..

*     .. Array Arguments ..

      INTEGER            DESCA( * )

      DOUBLE PRECISION   A( * )

*     ..

*

*  Purpose

*  =======

*

*  PDLADOM  updates the diagonal entries  of  an  n by n submatrix

*  sub( A ) denoting A( IA:IA+N-1, JA:JA+N-1 ):  each diagonal entry  a

*  that is visited in the local array A is overwritten with

*  ABS( a ) + ALPHA  (the absolute value is taken before alpha is

*  added, so this is not a plain "a + alpha" update).

*

*  Notes

*  =====

*

*  A description  vector  is associated with each 2D block-cyclicly dis-

*  tributed matrix.  This  vector  stores  the  information  required to

*  establish the  mapping  between a  matrix entry and its corresponding

*  process and memory location.

*

*  In  the  following  comments,   the character _  should  be  read  as

*  "of  the  distributed  matrix".  Let  A  be a generic term for any 2D

*  block cyclicly distributed matrix.  Its description vector is DESCA:

*

*  NOTATION         STORED IN       EXPLANATION

*  ---------------- --------------- ------------------------------------

*  DTYPE_A (global) DESCA( DTYPE_ ) The descriptor type.

*  CTXT_A  (global) DESCA( CTXT_  ) The BLACS context handle, indicating

*                                   the NPROW x NPCOL BLACS process grid

*                                   A  is distributed over.  The context

*                                   itself  is  global,  but  the handle

*                                   (the integer value) may vary.

*  M_A     (global) DESCA( M_     ) The  number of rows in the distribu-

*                                   ted matrix A, M_A >= 0.

*  N_A     (global) DESCA( N_     ) The number of columns in the distri-

*                                   buted matrix A, N_A >= 0.

*  IMB_A   (global) DESCA( IMB_   ) The number of rows of the upper left

*                                   block of the matrix A, IMB_A > 0.

*  INB_A   (global) DESCA( INB_   ) The  number  of columns of the upper

*                                   left   block   of   the   matrix  A,

*                                   INB_A > 0.

*  MB_A    (global) DESCA( MB_    ) The blocking factor used to  distri-

*                                   bute the last  M_A-IMB_A rows of  A,

*                                   MB_A > 0.

*  NB_A    (global) DESCA( NB_    ) The blocking factor used to  distri-

*                                   bute the last  N_A-INB_A  columns of

*                                   A, NB_A > 0.

*  RSRC_A  (global) DESCA( RSRC_  ) The process row over which the first

*                                   row of the matrix  A is distributed,

*                                   NPROW > RSRC_A >= 0.

*  CSRC_A  (global) DESCA( CSRC_  ) The  process  column  over which the

*                                   first  column of  A  is distributed.

*                                   NPCOL > CSRC_A >= 0.

*  LLD_A   (local)  DESCA( LLD_   ) The  leading  dimension of the local

*                                   array  storing  the  local blocks of

*                                   the distributed matrix A,

*                                   IF( Lc( 1, N_A ) > 0 )

*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )

*                                   ELSE

*                                      LLD_A >= 1.

*

*  Let K be the number of  rows of a matrix A starting at the global in-

*  dex IA,i.e, A( IA:IA+K-1, : ). Lr( IA, K ) denotes the number of rows

*  that the process of row coordinate MYROW ( 0 <= MYROW < NPROW ) would

*  receive if these K rows were distributed over NPROW processes.  If  K

*  is the number of columns of a matrix  A  starting at the global index

*  JA, i.e, A( :, JA:JA+K-1 ),  Lc( JA, K )  denotes the number  of  co-

*  lumns that the process MYCOL ( 0 <= MYCOL < NPCOL ) would  receive if

*  these K columns were distributed over NPCOL processes.

*

*  The values of Lr() and Lc() may be determined via a call to the func-

*  tion PB_NUMROC:

*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )

*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )

*

*  Arguments

*  =========

*

*  INPLACE (global input) LOGICAL

*          On entry, INPLACE specifies where the local part of  sub( A )

*          starts in the local array A.  If  INPLACE  is .TRUE., the lo-

*          cal row and column start indexes are both reset to  1,  i.e.

*          the local part is taken to start at the  local  memory  loca-

*          tion A( 1, 1 ),  otherwise it starts at the  local  position

*          induced by IA and JA.

*

*  N       (global input) INTEGER

*          On entry,  N  specifies  the  global  order  of the submatrix

*          sub( A ) to be modified. N must be at least zero.  The routine

*          returns immediately when N is exactly zero.

*

*  ALPHA   (global input) DOUBLE PRECISION

*          On entry, ALPHA specifies the scalar alpha.

*

*  A       (local input/local output) DOUBLE PRECISION array

*          On entry, A is an array of dimension (LLD_A, Ka), where Ka is

*          at least Lc( 1, JA+N-1 ).  Before  entry, this array contains

*          the local entries of the matrix A. On exit, the local entries

*          of this array corresponding to the main diagonal of  sub( A )

*          have been updated.

*

*  IA      (global input) INTEGER

*          On entry, IA  specifies A's global row index, which points to

*          the beginning of the submatrix sub( A ).

*

*  JA      (global input) INTEGER

*          On entry, JA  specifies A's global column index, which points

*          to the beginning of the submatrix sub( A ).

*

*  DESCA   (global and local input) INTEGER array

*          On entry, DESCA  is an integer array of dimension DLEN_. This

*          is the array descriptor for the matrix A.

*

*  -- Written on April 1, 1998 by

*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.

*

*  =====================================================================

*

*     .. Parameters ..

      INTEGER            BLOCK_CYCLIC_2D_INB, CSRC_, CTXT_, DLEN_,

     $                   dtype_, imb_, inb_, lld_, mb_, m_, nb_, n_,

     $                   rsrc_

      parameter( block_cyclic_2d_inb = 2, dlen_ = 11,

     $                   dtype_ = 1, ctxt_ = 2, m_ = 3, n_ = 4,

     $                   imb_ = 5, inb_ = 6, mb_ = 7, nb_ = 8,

     $                   rsrc_ = 9, csrc_ = 10, lld_ = 11 )

*     ..

*     .. Local Scalars ..

      LOGICAL            GODOWN, GOLEFT

      INTEGER            I, IACOL, IAROW, ICTXT, IIA, IJOFFA, ILOW,

     $                   imb1, imbloc, inb1, inbloc, ioffa, ioffd, iupp,

     $                   jja, joffa, joffd, lcmt, lcmt00, lda, ldap1,

     $                   lmbloc, lnbloc, low, mb, mblkd, mblks, mbloc,

     $                   mrcol, mrrow, mycol, myrow, nb, nblkd, nblks,

     $                   nbloc, np, npcol, nprow, nq, pmb, qnb, upp

      DOUBLE PRECISION   ATMP

*     ..

*     .. Local Arrays ..

      INTEGER            DESCA2( DLEN_ )

*     ..

*     .. External Subroutines ..

      EXTERNAL           blacs_gridinfo, pb_ainfog2l, pb_binfo,

     $                   pb_desctrans

*     ..

*     .. Intrinsic Functions ..

      INTRINSIC          abs, max, min

*     ..

*     .. Executable Statements ..

*

*     Convert descriptor

*

      CALL pb_desctrans( desca, desca2 )

*

*     Get grid parameters

*

      ictxt = desca2( ctxt_ )

      CALL blacs_gridinfo( ictxt, nprow, npcol, myrow, mycol )

*

*     Quick return if possible

*

      IF( n.EQ.0 )

     $   RETURN

*

*     Figure out local information about the distributed matrix operand

*

      CALL pb_ainfog2l( n, n, ia, ja, desca2, nprow, npcol, myrow,

     $                  mycol, imb1, inb1, np, nq, iia, jja, iarow,

     $                  iacol, mrrow, mrcol )

*

*     Decide where the entries shall be stored in memory

*

      IF( inplace ) THEN

         iia = 1

         jja = 1

      END IF

*

*     Initialize LCMT00, MBLKS, NBLKS, IMBLOC, INBLOC, LMBLOC, LNBLOC,

*     ILOW, LOW, IUPP, and UPP.

*

      mb = desca2( mb_ )

      nb = desca2( nb_ )

*

      CALL pb_binfo( 0, np, nq, imb1, inb1, mb, nb, mrrow, mrcol,

     $               lcmt00, mblks, nblks, imbloc, inbloc, lmbloc,

     $               lnbloc, ilow, low, iupp, upp )

*

*     IOFFA and JOFFA are the zero-based local row and column offsets

*     of the current block. A is addressed below as a one-dimensional

*     array with column stride LDA, so that stepping the linear index

*     by LDAP1 = LDA + 1 moves one entry down and one entry right, i.e.

*     along a diagonal.

*

      ioffa  = iia - 1

      joffa  = jja - 1

      lda    = desca2( lld_ )

      ldap1  = lda + 1

*

*     PMB (resp. QNB) is the amount by which LCMT00 is shifted when

*     moving to the next local block of rows (resp. columns): MB (resp.

*     NB) when the source coordinate in the descriptor is negative,

*     NPROW*MB (resp. NPCOL*NB) otherwise.

*

      IF( desca2( rsrc_ ).LT.0 ) THEN

         pmb = mb

      ELSE

         pmb = nprow * mb

      END IF

      IF( desca2( csrc_ ).LT.0 ) THEN

         qnb = nb

      ELSE

         qnb = npcol * nb

      END IF

*

*     Handle the first block of rows or columns separately, and update

*     LCMT00, MBLKS and NBLKS.

*

      godown = ( lcmt00.GT.iupp )

      goleft = ( lcmt00.LT.ilow )

*

      IF( .NOT.godown .AND. .NOT.goleft ) THEN

*

*        LCMT00 >= ILOW && LCMT00 <= IUPP

*

*        The first local block holds diagonal entries. For LCMT00 >= 0

*        the entry updated at step I is the local entry

*        ( IOFFA+LCMT00+I, JOFFA+I ), otherwise it is the local entry

*        ( IOFFA+I, JOFFA-LCMT00+I ).

*

         IF( lcmt00.GE.0 ) THEN

            ijoffa = ioffa+lcmt00 + ( joffa - 1 ) * lda

            DO 10 i = 1, min( inbloc, max( 0, imbloc - lcmt00 ) )

               atmp = a( ijoffa + i*ldap1 )

               a( ijoffa + i*ldap1 ) = abs( atmp ) + alpha

   10       CONTINUE

         ELSE

            ijoffa = ioffa + ( joffa - lcmt00 - 1 ) * lda

            DO 20 i = 1, min( imbloc, max( 0, inbloc + lcmt00 ) )

               atmp = a( ijoffa + i*ldap1 )

               a( ijoffa + i*ldap1 ) = abs( atmp ) + alpha

   20       CONTINUE

         END IF

         goleft = ( ( lcmt00 - ( iupp - upp + pmb ) ).LT.ilow )

         godown = .NOT.goleft

*

      END IF

*

      IF( godown ) THEN

*

*        Leave the first local block of rows (IMBLOC rows)

*

         lcmt00 = lcmt00 - ( iupp - upp + pmb )

         mblks  = mblks - 1

         ioffa  = ioffa + imbloc

*

*        Move down over full blocks of rows while LCMT00 > UPP

*

   30    CONTINUE

         IF( mblks.GT.0 .AND. lcmt00.GT.upp ) THEN

            lcmt00 = lcmt00 - pmb

            mblks  = mblks - 1

            ioffa  = ioffa + mb

            GO TO 30

         END IF

*

         lcmt  = lcmt00

         mblkd = mblks

         ioffd = ioffa

*

*        Walk down the first local block of columns (INBLOC columns),

*        updating the diagonal entries of each block of rows for which

*        LCMT >= ILOW. The last block of rows has LMBLOC rows.

*

         mbloc = mb

   40    CONTINUE

         IF( mblkd.GT.0 .AND. lcmt.GE.ilow ) THEN

            IF( mblkd.EQ.1 )

     $         mbloc = lmbloc

            IF( lcmt.GE.0 ) THEN

               ijoffa = ioffd + lcmt + ( joffa - 1 ) * lda

               DO 50 i = 1, min( inbloc, max( 0, mbloc - lcmt ) )

                  atmp = a( ijoffa + i*ldap1 )

                  a( ijoffa + i*ldap1 ) = abs( atmp ) + alpha

   50          CONTINUE

            ELSE

               ijoffa = ioffd + ( joffa - lcmt - 1 ) * lda

               DO 60 i = 1, min( mbloc, max( 0, inbloc + lcmt ) )

                  atmp = a( ijoffa + i*ldap1 )

                  a( ijoffa + i*ldap1 ) = abs( atmp ) + alpha

   60          CONTINUE

            END IF

            lcmt00 = lcmt

            lcmt   = lcmt - pmb

            mblks  = mblkd

            mblkd  = mblkd - 1

            ioffa  = ioffd

            ioffd  = ioffd + mbloc

            GO TO 40

         END IF

*

*        Leave the first local block of columns

*

         lcmt00 = lcmt00 + low - ilow + qnb

         nblks  = nblks - 1

         joffa  = joffa + inbloc

*

      ELSE IF( goleft ) THEN

*

*        Leave the first local block of columns (INBLOC columns)

*

         lcmt00 = lcmt00 + low - ilow + qnb

         nblks  = nblks - 1

         joffa  = joffa + inbloc

*

*        Move right over full blocks of columns while LCMT00 < LOW

*

   70    CONTINUE

         IF( nblks.GT.0 .AND. lcmt00.LT.low ) THEN

            lcmt00 = lcmt00 + qnb

            nblks  = nblks - 1

            joffa  = joffa + nb

            GO TO 70

         END IF

*

         lcmt  = lcmt00

         nblkd = nblks

         joffd = joffa

*

*        Walk right along the first local block of rows (IMBLOC rows),

*        updating the diagonal entries of each block of columns for

*        which LCMT <= IUPP. The last block of columns has LNBLOC

*        columns.

*

         nbloc = nb

   80    CONTINUE

         IF( nblkd.GT.0 .AND. lcmt.LE.iupp ) THEN

            IF( nblkd.EQ.1 )

     $         nbloc = lnbloc

            IF( lcmt.GE.0 ) THEN

               ijoffa = ioffa + lcmt + ( joffd - 1 ) * lda

               DO 90 i = 1, min( nbloc, max( 0, imbloc - lcmt ) )

                  atmp = a( ijoffa + i*ldap1 )

                  a( ijoffa + i*ldap1 ) = abs( atmp ) + alpha

   90          CONTINUE

            ELSE

               ijoffa = ioffa + ( joffd - lcmt - 1 ) * lda

               DO 100 i = 1, min( imbloc, max( 0, nbloc + lcmt ) )

                  atmp = a( ijoffa + i*ldap1 )

                  a( ijoffa + i*ldap1 ) = abs( atmp ) + alpha

  100          CONTINUE

            END IF

            lcmt00 = lcmt

            lcmt   = lcmt + qnb

            nblks  = nblkd

            nblkd  = nblkd - 1

            joffa  = joffd

            joffd  = joffd + nbloc

            GO TO 80

         END IF

*

*        Leave the first local block of rows

*

         lcmt00 = lcmt00 - ( iupp - upp + pmb )

         mblks  = mblks - 1

         ioffa  = ioffa + imbloc

*

      END IF

*

*     Loop over the remaining local blocks of columns. For each one,

*     first move down while LCMT00 > UPP, then update the diagonal

*     entries of every block of rows for which LCMT >= LOW.

*

      nbloc = nb

  110 CONTINUE

      IF( nblks.GT.0 ) THEN

         IF( nblks.EQ.1 )

     $      nbloc = lnbloc

  120    CONTINUE

         IF( mblks.GT.0 .AND. lcmt00.GT.upp ) THEN

            lcmt00 = lcmt00 - pmb

            mblks  = mblks - 1

            ioffa  = ioffa + mb

            GO TO 120

         END IF

*

         lcmt  = lcmt00

         mblkd = mblks

         ioffd = ioffa

*

         mbloc = mb

  130    CONTINUE

         IF( mblkd.GT.0 .AND. lcmt.GE.low ) THEN

            IF( mblkd.EQ.1 )

     $         mbloc = lmbloc

            IF( lcmt.GE.0 ) THEN

               ijoffa = ioffd + lcmt + ( joffa - 1 ) * lda

               DO 140 i = 1, min( nbloc, max( 0, mbloc - lcmt ) )

                  atmp = a( ijoffa + i*ldap1 )

                  a( ijoffa + i*ldap1 ) = abs( atmp ) + alpha

  140          CONTINUE

            ELSE

               ijoffa = ioffd + ( joffa - lcmt - 1 ) * lda

               DO 150 i = 1, min( mbloc, max( 0, nbloc + lcmt ) )

                  atmp = a( ijoffa + i*ldap1 )

                  a( ijoffa + i*ldap1 ) = abs( atmp ) + alpha

  150          CONTINUE

            END IF

            lcmt00 = lcmt

            lcmt   = lcmt - pmb

            mblks  = mblkd

            mblkd  = mblkd - 1

            ioffa  = ioffd

            ioffd  = ioffd + mbloc

            GO TO 130

         END IF

*

*        Move on to the next local block of columns

*

         lcmt00 = lcmt00 + qnb

         nblks  = nblks - 1

         joffa  = joffa + nbloc

         GO TO 110

*

      END IF

*

      RETURN

*

*     End of PDLADOM

*


      END


      SUBROUTINE pb_dlascal( UPLO, M, N, IOFFD, ALPHA, A, LDA )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      CHARACTER*1        UPLO
      INTEGER            IOFFD, LDA, M, N
      DOUBLE PRECISION   ALPHA
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * )
*     ..
*
*  Purpose
*  =======
*
*  PB_DLASCAL multiplies, in place, a selected part of the m by n array
*  A by the scalar alpha.  The part is chosen by UPLO relative  to  the
*  diagonal identified by IOFFD:  the lower trapezoid,  the upper  tra-
*  pezoid, the diagonal alone, or the whole array.
*
*  Arguments
*  =========
*
*  UPLO    (input) CHARACTER*1
*          Selects the part of A that is scaled:
*             = 'L' or 'l':  entries on and below the diagonal IOFFD,
*             = 'U' or 'u':  entries on and above the diagonal IOFFD,
*             = 'D' or 'd':  only the entries of the diagonal IOFFD,
*             any other value:  every entry of A.
*
*  M       (input) INTEGER
*          Number of rows of A.  Nothing is done when M <= 0.
*
*  N       (input) INTEGER
*          Number of columns of A.  Nothing is done when N <= 0.
*
*  IOFFD   (input) INTEGER
*          Identifies the diagonal separating the lower and upper  tra-
*          pezoids (see the notes below):
*
*             IOFFD = 0  main diagonal   A( i, i ),
*                        i = 1 ... MIN( M, N ),
*             IOFFD > 0  subdiagonal     A( i+IOFFD, i ),
*                        i = 1 ... MIN( M-IOFFD, N ),
*             IOFFD < 0  superdiagonal   A( i, i-IOFFD ),
*                        i = 1 ... MIN( M, N+IOFFD ).
*
*  ALPHA   (input) DOUBLE PRECISION
*          The scaling factor.
*
*  A       (input/output) DOUBLE PRECISION array
*          Array of dimension (LDA,N).  Only the entries of the leading
*          m by n part selected by  UPLO  and  IOFFD are read and over-
*          written with alpha times their value;  the remaining entries
*          are not referenced.
*
*  LDA     (input) INTEGER
*          Leading dimension of A.  LDA must be at least max( 1, M ).
*
*  Notes
*  =====
*                           N                                    N
*             ----------------------------                  -----------
*            |       d                    |                |           |
*          M |         d        'U'       |                |      'U'  |
*            |  'L'     'D'               |                |d          |
*            |             d              |              M |  d        |
*             ----------------------------                 |   'D'     |
*                                                          |      d    |
*              IOFFD < 0                                   | 'L'    d  |
*                                                          |          d|
*                  N                                       |           |
*             -----------                                   -----------
*            |    d   'U'|
*            |      d    |                                   IOFFD > 0
*          M |       'D' |
*            |          d|                              N
*            |  'L'      |                 ----------------------------
*            |           |                |          'U'               |
*            |           |                |d                           |
*            |           |                | 'D'                        |
*            |           |                |    d                       |
*            |           |                |'L'   d                     |
*             -----------                  ----------------------------
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            IDIAG, JCOL, JFULL, JLAST
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           LSAME
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX, MIN
*     ..
*     .. Executable Statements ..
*
*     Nothing to scale for an empty array
*
      IF( MIN( M, N ).LE.0 )
     $   RETURN
*
      IF( LSAME( UPLO, 'L' ) ) THEN
*
*        Lower trapezoid.  The first JFULL columns lie entirely below
*        the diagonal and are scaled in full; in the following columns
*        only the rows from the diagonal entry downwards are scaled.
*
         JFULL = MAX( 0, -IOFFD )
         DO JCOL = 1, MIN( JFULL, N )
            A( 1:M, JCOL ) = ALPHA * A( 1:M, JCOL )
         END DO
         DO JCOL = JFULL + 1, MIN( M - IOFFD, N )
            A( JCOL+IOFFD:M, JCOL ) = ALPHA * A( JCOL+IOFFD:M, JCOL )
         END DO
*
      ELSE IF( LSAME( UPLO, 'U' ) ) THEN
*
*        Upper trapezoid.  Columns crossed by the diagonal are scaled
*        from the first row down to the diagonal entry; the columns to
*        the right of the last diagonal entry are scaled in full.
*
         JLAST = MIN( M - IOFFD, N )
         DO JCOL = MAX( 0, -IOFFD ) + 1, JLAST
            A( 1:JCOL+IOFFD, JCOL ) = ALPHA * A( 1:JCOL+IOFFD, JCOL )
         END DO
         DO JCOL = MAX( 0, JLAST ) + 1, N
            A( 1:M, JCOL ) = ALPHA * A( 1:M, JCOL )
         END DO
*
      ELSE IF( LSAME( UPLO, 'D' ) ) THEN
*
*        Diagonal only: one entry per column crossed by the diagonal.
*
         DO JCOL = MAX( 0, -IOFFD ) + 1, MIN( M - IOFFD, N )
            IDIAG = JCOL + IOFFD
            A( IDIAG, JCOL ) = ALPHA * A( IDIAG, JCOL )
         END DO
*
      ELSE
*
*        Any other UPLO: scale the whole m by n array.
*
         A( 1:M, 1:N ) = ALPHA * A( 1:M, 1:N )
*
      END IF
*
      RETURN
*
*     End of PB_DLASCAL
*
      END


      SUBROUTINE pb_dlagen( UPLO, AFORM, A, LDA, LCMT00, IRAN, MBLKS,

     $                      IMBLOC, MB, LMBLOC, NBLKS, INBLOC, NB,

     $                      LNBLOC, JMP, IMULADD )

*

*  -- PBLAS test routine (version 2.0) --

*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,

*     and University of California, Berkeley.

*     April 1, 1998

*

*     .. Scalar Arguments ..

      CHARACTER*1        UPLO, AFORM

      INTEGER            IMBLOC, INBLOC, LCMT00, LDA, LMBLOC, LNBLOC,

     $                   MB, MBLKS, NB, NBLKS

*     ..

*     .. Array Arguments ..

      INTEGER            IMULADD( 4, * ), IRAN( * ), JMP( * )

      DOUBLE PRECISION   A( LDA, * )

*     ..

*

*  Purpose

*  =======

*

*  PB_DLAGEN locally initializes an array A.

*

*  Arguments

*  =========

*

*  UPLO    (global input) CHARACTER*1

*          On entry, UPLO  specifies whether the lower (UPLO='L') trape-

*          zoidal part or the upper (UPLO='U') trapezoidal part is to be

*          generated  when  the  matrix  to be generated is symmetric or

*          Hermitian. For  all  the  other values of AFORM, the value of

*          this input argument is ignored.

*

*  AFORM   (global input) CHARACTER*1

*          On entry, AFORM specifies the type of submatrix to be genera-

*          ted as follows:

*             AFORM = 'S', sub( A ) is a symmetric matrix,

*             AFORM = 'H', sub( A ) is a Hermitian matrix,

*             AFORM = 'T', sub( A ) is  overwritten  with  the transpose

*                          of what would normally be generated,

*             AFORM = 'C', sub( A ) is overwritten  with  the  conjugate

*                          transpose  of  what would normally be genera-

*                          ted.

*             AFORM = 'N', a random submatrix is generated.

*

*  A       (local output) DOUBLE PRECISION array

*          On entry,  A  is  an array of dimension (LLD_A, *).  On exit,

*          this array contains the local entries of the randomly genera-

*          ted submatrix sub( A ).

*

*  LDA     (local input) INTEGER

*          On entry,  LDA  specifies  the local leading dimension of the

*          array A. LDA must be at least one.

*

*  LCMT00  (global input) INTEGER

*          On entry, LCMT00 is the LCM value specifying the off-diagonal

*          of the underlying matrix of interest. LCMT00=0 specifies  the

*          main diagonal, LCMT00 > 0 specifies a subdiagonal, LCMT00 < 0

*          specifies superdiagonals.

*

*  IRAN    (local input) INTEGER array

*          On entry, IRAN  is an array of dimension 2 containing respec-

*          tively the 16-lower and 16-higher bits of the encoding of the

*          entry of  the  random  sequence  corresponding locally to the

*          first local array entry to generate. Usually,  this  array is

*          computed by PB_SETLOCRAN.

*

*  MBLKS   (local input) INTEGER

*          On entry, MBLKS specifies the local number of blocks of rows.

*          MBLKS is at least zero.

*

*  IMBLOC  (local input) INTEGER

*          On entry, IMBLOC specifies  the  number of rows (size) of the

*          local uppest  blocks. IMBLOC is at least zero.

*

*  MB      (global input) INTEGER

*          On entry, MB  specifies the blocking factor used to partition

*          the rows of the matrix.  MB  must be at least one.

*

*  LMBLOC  (local input) INTEGER

*          On entry, LMBLOC specifies the number of  rows  (size) of the

*          local lowest blocks. LMBLOC is at least zero.

*

*  NBLKS   (local input) INTEGER

*          On entry,  NBLKS  specifies the local number of blocks of co-

*          lumns. NBLKS is at least zero.

*

*  INBLOC  (local input) INTEGER

*          On entry,  INBLOC  specifies the number of columns (size)  of

*          the local leftmost blocks. INBLOC is at least zero.

*

*  NB      (global input) INTEGER

*          On entry, NB  specifies the blocking factor used to partition

*          the columns of the matrix.  NB  must be at least one.

*

*  LNBLOC  (local input) INTEGER

*          On entry,  LNBLOC  specifies  the number of columns (size) of

*          the local rightmost blocks. LNBLOC is at least zero.

*

*  JMP     (local input) INTEGER array

*          On entry, JMP is an array of dimension JMP_LEN containing the

*          different jump values used by the random matrix generator.

*

*  IMULADD (local input) INTEGER array

*          On entry, IMULADD is an array of dimension (4, JMP_LEN).  The

*          jth  column  of this array contains the encoded initial cons-

*          tants a_j and c_j to  jump  from X( n ) to  X( n + JMP( j ) )

*          (= a_j * X( n ) + c_j) in the random sequence. IMULADD(1:2,j)

*          contains respectively the 16-lower and 16-higher bits of  the

*          constant a_j, and IMULADD(3:4,j)  contains  the 16-lower  and

*          16-higher bits of the constant c_j.

*

*  -- Written on April 1, 1998 by

*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.

*

*  =====================================================================

*

*     .. Parameters ..

      INTEGER            JMP_1, JMP_COL, JMP_IMBV, JMP_INBV, JMP_LEN,

     $                   JMP_MB, JMP_NB, JMP_NPIMBLOC, JMP_NPMB,

     $                   JMP_NQINBLOC, JMP_NQNB, JMP_ROW

      parameter( jmp_1 = 1, jmp_row = 2, jmp_col = 3,

     $                   jmp_mb = 4, jmp_imbv = 5, jmp_npmb = 6,

     $                   jmp_npimbloc = 7, jmp_nb = 8, jmp_inbv = 9,

     $                   jmp_nqnb = 10, jmp_nqinbloc = 11,

     $                   jmp_len = 11 )

*     ..

*     .. Local Scalars ..

      INTEGER            I, IB, IBLK, II, IK, ITMP, JB, JBLK, JJ, JK,

     $                   JTMP, LCMTC, LCMTR, LOW, MNB, UPP

      DOUBLE PRECISION   DUMMY

*     ..

*     .. Local Arrays ..

      INTEGER            IB0( 2 ), IB1( 2 ), IB2( 2 ), IB3( 2 )

*     ..

*     .. External Subroutines ..

      EXTERNAL           pb_jumpit

*     ..

*     .. External Functions ..

      LOGICAL            LSAME

      DOUBLE PRECISION   PB_DRAND

      EXTERNAL           LSAME, PB_DRAND

*     ..

*     .. Intrinsic Functions ..

      INTRINSIC          max, min

*     ..

*     .. Executable Statements ..

*

      DO 10 i = 1, 2

         ib1( i ) = iran( i )

         ib2( i ) = iran( i )

         ib3( i ) = iran( i )

   10 CONTINUE

*

      IF( lsame( aform, 'N' ) ) THEN

*

*        Generate random matrix

*

         jj = 1

*

         DO 50 jblk = 1, nblks

*

            IF( jblk.EQ.1 ) THEN

               jb = inbloc

            ELSE IF( jblk.EQ.nblks ) THEN

               jb = lnbloc

            ELSE

               jb = nb

            END IF

*

            DO 40 jk = jj, jj + jb - 1

*

               ii = 1

*

               DO 30 iblk = 1, mblks

*

                  IF( iblk.EQ.1 ) THEN

                     ib = imbloc

                  ELSE IF( iblk.EQ.mblks ) THEN

                     ib = lmbloc

                  ELSE

                     ib = mb

                  END IF

*

*                 Blocks are IB by JB

*

                  DO 20 ik = ii, ii + ib - 1

                     a( ik, jk ) = pb_drand( 0 )

   20             CONTINUE

*

                  ii = ii + ib

*

                  IF( iblk.EQ.1 ) THEN

*

*                    Jump IMBLOC + ( NPROW - 1 ) * MB rows

*

                     CALL pb_jumpit( imuladd( 1, jmp_npimbloc ), ib1,

     $                               ib0 )

*

                  ELSE

*

*                    Jump NPROW * MB rows

*

                     CALL pb_jumpit( imuladd( 1, jmp_npmb ), ib1, ib0 )

*

                  END IF

*

                  ib1( 1 ) = ib0( 1 )

                  ib1( 2 ) = ib0( 2 )

*

   30          CONTINUE

*

*              Jump one column

*

               CALL pb_jumpit( imuladd( 1, jmp_col ), ib2, ib0 )

*

               ib1( 1 ) = ib0( 1 )

               ib1( 2 ) = ib0( 2 )

               ib2( 1 ) = ib0( 1 )

               ib2( 2 ) = ib0( 2 )

*

   40       CONTINUE

*

            jj = jj + jb

*

            IF( jblk.EQ.1 ) THEN

*

*              Jump INBLOC + ( NPCOL - 1 ) * NB columns

*

               CALL pb_jumpit( imuladd( 1, jmp_nqinbloc ), ib3, ib0 )

*

            ELSE

*

*              Jump NPCOL * NB columns

*

               CALL pb_jumpit( imuladd( 1, jmp_nqnb ), ib3, ib0 )

*

            END IF

*

            ib1( 1 ) = ib0( 1 )

            ib1( 2 ) = ib0( 2 )

            ib2( 1 ) = ib0( 1 )

            ib2( 2 ) = ib0( 2 )

            ib3( 1 ) = ib0( 1 )

            ib3( 2 ) = ib0( 2 )

*

   50    CONTINUE

*

      ELSE IF( lsame( aform, 'T' ) .OR. lsame( aform, 'C' ) ) THEN

*

*        Generate the transpose of the matrix that would be normally

*        generated.

*

         ii = 1

*

         DO 90 iblk = 1, mblks

*

            IF( iblk.EQ.1 ) THEN

               ib = imbloc

            ELSE IF( iblk.EQ.mblks ) THEN

               ib = lmbloc

            ELSE

               ib = mb

            END IF

*

            DO 80 ik = ii, ii + ib - 1

*

               jj = 1

*

               DO 70 jblk = 1, nblks

*

                  IF( jblk.EQ.1 ) THEN

                     jb = inbloc

                  ELSE IF( jblk.EQ.nblks ) THEN

                     jb = lnbloc

                  ELSE

                     jb = nb

                  END IF

*

*                 Blocks are IB by JB

*

                  DO 60 jk = jj, jj + jb - 1

                     a( ik, jk ) = pb_drand( 0 )

   60             CONTINUE

*

                  jj = jj + jb

*

                  IF( jblk.EQ.1 ) THEN

*

*                    Jump INBLOC + ( NPCOL - 1 ) * NB columns

*

                     CALL pb_jumpit( imuladd( 1, jmp_nqinbloc ), ib1,

     $                               ib0 )

*

                  ELSE

*

*                    Jump NPCOL * NB columns

*

                     CALL pb_jumpit( imuladd( 1, jmp_nqnb ), ib1, ib0 )

*

                  END IF

*

                  ib1( 1 ) = ib0( 1 )

                  ib1( 2 ) = ib0( 2 )

*

   70          CONTINUE

*

*              Jump one row

*

               CALL pb_jumpit( imuladd( 1, jmp_row ), ib2, ib0 )

*

               ib1( 1 ) = ib0( 1 )

               ib1( 2 ) = ib0( 2 )

               ib2( 1 ) = ib0( 1 )

               ib2( 2 ) = ib0( 2 )

*

   80       CONTINUE

*

            ii = ii + ib

*

            IF( iblk.EQ.1 ) THEN

*

*              Jump IMBLOC + ( NPROW - 1 ) * MB rows

*

               CALL pb_jumpit( imuladd( 1, jmp_npimbloc ), ib3, ib0 )

*

            ELSE

*

*              Jump NPROW * MB rows

*

               CALL pb_jumpit( imuladd( 1, jmp_npmb ), ib3, ib0 )

*

            END IF

*

            ib1( 1 ) = ib0( 1 )

            ib1( 2 ) = ib0( 2 )

            ib2( 1 ) = ib0( 1 )

            ib2( 2 ) = ib0( 2 )

            ib3( 1 ) = ib0( 1 )

            ib3( 2 ) = ib0( 2 )

*

   90    CONTINUE

*

      ELSE IF( ( lsame( aform, 'S' ) ).OR.( lsame( aform, 'H' ) ) ) THEN

*

*        Generate a symmetric matrix

*

         IF( lsame( uplo, 'L' ) ) THEN

*

*           generate lower trapezoidal part

*

            jj = 1

            lcmtc = lcmt00

*

            DO 170 jblk = 1, nblks

*

               IF( jblk.EQ.1 ) THEN

                  jb  = inbloc

                  low = 1 - inbloc

               ELSE IF( jblk.EQ.nblks ) THEN

                  jb = lnbloc

                  low = 1 - nb

               ELSE

                  jb  = nb

                  low = 1 - nb

               END IF

*

               DO 160 jk = jj, jj + jb - 1

*

                  ii = 1

                  lcmtr = lcmtc

*

                  DO 150 iblk = 1, mblks

*

                     IF( iblk.EQ.1 ) THEN

                        ib  = imbloc

                        upp = imbloc - 1

                     ELSE IF( iblk.EQ.mblks ) THEN

                        ib  = lmbloc

                        upp = mb - 1

                     ELSE

                        ib  = mb

                        upp = mb - 1

                     END IF

*

*                    Blocks are IB by JB

*

                     IF( lcmtr.GT.upp ) THEN

*

                        DO 100 ik = ii, ii + ib - 1

                           dummy = pb_drand( 0 )

  100                   CONTINUE

*

                     ELSE IF( lcmtr.GE.low ) THEN

*

                        jtmp = jk - jj + 1

                        mnb  = max( 0, -lcmtr )

*

                        IF( jtmp.LE.min( mnb, jb ) ) THEN

*

                           DO 110 ik = ii, ii + ib - 1

                              a( ik, jk ) = pb_drand( 0 )

  110                      CONTINUE

*

                        ELSE IF( ( jtmp.GE.( mnb + 1 )         ) .AND.

     $                           ( jtmp.LE.min( ib-lcmtr, jb ) ) ) THEN

*

                           itmp = ii + jtmp + lcmtr - 1

*

                           DO 120 ik = ii, itmp - 1

                              dummy = pb_drand( 0 )

  120                      CONTINUE

*

                           DO 130 ik = itmp, ii + ib - 1

                              a( ik, jk ) = pb_drand( 0 )

  130                      CONTINUE

*

                        END IF

*

                     ELSE

*

                        DO 140 ik = ii, ii + ib - 1

                           a( ik, jk ) = pb_drand( 0 )

  140                   CONTINUE

*

                     END IF

*

                     ii = ii + ib

*

                     IF( iblk.EQ.1 ) THEN

*

*                       Jump IMBLOC + ( NPROW - 1 ) * MB rows

*

                        lcmtr = lcmtr - jmp( jmp_npimbloc )

                        CALL pb_jumpit( imuladd( 1, jmp_npimbloc ), ib1,

     $                                  ib0 )

*

                     ELSE

*

*                       Jump NPROW * MB rows

*

                        lcmtr = lcmtr - jmp( jmp_npmb )

                        CALL pb_jumpit( imuladd( 1, jmp_npmb ), ib1,

     $                                  ib0 )

*

                     END IF

*

                     ib1( 1 ) = ib0( 1 )

                     ib1( 2 ) = ib0( 2 )

*

  150             CONTINUE

*

*                 Jump one column

*

                  CALL pb_jumpit( imuladd( 1, jmp_col ), ib2, ib0 )

*

                  ib1( 1 ) = ib0( 1 )

                  ib1( 2 ) = ib0( 2 )

                  ib2( 1 ) = ib0( 1 )

                  ib2( 2 ) = ib0( 2 )

*

  160          CONTINUE

*

               jj = jj + jb

*

               IF( jblk.EQ.1 ) THEN

*

*                 Jump INBLOC + ( NPCOL - 1 ) * NB columns

*

                  lcmtc = lcmtc + jmp( jmp_nqinbloc )

                  CALL pb_jumpit( imuladd( 1, jmp_nqinbloc ), ib3, ib0 )

*

               ELSE

*

*                 Jump NPCOL * NB columns

*

                  lcmtc = lcmtc + jmp( jmp_nqnb )

                  CALL pb_jumpit( imuladd( 1, jmp_nqnb ), ib3, ib0 )

*

               END IF

*

               ib1( 1 ) = ib0( 1 )

               ib1( 2 ) = ib0( 2 )

               ib2( 1 ) = ib0( 1 )

               ib2( 2 ) = ib0( 2 )

               ib3( 1 ) = ib0( 1 )

               ib3( 2 ) = ib0( 2 )

*

  170       CONTINUE

*

         ELSE

*

*           generate upper trapezoidal part

*

            ii = 1

            lcmtr = lcmt00

*

            DO 250 iblk = 1, mblks

*

               IF( iblk.EQ.1 ) THEN

                  ib  = imbloc

                  upp = imbloc - 1

               ELSE IF( iblk.EQ.mblks ) THEN

                  ib  = lmbloc

                  upp = mb - 1

               ELSE

                  ib  = mb

                  upp = mb - 1

               END IF

*

               DO 240 ik = ii, ii + ib - 1

*

                  jj = 1

                  lcmtc = lcmtr

*

                  DO 230 jblk = 1, nblks

*

                     IF( jblk.EQ.1 ) THEN

                        jb  = inbloc

                        low = 1 - inbloc

                     ELSE IF( jblk.EQ.nblks ) THEN

                        jb  = lnbloc

                        low = 1 - nb

                     ELSE

                        jb  = nb

                        low = 1 - nb

                     END IF

*

*                    Blocks are IB by JB

*

                     IF( lcmtc.LT.low ) THEN

*

                        DO 180 jk = jj, jj + jb - 1

                           dummy = pb_drand( 0 )

  180                   CONTINUE

*

                     ELSE IF( lcmtc.LE.upp ) THEN

*

                        itmp = ik - ii + 1

                        mnb  = max( 0, lcmtc )

*

                        IF( itmp.LE.min( mnb, ib ) ) THEN

*

                           DO 190 jk = jj, jj + jb - 1

                              a( ik, jk ) = pb_drand( 0 )

  190                      CONTINUE

*

                        ELSE IF( ( itmp.GE.( mnb + 1 )         ) .AND.

     $                           ( itmp.LE.min( jb+lcmtc, ib ) ) ) THEN

*

                           jtmp = jj + itmp - lcmtc - 1

*

                           DO 200 jk = jj, jtmp - 1

                              dummy = pb_drand( 0 )

  200                      CONTINUE

*

                           DO 210 jk = jtmp, jj + jb - 1

                              a( ik, jk ) = pb_drand( 0 )

  210                      CONTINUE

*

                        END IF

*

                     ELSE

*

                        DO 220 jk = jj, jj + jb - 1

                           a( ik, jk ) = pb_drand( 0 )

  220                   CONTINUE

*

                     END IF

*

                     jj = jj + jb

*

                     IF( jblk.EQ.1 ) THEN

*

*                       Jump INBLOC + ( NPCOL - 1 ) * NB columns

*

                        lcmtc = lcmtc + jmp( jmp_nqinbloc )

                        CALL pb_jumpit( imuladd( 1, jmp_nqinbloc ), ib1,

     $                                  ib0 )

*

                     ELSE

*

*                       Jump NPCOL * NB columns

*

                        lcmtc = lcmtc + jmp( jmp_nqnb )

                        CALL pb_jumpit( imuladd( 1, jmp_nqnb ), ib1,

     $                                  ib0 )

*

                     END IF

*

                     ib1( 1 ) = ib0( 1 )

                     ib1( 2 ) = ib0( 2 )

*

  230             CONTINUE

*

*                 Jump one row

*

                  CALL pb_jumpit( imuladd( 1, jmp_row ), ib2, ib0 )

*

                  ib1( 1 ) = ib0( 1 )

                  ib1( 2 ) = ib0( 2 )

                  ib2( 1 ) = ib0( 1 )

                  ib2( 2 ) = ib0( 2 )

*

  240          CONTINUE

*

               ii = ii + ib

*

               IF( iblk.EQ.1 ) THEN

*

*                 Jump IMBLOC + ( NPROW - 1 ) * MB rows

*

                  lcmtr = lcmtr - jmp( jmp_npimbloc )

                  CALL pb_jumpit( imuladd( 1, jmp_npimbloc ), ib3, ib0 )

*

               ELSE

*

*                 Jump NPROW * MB rows

*

                  lcmtr = lcmtr - jmp( jmp_npmb )

                  CALL pb_jumpit( imuladd( 1, jmp_npmb ), ib3, ib0 )

*

               END IF

*

               ib1( 1 ) = ib0( 1 )

               ib1( 2 ) = ib0( 2 )

               ib2( 1 ) = ib0( 1 )

               ib2( 2 ) = ib0( 2 )

               ib3( 1 ) = ib0( 1 )

               ib3( 2 ) = ib0( 2 )

*

  250       CONTINUE

*

         END IF

*

      END IF

*

      RETURN

*

*     End of PB_DLAGEN

*


      END


      DOUBLE PRECISION FUNCTION pb_drand( IDUMM )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            idumm
*     ..
*
*  Purpose
*  =======
*
*  PB_DRAND draws one value  x  from PB_DRAN and returns  1 - 2 * x.
*  The map sends  x = 0  to  1  and  x = 1  to  -1,  so  the  interval
*  covered by the result follows directly from the  interval  covered
*  by PB_DRAN  (for  x  in  [ 0, 1 )  the result lies in  ( -1, 1 ]).
*
*  Arguments
*  =========
*
*  IDUMM   (local input) INTEGER
*          Not used by this function itself;  it is passed  unchanged
*          to PB_DRAN.
*
*  Further Details
*  ===============
*
*  PB_DRAN is called exactly once per call of PB_DRAND, so whatever
*  generator state PB_DRAN maintains is advanced by one step.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   offset, slope
      PARAMETER          ( offset = 1.0d+0, slope = 2.0d+0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   unif
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   pb_dran
      EXTERNAL           pb_dran
*     ..
*     .. Executable Statements ..
*
*     Next value of the underlying sequence
*
      unif = pb_dran( idumm )
*
*     Affine map  x -> 1 - 2 * x
*
      pb_drand = offset - slope * unif
*
      RETURN
*
*     End of PB_DRAND
*
      END


      DOUBLE PRECISION FUNCTION pb_dran( IDUMM )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            idumm
*     ..
*
*  Purpose
*  =======
*
*  PB_DRAN returns the current number of the random sequence whose
*  state is kept in the common block RANCOM, and then advances that
*  state by one step.
*
*  Arguments
*  =========
*
*  IDUMM   (local input) INTEGER
*          This argument is never referenced in the function body.
*
*  Further Details
*  ===============
*
*  On entry, the array IRAND of the common block  RANCOM  holds  the
*  two integers that describe the current term X( n ).  The value
*  returned is
*
*     X( n ) = ( 2^16 * IRAND( 2 ) + IRAND( 1 ) ) / d,
*
*  where  d = 2.147483648D+9  ( = 2^31 ).
*
*  IRAND is then overwritten by the two calls
*
*     CALL PB_LMUL( IRAND, IACS, J )
*     CALL PB_LADD( J, IACS( 3 ), IRAND )
*
*  According to the original authors this realizes the recurrence
*  X( n+1 ) = a * X( n ) + c,  the constants  a  and  c  being stored
*  in IACS as 2 pairs of integers, and IRAND and IACS being set up
*  beforehand by PB_SETRAN.  Those routines are not part of this
*  program unit; confirm the details against their sources.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   two16, two31
      PARAMETER          ( two16 = 6.5536d+4,
     $                   two31 = 2.147483648d+9 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   xhi, xlo
*     ..
*     .. Local Arrays ..
      INTEGER            iprod( 2 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           pb_ladd, pb_lmul
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          dble
*     ..
*     .. Common Blocks ..
      INTEGER            iacs( 4 ), irand( 2 )
      COMMON             /rancom/ irand, iacs
*     ..
*     .. Save Statements ..
      SAVE               /rancom/
*     ..
*     .. Executable Statements ..
*
*     Convert both halves of the current state to floating point
*     before the state is overwritten below.
*
      xlo = dble( irand( 1 ) )
      xhi = dble( irand( 2 ) )
*
      pb_dran = ( xlo + two16 * xhi ) / two31
*
*     Advance the state:  multiply step into the work array, then
*     add step back into IRAND.  IACS( 3 ) passes the trailing part
*     of IACS, starting at its third element.
*
      CALL pb_lmul( irand, iacs, iprod )
      CALL pb_ladd( iprod, iacs( 3 ), irand )
*
      RETURN
*
*     End of PB_DRAN
*
      END

min
#define min(a, b)
Definition macros.h:20

max
#define max(a, b)
Definition macros.h:21

pxerbla
subroutine pxerbla(contxt, srname, info)
Definition mpi.f:1600

blacs_gridinfo
subroutine blacs_gridinfo(cntxt, nprow, npcol, myrow, mycol)
Definition mpi.f:754

pb_ainfog2l
subroutine pb_ainfog2l(m, n, i, j, desc, nprow, npcol, myrow, mycol, imb1, inb1, mp, nq, ii, jj, prow, pcol, rprow, rpcol)
Definition pblastst.f:2023

pb_ladd
subroutine pb_ladd(j, k, i)
Definition pblastst.f:4480

pb_binfo
subroutine pb_binfo(offd, m, n, imb1, inb1, mb, nb, mrrow, mrcol, lcmt00, mblks, nblks, imbloc, inbloc, lmbloc, lnbloc, ilow, low, iupp, upp)
Definition pblastst.f:3577

pb_setran
subroutine pb_setran(iran, iac)
Definition pblastst.f:4759

pb_infog2l
subroutine pb_infog2l(i, j, desc, nprow, npcol, myrow, mycol, ii, jj, prow, pcol)
Definition pblastst.f:1673

pb_locinfo
subroutine pb_locinfo(i, inb, nb, myroc, srcproc, nprocs, ilocblk, ilocoff, mydist)
Definition pblastst.f:3910

pb_chkmat
subroutine pb_chkmat(ictxt, m, mpos0, n, npos0, ia, ja, desca, dpos0, info)
Definition pblastst.f:2742

pb_lmul
subroutine pb_lmul(k, j, i)
Definition pblastst.f:4559

pb_jump
subroutine pb_jump(k, muladd, irann, iranm, ima)
Definition pblastst.f:4648

pb_setlocran
subroutine pb_setlocran(seed, ilocblk, jlocblk, ilocoff, jlocoff, myrdist, mycdist, nprow, npcol, jmp, imuladd, iran)
Definition pblastst.f:4302

pb_initmuladd
subroutine pb_initmuladd(muladd0, jmp, imuladd)
Definition pblastst.f:4196

pb_desctrans
subroutine pb_desctrans(descin, descout)
Definition pblastst.f:2964

pb_initjmp
subroutine pb_initjmp(colmaj, nvir, imbvir, inbvir, imbloc, inbloc, mb, nb, rsrc, csrc, nprow, npcol, stride, jmp)
Definition pblastst.f:4045

pb_jumpit
subroutine pb_jumpit(muladd, irann, iranm)
Definition pblastst.f:4822

pb_dran
double precision function pb_dran(idumm)
Definition pdblastim.f:2182

pdlagen
subroutine pdlagen(inplace, aform, diag, offa, m, n, ia, ja, desca, iaseed, a, lda)
Definition pdblastim.f:510

pb_dlagen
subroutine pb_dlagen(uplo, aform, a, lda, lcmt00, iran, mblks, imbloc, mb, lmbloc, nblks, inbloc, nb, lnbloc, jmp, imuladd)
Definition pdblastim.f:1479

pdlascal
subroutine pdlascal(type, m, n, alpha, a, ia, ja, desca)
Definition pdblastim.f:2

pdladom
subroutine pdladom(inplace, n, alpha, a, ia, ja, desca)
Definition pdblastim.f:907

pb_drand
double precision function pb_drand(idumm)
Definition pdblastim.f:2120

pb_dlascal
subroutine pb_dlascal(uplo, m, n, ioffd, alpha, a, lda)
Definition pdblastim.f:1298