Functions/Subroutines
subroutine	pdlaqr4 (wantt, wantz, n, ilo, ihi, a, desca, wr, wi, iloz, ihiz, z, descz, t, ldt, v, ldv, work, lwork, info)
Function/Subroutine Documentation

◆ pdlaqr4()

subroutine pdlaqr4	(	logical	wantt,
		logical	wantz,
		integer	n,
		integer	ilo,
		integer	ihi,
		double precision, dimension( * )	a,
		integer, dimension( * )	desca,
		double precision, dimension( * )	wr,
		double precision, dimension( * )	wi,
		integer	iloz,
		integer	ihiz,
		double precision, dimension( * )	z,
		integer, dimension( * )	descz,
		double precision, dimension( ldt, * )	t,
		integer	ldt,
		double precision, dimension( ldv, * )	v,
		integer	ldv,
		double precision, dimension( * )	work,
		integer	lwork,
		integer	info )
Definition at line 1 of file pdlaqr4.f.
*
*     Contribution from the Department of Computing Science and HPC2N,
*     Umea University, Sweden
*
*  -- ScaLAPACK routine (version 2.0.2) --
*     Univ. of Tennessee, Univ. of California Berkeley, Univ. of Colorado Denver
*     May 1 2012
*
      IMPLICIT NONE
*
*     .. Scalar Arguments ..
      LOGICAL            WANTT, WANTZ
      INTEGER            IHI, IHIZ, ILO, ILOZ, INFO, LDT, LDV, LWORK, N
*     ..
*     .. Array Arguments ..
      INTEGER            DESCA( * ), DESCZ( * )
      DOUBLE PRECISION   A( * ), T( LDT, * ), V( LDV, * ), WI( * ),
     $                   WORK( * ), WR( * ), Z( * )
*     ..
*
*  Purpose
*  =======
*
*  PDLAQR4 is an auxiliary routine used to find the Schur decomposition
*  and/or eigenvalues of a matrix already in Hessenberg form from cols
*  ILO to IHI.  This routine requires that the active block is small
*  enough, i.e. IHI-ILO+1 .LE. LDT, so that it can be solved by LAPACK.
*  Normally, it is called by PDLAQR1.  All the inputs are assumed to be
*  valid without checking.
*
*  Notes
*  =====
*
*  Each global data object is described by an associated description
*  vector.  This vector stores the information required to establish
*  the mapping between an object element and its corresponding process
*  and memory location.
*
*  Let A be a generic term for any 2D block cyclicly distributed array.
*  Such a global array has an associated description vector DESCA.
*  In the following comments, the character _ should be read as
*  "of the global array".
*
*  NOTATION        STORED IN      EXPLANATION
*  --------------- -------------- --------------------------------------
*  DTYPE_A(global) DESCA( DTYPE_ )The descriptor type.  In this case,
*                                 DTYPE_A = 1.
*  CTXT_A (global) DESCA( CTXT_ ) The BLACS context handle, indicating
*                                 the BLACS process grid A is distribu-
*                                 ted over. The context itself is glo-
*                                 bal, but the handle (the integer
*                                 value) may vary.
*  M_A    (global) DESCA( M_ )    The number of rows in the global
*                                 array A.
*  N_A    (global) DESCA( N_ )    The number of columns in the global
*                                 array A.
*  MB_A   (global) DESCA( MB_ )   The blocking factor used to distribute
*                                 the rows of the array.
*  NB_A   (global) DESCA( NB_ )   The blocking factor used to distribute
*                                 the columns of the array.
*  RSRC_A (global) DESCA( RSRC_ ) The process row over which the first
*                                 row of the array A is distributed.
*  CSRC_A (global) DESCA( CSRC_ ) The process column over which the
*                                 first column of the array A is
*                                 distributed.
*  LLD_A  (local)  DESCA( LLD_ )  The leading dimension of the local
*                                 array.  LLD_A >= MAX(1,LOCr(M_A)).
*
*  Let K be the number of rows or columns of a distributed matrix,
*  and assume that its process grid has dimension p x q.
*  LOCr( K ) denotes the number of elements of K that a process
*  would receive if K were distributed over the p processes of its
*  process column.
*  Similarly, LOCc( K ) denotes the number of elements of K that a
*  process would receive if K were distributed over the q processes of
*  its process row.
*  The values of LOCr() and LOCc() may be determined via a call to the
*  ScaLAPACK tool function, NUMROC:
*          LOCr( M ) = NUMROC( M, MB_A, MYROW, RSRC_A, NPROW ),
*          LOCc( N ) = NUMROC( N, NB_A, MYCOL, CSRC_A, NPCOL ).
*  An upper bound for these quantities may be computed by:
*          LOCr( M ) <= ceil( ceil(M/MB_A)/NPROW )*MB_A
*          LOCc( N ) <= ceil( ceil(N/NB_A)/NPCOL )*NB_A
*
*  Arguments
*  =========
*
*  WANTT   (global input) LOGICAL
*          = .TRUE. : the full Schur form T is required;
*          = .FALSE.: only eigenvalues are required.
*
*  WANTZ   (global input) LOGICAL
*          = .TRUE. : the matrix of Schur vectors Z is required;
*          = .FALSE.: Schur vectors are not required.
*
*  N       (global input) INTEGER
*          The order of the Hessenberg matrix A (and Z if WANTZ).
*          N >= 0.
*
*  ILO     (global input) INTEGER
*  IHI     (global input) INTEGER
*          It is assumed that A is already upper quasi-triangular in
*          rows and columns IHI+1:N, and that A(ILO,ILO-1) = 0 (unless
*          ILO = 1). PDLAQR4 works primarily with the Hessenberg
*          submatrix in rows and columns ILO to IHI, but applies
*          transformations to all of H if WANTT is .TRUE..
*          1 <= ILO <= max(1,IHI); IHI <= N.
*
*  A       (global input/output) DOUBLE PRECISION array, dimension
*          (DESCA(LLD_),*)
*          On entry, the upper Hessenberg matrix A.
*          On exit, if WANTT is .TRUE., A is upper quasi-triangular in
*          rows and columns ILO:IHI, with any 2-by-2 or larger diagonal
*          blocks not yet in standard form. If WANTT is .FALSE., the
*          contents of A are unspecified on exit.
*
*  DESCA   (global and local input) INTEGER array of dimension DLEN_.
*          The array descriptor for the distributed matrix A.
*
*  WR      (global replicated output) DOUBLE PRECISION array,
*                                                         dimension (N)
*  WI      (global replicated output) DOUBLE PRECISION array,
*                                                         dimension (N)
*          The real and imaginary parts, respectively, of the computed
*          eigenvalues ILO to IHI are stored in the corresponding
*          elements of WR and WI. If two eigenvalues are computed as a
*          complex conjugate pair, they are stored in consecutive
*          elements of WR and WI, say the i-th and (i+1)th, with
*          WI(i) > 0 and WI(i+1) < 0. If WANTT is .TRUE., the
*          eigenvalues are stored in the same order as on the diagonal
*          of the Schur form returned in A.  A may be returned with
*          larger diagonal blocks until the next release.
*
*  ILOZ    (global input) INTEGER
*  IHIZ    (global input) INTEGER
*          Specify the rows of Z to which transformations must be
*          applied if WANTZ is .TRUE..
*          1 <= ILOZ <= ILO; IHI <= IHIZ <= N.
*
*  Z       (global input/output) DOUBLE PRECISION array.
*          If WANTZ is .TRUE., on entry Z must contain the current
*          matrix Z of transformations accumulated by PDHSEQR, and on
*          exit Z has been updated; transformations are applied only to
*          the submatrix Z(ILOZ:IHIZ,ILO:IHI).
*          If WANTZ is .FALSE., Z is not referenced.
*
*  DESCZ   (global and local input) INTEGER array of dimension DLEN_.
*          The array descriptor for the distributed matrix Z.
*
*  T       (local workspace) DOUBLE PRECISION array, dimension LDT*NW.
*
*  LDT     (local input) INTEGER
*          The leading dimension of the array T.
*          LDT >= IHI-ILO+1.
*
*  V       (local workspace) DOUBLE PRECISION array, dimension LDV*NW.
*
*  LDV     (local input) INTEGER
*          The leading dimension of the array V.
*          LDV >= IHI-ILO+1.
*
*  WORK    (local workspace) DOUBLE PRECISION array, dimension LWORK.
*
*  LWORK   (local input) INTEGER
*          The dimension of the work array WORK.
*          LWORK >= IHI-ILO+1.
*          WORK(LWORK) is a local array and LWORK is assumed big enough.
*          Typically LWORK >= 4*LDS*LDS if this routine is called by
*          PDLAQR1. (LDS = 385, see PDLAQR1)
*
*  INFO    (global output) INTEGER
*          < 0: parameter number -INFO incorrect or inconsistent;
*          = 0: successful exit;
*          > 0: PDLAQR4 failed to compute all the eigenvalues ILO to IHI
*               in a total of 30*(IHI-ILO+1) iterations; if INFO = i,
*               elements i+1:ihi of WR and WI contain those eigenvalues
*               which have been successfully computed.
*
*  ================================================================
*  Implemented by
*        Meiyue Shao, Department of Computing Science and HPC2N,
*        Umea University, Sweden
*
*  ================================================================
*  References:
*        B. Kagstrom, D. Kressner, and M. Shao,
*        On Aggressive Early Deflation in Parallel Variants of the QR
*        Algorithm.
*        Para 2010, to appear.
*
*  ================================================================
*     .. Parameters ..
      INTEGER            BLOCK_CYCLIC_2D, CSRC_, CTXT_, DLEN_, DTYPE_,
     $                   LLD_, MB_, M_, NB_, N_, RSRC_
      parameter( block_cyclic_2d = 1, dlen_ = 9, dtype_ = 1,
     $                     ctxt_ = 2, m_ = 3, n_ = 4, mb_ = 5, nb_ = 6,
     $                     rsrc_ = 7, csrc_ = 8, lld_ = 9 )
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d+0, one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            CONTXT, HBL, I, I1, I2, IAFIRST, ICOL, ICOL1,
     $                   ICOL2, II, IROW, IROW1, IROW2, ITMP1, ITMP2,
     $                   IERR, J, JAFIRST, JJ, K, L, LDA, LDZ, LLDTMP,
     $                   MYCOL, MYROW, NODE, NPCOL, NPROW, NH, NMIN, NZ,
     $                   HSTEP, VSTEP, KKROW, KKCOL, KLN, LTOP, LEFT,
     $                   RIGHT, UP, DOWN, D1, D2
*     ..
*     .. Local Arrays ..
      INTEGER            DESCT( 9 ), DESCV( 9 ), DESCWH( 9 ),
     $                   DESCWV( 9 )
*     ..
*     .. External Functions ..
      INTEGER            NUMROC, ILAENV
      EXTERNAL           numroc, ilaenv
*     ..
*     .. External Subroutines ..
      EXTERNAL           blacs_gridinfo, infog2l, dlaset,
     $                   dlahqr, dlaqr4, descinit, pdgemm, pdgemr2d,
     $                   dgemm, dlamov, dgesd2d, dgerv2d,
     $                   dgebs2d, dgebr2d, igebs2d, igebr2d
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min, mod
*     ..
*     .. Executable Statements ..
*
*     Set-up, local Schur solve of the active block, and write-back.
*
      info = 0
*
*     NH is the order of the active block ILO:IHI.  NZ is computed
*     here but is not referenced again in this routine.
*
      nh = ihi - ilo + 1
      nz = ihiz - iloz + 1
      IF( n.EQ.0 .OR. nh.EQ.0 )
     $   RETURN
*
*     NODE (IAFIRST,JAFIRST) OWNS A(1,1)
*
*     HBL is taken from the row blocking factor MB_ of A and is also
*     used below as the column blocking factor.
*
      hbl = desca( mb_ )
      contxt = desca( ctxt_ )
      lda = desca( lld_ )
      iafirst = desca( rsrc_ )
      jafirst = desca( csrc_ )
      ldz = descz( lld_ )
      CALL blacs_gridinfo( contxt, nprow, npcol, myrow, mycol )
*
*     LEFT/RIGHT/UP/DOWN are the neighbouring process column/row
*     coordinates with wrap-around.  On a grid with one process
*     column LEFT = RIGHT = MYCOL; with one process row UP = DOWN =
*     MYROW.  NODE is computed but not used afterwards.
*
      node = myrow*npcol + mycol
      left = mod( mycol+npcol-1, npcol )
      right = mod( mycol+1, npcol )
      up = mod( myrow+nprow-1, nprow )
      down = mod( myrow+1, nprow )
*
*     LTOP is the first row of A to which column transformations are
*     applied: row 1 when the full Schur form is wanted, row ILO
*     otherwise.  I1 and I2 (first row / last column) are set here
*     but are not referenced again in this routine.
*
      i = ihi
      l = ilo
      IF( wantt ) THEN
         i1 = 1
         i2 = n
         ltop = 1
      ELSE
         i1 = l
         i2 = i
         ltop = l
      END IF
*
*     Copy the diagonal block to local and call LAPACK.
*
*     (II,JJ) are the process coordinates returned by INFOG2L for
*     A(ILO,ILO).  T and V are described as NH-by-NH matrices made of
*     a single NH-by-NH block whose source process is (II,JJ); the
*     leading dimension is LDT/LDV on process row II and 1 elsewhere.
*
      CALL infog2l( ilo, ilo, desca, nprow, npcol, myrow, mycol,
     $     irow, icol, ii, jj )
      IF ( myrow .EQ. ii ) THEN
         CALL descinit( desct, nh, nh, nh, nh, ii, jj, contxt,
     $        ldt, ierr )
         CALL descinit( descv, nh, nh, nh, nh, ii, jj, contxt,
     $        ldv, ierr )
      ELSE
         CALL descinit( desct, nh, nh, nh, nh, ii, jj, contxt,
     $        1, ierr )
         CALL descinit( descv, nh, nh, nh, nh, ii, jj, contxt,
     $        1, ierr )
      END IF
*
*     Redistribute A(ILO:IHI,ILO:IHI) into T.
*
      CALL pdgemr2d( nh, nh, a, ilo, ilo, desca, t, 1, 1, desct,
     $     contxt )
*
*     Only process (II,JJ) runs the sequential solver.  V starts as
*     the identity and accumulates the transformations; the solver is
*     always called with WANTT = WANTZ = .TRUE. regardless of the
*     flags passed to this routine.  DLAQR4 is used when NH exceeds
*     the crossover NMIN returned by ILAENV, DLAHQR otherwise.
*     NOTE(review): WR and WI are written only on process (II,JJ)
*     here; no broadcast of them is visible in this routine.
*
      IF ( myrow .EQ. ii .AND. mycol .EQ. jj ) THEN
         CALL dlaset( 'All', nh, nh, zero, one, v, ldv )
         nmin = ilaenv( 12, 'DLAQR3', 'SV', nh, 1, nh, lwork )
         IF( nh .GT. nmin ) THEN
            CALL dlaqr4( .true., .true., nh, 1, nh, t, ldt, wr( ilo ),
     $           wi( ilo ), 1, nh, v, ldv, work, lwork, info )
*           Clean up the scratch used by DLAQR4: zero the entries of
*           T below the first subdiagonal.
            CALL dlaset( 'L', nh-2, nh-2, zero, zero, t( 3, 1 ), ldt )
         ELSE
            CALL dlahqr( .true., .true., nh, 1, nh, t, ldt, wr( ilo ),
     $           wi( ilo ), 1, nh, v, ldv, info )
         END IF
*
*        Broadcast V and the solver status to every process.
*
         CALL dgebs2d( contxt, 'All', ' ', nh, nh, v, ldv )
         CALL igebs2d( contxt, 'All', ' ', 1, 1, info, 1 )
      ELSE
         CALL dgebr2d( contxt, 'All', ' ', nh, nh, v, ldv, ii, jj )
         CALL igebr2d( contxt, 'All', ' ', 1, 1, info, 1, ii, jj )
      END IF
*
*     A nonzero INFO from the solver is an index within the NH-by-NH
*     block; shift it by ILO-1 to refer to the global matrix.
*
      IF( info .NE. 0 ) info = info+ilo-1
*
*     Copy the local matrix back to the diagonal block.
*
      CALL pdgemr2d( nh, nh, t, 1, 1, desct, a, ilo, ilo, desca,
     $     contxt )
*
*     Update T and Z.
*
      IF( mod( ilo-1, hbl )+nh .LE. hbl ) THEN
*
*        Simplest case: the diagonal block is located on one processor.
*        Call DGEMM directly to perform the update.
*
*        HSTEP/VSTEP: number of columns (horizontal slab) or rows
*        (vertical slab) processed per DGEMM call, chosen so that the
*        NH-by-KLN or KLN-by-NH product fits in WORK.
*
         hstep = lwork / nh
         vstep = hstep
*
         IF( wantt ) THEN
*
*           Update horizontal slab in A: rows ILO:IHI, from global
*           column IHI+1 to the last local column, are overwritten
*           by V**T times themselves, KLN columns at a time.  Only
*           the process row II returned by INFOG2L takes part.
*
            CALL infog2l( ilo, i+1, desca, nprow, npcol, myrow,
     $           mycol, irow, icol, ii, jj )
            IF( myrow .EQ. ii ) THEN
*              ICOL1 = local column count of A on this process.
               icol1 = numroc( n, hbl, mycol, jafirst, npcol )
               DO 10 kkcol = icol, icol1, hstep
                  kln = min( hstep, icol1-kkcol+1 )
*                 WORK := V**T * A(slab); then copy WORK back.
                  CALL dgemm( 'T', 'N', nh, kln, nh, one, v,
     $                 ldv, a( irow+(kkcol-1)*lda ), lda, zero, work,
     $                 nh )
                  CALL dlamov( 'A', nh, kln, work, nh,
     $                 a( irow+(kkcol-1)*lda ), lda )
   10          CONTINUE
            END IF
*
*           Update vertical slab in A: columns ILO:IHI, global rows
*           LTOP:ILO-1, are overwritten by themselves times V, KLN
*           rows at a time.  Only process column JJ takes part.
*
            CALL infog2l( ltop, ilo, desca, nprow, npcol, myrow,
     $           mycol, irow, icol, ii, jj )
            IF( mycol .EQ. jj ) THEN
*              IROW1 = last local row to update.
*              NOTE(review): the decrement on process rows other than
*              ITMP1 presumably compensates for INFOG2L returning the
*              next local index on non-owning processes - confirm.
               CALL infog2l( ilo-1, ilo, desca, nprow, npcol,
     $              myrow, mycol, irow1, icol1, itmp1, itmp2 )
               IF( myrow .NE. itmp1 ) irow1 = irow1-1
               DO 20 kkrow = irow, irow1, vstep
                  kln = min( vstep, irow1-kkrow+1 )
*                 WORK := A(slab) * V; then copy WORK back.
                  CALL dgemm( 'N', 'N', kln, nh, nh, one,
     $                 a( kkrow+(icol-1)*lda ), lda, v, ldv, zero,
     $                 work, kln )
                  CALL dlamov( 'A', kln, nh, work, kln,
     $                 a( kkrow+(icol-1)*lda ), lda )
   20          CONTINUE
            END IF
         END IF
*
*        Update vertical slab in Z: columns ILO:IHI, global rows
*        ILOZ:IHIZ, are overwritten by themselves times V, using the
*        same row-chunking scheme as for A above.
*
         IF( wantz ) THEN
            CALL infog2l( iloz, ilo, descz, nprow, npcol, myrow,
     $           mycol, irow, icol, ii, jj )
            IF( mycol .EQ. jj ) THEN
               CALL infog2l( ihiz, ilo, descz, nprow, npcol,
     $              myrow, mycol, irow1, icol1, itmp1, itmp2 )
               IF( myrow .NE. itmp1 ) irow1 = irow1-1
               DO 30 kkrow = irow, irow1, vstep
                  kln = min( vstep, irow1-kkrow+1 )
                  CALL dgemm( 'N', 'N', kln, nh, nh, one,
     $                 z( kkrow+(icol-1)*ldz ), ldz, v, ldv, zero,
     $                 work, kln )
                  CALL dlamov( 'A', kln, nh, work, kln,
     $                 z( kkrow+(icol-1)*ldz ), ldz )
   30          CONTINUE
            END IF
         END IF
*
      ELSE IF( mod( ilo-1, hbl )+nh .LE. 2*hbl ) THEN
*
*        More complicated case: the diagonal block lay on a 2x2
*        processor mesh.
*        Call DGEMM locally and communicate by pair.
*
*        D1 = number of leading rows/columns of the NH-by-NH active
*        block lying in the distribution block that contains ILO;
*        D2 = the remaining rows/columns, lying in the next block.
*        V is partitioned conformally:
*           V11 = V(1:D1,1:D1)       V12 = V(1:D1,D1+1:NH)
*           V21 = V(D1+1:NH,1:D1)    V22 = V(D1+1:NH,D1+1:NH)
*        HSTEP/VSTEP bound the slab width per pass so that the
*        partial products fit in WORK.
*
         d1 = hbl - mod( ilo-1, hbl )
         d2 = nh - d1
         hstep = lwork / nh
         vstep = hstep
*
         IF( wantt ) THEN
*
*           Update horizontal slab in A (rows ILO:IHI, columns from
*           IHI+1 on):  A := V**T * A.
*
            CALL infog2l( ilo, i+1, desca, nprow, npcol, myrow,
     $           mycol, irow, icol, ii, jj )
            IF( myrow .EQ. up ) THEN
*
*              MYROW equals UP only when there is a single process
*              row, so all NH rows are local: one plain DGEMM.
*              V was built with leading dimension LDV, so LDV (not
*              NH) must be passed as its leading dimension.
*
               IF( myrow .EQ. ii ) THEN
                  icol1 = numroc( n, hbl, mycol, jafirst, npcol )
                  DO 40 kkcol = icol, icol1, hstep
                     kln = min( hstep, icol1-kkcol+1 )
                     CALL dgemm( 'T', 'N', nh, kln, nh, one, v,
     $                    ldv, a( irow+(kkcol-1)*lda ), lda, zero,
     $                    work, nh )
                     CALL dlamov( 'A', nh, kln, work, nh,
     $                    a( irow+(kkcol-1)*lda ), lda )
   40             CONTINUE
               END IF
            ELSE
               IF( myrow .EQ. ii ) THEN
*
*                 Process row II holds the first D1 rows (A1).
*                 Send V12**T*A1 down, receive V21**T*A2 from below,
*                 add V11**T*A1 and store the new first D1 rows.
*
                  icol1 = numroc( n, hbl, mycol, jafirst, npcol )
                  DO 50 kkcol = icol, icol1, hstep
                     kln = min( hstep, icol1-kkcol+1 )
                     CALL dgemm( 'T', 'N', d2, kln, d1, one,
     $                    v( 1, d1+1 ), ldv, a( irow+(kkcol-1)*lda ),
     $                    lda, zero, work( d1+1 ), nh )
                     CALL dgesd2d( contxt, d2, kln, work( d1+1 ),
     $                    nh, down, mycol )
                     CALL dgerv2d( contxt, d1, kln, work, nh, down,
     $                    mycol )
                     CALL dgemm( 'T', 'N', d1, kln, d1, one,
     $                    v, ldv, a( irow+(kkcol-1)*lda ), lda, one,
     $                    work, nh )
                     CALL dlamov( 'A', d1, kln, work, nh,
     $                    a( irow+(kkcol-1)*lda ), lda )
   50             CONTINUE
               ELSE IF( up .EQ. ii ) THEN
*
*                 The process row below II holds the last D2 rows
*                 (A2).  Send V21**T*A2 up, receive V12**T*A1 from
*                 above, add V22**T*A2 and store the new last D2
*                 rows.
*
                  icol1 = numroc( n, hbl, mycol, jafirst, npcol )
                  DO 60 kkcol = icol, icol1, hstep
                     kln = min( hstep, icol1-kkcol+1 )
                     CALL dgemm( 'T', 'N', d1, kln, d2, one,
     $                    v( d1+1, 1 ), ldv, a( irow+(kkcol-1)*lda ),
     $                    lda, zero, work, nh )
                     CALL dgesd2d( contxt, d1, kln, work, nh, up,
     $                    mycol )
                     CALL dgerv2d( contxt, d2, kln, work( d1+1 ),
     $                    nh, up, mycol )
                     CALL dgemm( 'T', 'N', d2, kln, d2, one,
     $                    v( d1+1, d1+1 ), ldv,
     $                    a( irow+(kkcol-1)*lda ), lda, one,
     $                    work( d1+1 ), nh )
                     CALL dlamov( 'A', d2, kln, work( d1+1 ), nh,
     $                    a( irow+(kkcol-1)*lda ), lda )
   60             CONTINUE
               END IF
            END IF
*
*           Update vertical slab in A (rows LTOP:ILO-1, columns
*           ILO:IHI):  A := A * V.
*
            CALL infog2l( ltop, ilo, desca, nprow, npcol, myrow,
     $           mycol, irow, icol, ii, jj )
            IF( mycol .EQ. left ) THEN
*
*              MYCOL equals LEFT only when there is a single process
*              column, so all NH columns are local: one plain DGEMM.
*
               IF( mycol .EQ. jj ) THEN
                  CALL infog2l( ilo-1, ilo, desca, nprow, npcol,
     $                 myrow, mycol, irow1, icol1, itmp1, itmp2 )
                  IF( myrow .NE. itmp1 ) irow1 = irow1-1
                  DO 70 kkrow = irow, irow1, vstep
                     kln = min( vstep, irow1-kkrow+1 )
                     CALL dgemm( 'N', 'N', kln, nh, nh, one,
     $                    a( kkrow+(icol-1)*lda ), lda, v, ldv,
     $                    zero, work, kln )
                     CALL dlamov( 'A', kln, nh, work, kln,
     $                    a( kkrow+(icol-1)*lda ), lda )
   70             CONTINUE
               END IF
            ELSE
               IF( mycol .EQ. jj ) THEN
*
*                 Process column JJ holds the first D1 columns (A1).
*                 Send A1*V12 right, receive A2*V21 from the right,
*                 add A1*V11 and store the new first D1 columns.
*
                  CALL infog2l( ilo-1, ilo, desca, nprow, npcol,
     $                 myrow, mycol, irow1, icol1, itmp1, itmp2 )
                  IF( myrow .NE. itmp1 ) irow1 = irow1-1
                  DO 80 kkrow = irow, irow1, vstep
                     kln = min( vstep, irow1-kkrow+1 )
                     CALL dgemm( 'N', 'N', kln, d2, d1, one,
     $                    a( kkrow+(icol-1)*lda ), lda, v( 1, d1+1 ),
     $                    ldv, zero, work( 1+d1*kln ), kln )
                     CALL dgesd2d( contxt, kln, d2, work( 1+d1*kln ),
     $                    kln, myrow, right )
                     CALL dgerv2d( contxt, kln, d1, work, kln, myrow,
     $                    right )
                     CALL dgemm( 'N', 'N', kln, d1, d1, one,
     $                    a( kkrow+(icol-1)*lda ), lda, v, ldv, one,
     $                    work, kln )
                     CALL dlamov( 'A', kln, d1, work, kln,
     $                    a( kkrow+(icol-1)*lda ), lda )
   80             CONTINUE
               ELSE IF ( left .EQ. jj ) THEN
*
*                 The process column right of JJ holds the last D2
*                 columns (A2).  Send A2*V21 left, receive A1*V12
*                 from the left, add A2*V22 and store the new last
*                 D2 columns.
*
                  CALL infog2l( ilo-1, ilo, desca, nprow, npcol,
     $                 myrow, mycol, irow1, icol1, itmp1, itmp2 )
                  IF( myrow .NE. itmp1 ) irow1 = irow1-1
                  DO 90 kkrow = irow, irow1, vstep
                     kln = min( vstep, irow1-kkrow+1 )
                     CALL dgemm( 'N', 'N', kln, d1, d2, one,
     $                    a( kkrow+(icol-1)*lda ), lda, v( d1+1, 1 ),
     $                    ldv, zero, work, kln )
                     CALL dgesd2d( contxt, kln, d1, work, kln, myrow,
     $                    left )
                     CALL dgerv2d( contxt, kln, d2, work( 1+d1*kln ),
     $                    kln, myrow, left )
                     CALL dgemm( 'n', 'n', KLN, D2, D2, ONE,
     $                    A( KKROW+(ICOL-1)*LDA ), LDA, V( D1+1, D1+1 ),
     $                    LDV, ONE, WORK( 1+D1*KLN ), KLN )
                     CALL DLAMOV( 'a', KLN, D2, WORK( 1+D1*KLN ), KLN,
     $                    A( KKROW+(ICOL-1)*LDA ), LDA )
   90             CONTINUE
               END IF
            END IF
         END IF
*
*        Update vertical slab in Z (rows ILOZ:IHIZ, columns ILO:IHI):
*        Z := Z * V, with V split into D1/D2 blocks exactly as for
*        the vertical slab of A.  The relational operators in the
*        tests below are written in place inside each condition, in
*        the same form as the corresponding tests for A.
*
         IF( WANTZ ) THEN
            CALL INFOG2L( ILOZ, ILO, DESCZ, NPROW, NPCOL, MYROW,
     $           MYCOL, IROW, ICOL, II, JJ )
            IF( MYCOL .EQ. LEFT ) THEN
*
*              MYCOL equals LEFT only when there is a single process
*              column, so all NH columns are local: one plain DGEMM.
*
               IF( MYCOL .EQ. JJ ) THEN
                  CALL INFOG2L( IHIZ, ILO, DESCZ, NPROW, NPCOL,
     $                 MYROW, MYCOL, IROW1, ICOL1, ITMP1, ITMP2 )
                  IF( MYROW .NE. ITMP1 ) IROW1 = IROW1-1
                  DO 100 KKROW = IROW, IROW1, VSTEP
                     KLN = MIN( VSTEP, IROW1-KKROW+1 )
                     CALL DGEMM( 'n', 'n', KLN, NH, NH, ONE,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ, V, LDV, ZERO,
     $                    WORK, KLN )
                     CALL DLAMOV( 'a', KLN, NH, WORK, KLN,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ )
  100             CONTINUE
               END IF
            ELSE
               IF( MYCOL .EQ. JJ ) THEN
*
*                 Process column JJ holds the first D1 columns (Z1).
*                 Send Z1*V(1:D1,D1+1:NH) right, receive the D1-wide
*                 partial product from the right, add
*                 Z1*V(1:D1,1:D1) and store the new first D1 columns.
*
                  CALL INFOG2L( IHIZ, ILO, DESCZ, NPROW, NPCOL,
     $                 MYROW, MYCOL, IROW1, ICOL1, ITMP1, ITMP2 )
                  IF( MYROW .NE. ITMP1 ) IROW1 = IROW1-1
                  DO 110 KKROW = IROW, IROW1, VSTEP
                     KLN = MIN( VSTEP, IROW1-KKROW+1 )
                     CALL DGEMM( 'n', 'n', KLN, D2, D1, ONE,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ, V( 1, D1+1 ),
     $                    LDV, ZERO, WORK( 1+D1*KLN ), KLN )
                     CALL DGESD2D( CONTXT, KLN, D2, WORK( 1+D1*KLN ),
     $                    KLN, MYROW, RIGHT )
                     CALL DGERV2D( CONTXT, KLN, D1, WORK, KLN, MYROW,
     $                    RIGHT )
                     CALL DGEMM( 'n', 'n', KLN, D1, D1, ONE,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ, V, LDV, ONE,
     $                    WORK, KLN )
                     CALL DLAMOV( 'a', KLN, D1, WORK, KLN,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ )
  110             CONTINUE
               ELSE IF( LEFT .EQ. JJ ) THEN
*
*                 The process column right of JJ holds the last D2
*                 columns (Z2).  Send Z2*V(D1+1:NH,1:D1) left,
*                 receive the D2-wide partial product from the left,
*                 add Z2*V(D1+1:NH,D1+1:NH) and store the new last
*                 D2 columns.
*
                  CALL INFOG2L( IHIZ, ILO, DESCZ, NPROW, NPCOL,
     $                 MYROW, MYCOL, IROW1, ICOL1, ITMP1, ITMP2 )
                  IF( MYROW .NE. ITMP1 ) IROW1 = IROW1-1
                  DO 120 KKROW = IROW, IROW1, VSTEP
                     KLN = MIN( VSTEP, IROW1-KKROW+1 )
                     CALL DGEMM( 'n', 'n', KLN, D1, D2, ONE,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ, V( D1+1, 1 ),
     $                    LDV, ZERO, WORK, KLN )
                     CALL DGESD2D( CONTXT, KLN, D1, WORK, KLN, MYROW,
     $                    LEFT )
                     CALL DGERV2D( CONTXT, KLN, D2, WORK( 1+D1*KLN ),
     $                    KLN, MYROW, LEFT )
                     CALL DGEMM( 'n', 'n', KLN, D2, D2, ONE,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ,
     $                    V( D1+1, D1+1 ), LDV, ONE, WORK( 1+D1*KLN ),
     $                    KLN )
                     CALL DLAMOV( 'a', KLN, D2, WORK( 1+D1*KLN ),
     $                    KLN, Z( KKROW+(ICOL-1)*LDZ ), LDZ )
  120             CONTINUE
               END IF
            END IF
         END IF
*
      ELSE
*
*        Most complicated case: the diagonal block lay across the border
*        of the processor mesh.
*        Treat V as a distributed matrix and call PDGEMM.
*
*        HSTEP/VSTEP: global slab width per PDGEMM call, i.e.
*        (LWORK/NH) columns or rows for each process column or row.
*        DESCV is rebuilt so that V is described as one NH-by-NH
*        block with source process (0,0); DESCWH describes WORK as
*        an NH-by-HSTEP matrix with column blocks of LWORK/NH.
*        NOTE(review): DESCV and DESCWH get leading dimension
*        MAX(1,NUMROC(NH,NH,MYROW,0,NPROW)), not LDV; presumably this
*        is NH on process row 0, which matches the storage of V only
*        if LDV equals NH - confirm against callers.
*
         HSTEP = LWORK / NH * NPCOL
         VSTEP = LWORK / NH * NPROW
         LLDTMP = NUMROC( NH, NH, MYROW, 0, NPROW )
         LLDTMP = MAX( 1, LLDTMP )
         CALL DESCINIT( DESCV, NH, NH, NH, NH, 0, 0, CONTXT,
     $        LLDTMP, IERR )
         CALL DESCINIT( DESCWH, NH, HSTEP, NH, LWORK / NH, 0, 0,
     $        CONTXT, LLDTMP, IERR )
*
         IF( WANTT ) THEN
*
*           Update horizontal slab in A: for each chunk of KLN
*           columns starting at IHI+1, form WORK := V**T *
*           A(ILO:IHI,chunk) with PDGEMM and redistribute WORK back
*           into A.
*
            DO 130 KKCOL = I+1, N, HSTEP
               KLN = MIN( HSTEP, N-KKCOL+1 )
               CALL PDGEMM( 't', 'n', NH, KLN, NH, ONE, V, 1, 1,
     $              DESCV, A, ILO, KKCOL, DESCA, ZERO, WORK, 1, 1,
     $              DESCWH )
               CALL PDGEMR2D( NH, KLN, WORK, 1, 1, DESCWH, A,
     $              ILO, KKCOL, DESCA, CONTXT )
  130       CONTINUE
*
*           Update vertical slab in A: for each chunk of KLN rows in
*           LTOP:ILO-1, form WORK := A(chunk,ILO:IHI) * V and
*           redistribute WORK back into A.  DESCWV is rebuilt for
*           every chunk because its row count KLN can change.
*
            DO 140 KKROW = LTOP, ILO-1, VSTEP
               KLN = MIN( VSTEP, ILO-KKROW )
               LLDTMP = NUMROC( KLN, LWORK / NH, MYROW, 0, NPROW )
               LLDTMP = MAX( 1, LLDTMP )
               CALL DESCINIT( DESCWV, KLN, NH, LWORK / NH, NH, 0, 0,
     $              CONTXT, LLDTMP, IERR )
               CALL PDGEMM( 'n', 'n', KLN, NH, NH, ONE, A, KKROW,
     $              ILO, DESCA, V, 1, 1, DESCV, ZERO, WORK, 1, 1,
     $              DESCWV )
               CALL PDGEMR2D( KLN, NH, WORK, 1, 1, DESCWV, A, KKROW,
     $              ILO, DESCA, CONTXT )
  140       CONTINUE
         END IF
*
*        Update vertical slab in Z: same scheme as the vertical slab
*        of A, applied to rows ILOZ:IHIZ of Z(:,ILO:IHI).
*
         IF( WANTZ ) THEN
            DO 150 KKROW = ILOZ, IHIZ, VSTEP
               KLN = MIN( VSTEP, IHIZ-KKROW+1 )
               LLDTMP = NUMROC( KLN, LWORK / NH, MYROW, 0, NPROW )
               LLDTMP = MAX( 1, LLDTMP )
               CALL DESCINIT( DESCWV, KLN, NH, LWORK / NH, NH, 0, 0,
     $              CONTXT, LLDTMP, IERR )
               CALL PDGEMM( 'n', 'n', KLN, NH, NH, ONE, Z, KKROW,
     $              ILO, DESCZ, V, 1, 1, DESCV, ZERO, WORK, 1, 1,
     $              DESCWV )
               CALL PDGEMR2D( KLN, NH, WORK, 1, 1, DESCWV, Z,
     $              KKROW, ILO, DESCZ, CONTXT )
  150       CONTINUE
         END IF
      END IF
*
*     END OF PDLAQR4
*
OpenRadioss 2025.1.11 OpenRadioss project
Functions/Subroutines

Function/Subroutine Documentation

◆ pdlaqr4()