d3/d19/pdlaqr4_8f_source.html

      SUBROUTINE PDLAQR4( WANTT, WANTZ, N, ILO, IHI, A, DESCA, WR, WI,
     $                    ILOZ, IHIZ, Z, DESCZ, T, LDT, V, LDV, WORK,
     $                    LWORK, INFO )
*
*     Contribution from the Department of Computing Science and HPC2N,
*     Umea University, Sweden
*
*  -- ScaLAPACK routine (version 2.0.2) --
*     Univ. of Tennessee, Univ. of California Berkeley, Univ. of Colorado Denver
*     May 1 2012
*
      IMPLICIT NONE
*
*     .. Scalar Arguments ..
      LOGICAL            WANTT, WANTZ
      INTEGER            IHI, IHIZ, ILO, ILOZ, INFO, LDT, LDV, LWORK, N
*     ..
*     .. Array Arguments ..
      INTEGER            DESCA( * ), DESCZ( * )
      DOUBLE PRECISION   A( * ), T( LDT, * ), V( LDV, * ), WI( * ),
     $                   WORK( * ), WR( * ), Z( * )
*     ..
*
*  Purpose
*  =======
*
*  PDLAQR4 is an auxiliary routine used to find the Schur decomposition
*  and or eigenvalues of a matrix already in Hessenberg form from cols
*  ILO to IHI.  This routine requires that the active block is small
*  enough, i.e. IHI-ILO+1 .LE. LDT, so that it can be solved by LAPACK.
*  Normally, it is called by PDLAQR1.  All the inputs are assumed to be
*  valid without checking.
*
*  Method
*  ======
*
*  1. The NH-by-NH diagonal block A(ILO:IHI,ILO:IHI), NH = IHI-ILO+1,
*     is copied with PDGEMR2D into the local array T on the process
*     that owns A(ILO,ILO).
*  2. That process computes the Schur form of T and the orthogonal
*     factor V with DLAQR4 (if NH > NMIN, NMIN obtained from ILAENV)
*     or DLAHQR, then broadcasts V and INFO to all processes.
*  3. T is copied back into the diagonal block of A.
*  4. The off-diagonal slabs of A (only if WANTT) and the columns
*     ILO:IHI of Z (only if WANTZ) are updated with V.  Three cases
*     are distinguished, depending on how the diagonal block is laid
*     out relative to the distribution block size HBL = DESCA( MB_ ):
*       a) the block lies inside one distribution block: local DGEMM;
*       b) the block spans two distribution blocks: local DGEMMs plus
*          pairwise exchange of partial products with a neighbour;
*       c) otherwise: V is treated as a distributed matrix and PDGEMM
*          is used.
*     WORK is used as the product buffer; slabs are processed in
*     chunks of LWORK/NH columns (rows) so that a chunk fits in WORK.
*
*  Notes
*  =====
*
*  Each global data object is described by an associated description
*  vector.  This vector stores the information required to establish
*  the mapping between an object element and its corresponding process
*  and memory location.
*
*  Let A be a generic term for any 2D block cyclicly distributed array.
*  Such a global array has an associated description vector DESCA.
*  In the following comments, the character _ should be read as
*  "of the global array".
*
*  NOTATION        STORED IN      EXPLANATION
*  --------------- -------------- --------------------------------------
*  DTYPE_A(global) DESCA( DTYPE_ )The descriptor type.  In this case,
*                                 DTYPE_A = 1.
*  CTXT_A (global) DESCA( CTXT_ ) The BLACS context handle, indicating
*                                 the BLACS process grid A is distribu-
*                                 ted over. The context itself is glo-
*                                 bal, but the handle (the integer
*                                 value) may vary.
*  M_A    (global) DESCA( M_ )    The number of rows in the global
*                                 array A.
*  N_A    (global) DESCA( N_ )    The number of columns in the global
*                                 array A.
*  MB_A   (global) DESCA( MB_ )   The blocking factor used to distribute
*                                 the rows of the array.
*  NB_A   (global) DESCA( NB_ )   The blocking factor used to distribute
*                                 the columns of the array.
*  RSRC_A (global) DESCA( RSRC_ ) The process row over which the first
*                                 row of the array A is distributed.
*  CSRC_A (global) DESCA( CSRC_ ) The process column over which the
*                                 first column of the array A is
*                                 distributed.
*  LLD_A  (local)  DESCA( LLD_ )  The leading dimension of the local
*                                 array.  LLD_A >= MAX(1,LOCr(M_A)).
*
*  Let K be the number of rows or columns of a distributed matrix,
*  and assume that its process grid has dimension p x q.
*  LOCr( K ) denotes the number of elements of K that a process
*  would receive if K were distributed over the p processes of its
*  process column.
*  Similarly, LOCc( K ) denotes the number of elements of K that a
*  process would receive if K were distributed over the q processes of
*  its process row.
*  The values of LOCr() and LOCc() may be determined via a call to the
*  ScaLAPACK tool function, NUMROC:
*          LOCr( M ) = NUMROC( M, MB_A, MYROW, RSRC_A, NPROW ),
*          LOCc( N ) = NUMROC( N, NB_A, MYCOL, CSRC_A, NPCOL ).
*  An upper bound for these quantities may be computed by:
*          LOCr( M ) <= ceil( ceil(M/MB_A)/NPROW )*MB_A
*          LOCc( N ) <= ceil( ceil(N/NB_A)/NPCOL )*NB_A
*
*  Arguments
*  =========
*
*  WANTT   (global input) LOGICAL
*          = .TRUE. : the full Schur form T is required;
*          = .FALSE.: only eigenvalues are required.
*
*  WANTZ   (global input) LOGICAL
*          = .TRUE. : the matrix of Schur vectors Z is required;
*          = .FALSE.: Schur vectors are not required.
*
*  N       (global input) INTEGER
*          The order of the Hessenberg matrix A (and Z if WANTZ).
*          N >= 0.
*
*  ILO     (global input) INTEGER
*  IHI     (global input) INTEGER
*          It is assumed that A is already upper quasi-triangular in
*          rows and columns IHI+1:N, and that A(ILO,ILO-1) = 0 (unless
*          ILO = 1). PDLAQR4 works primarily with the Hessenberg
*          submatrix in rows and columns ILO to IHI, but applies
*          transformations to all of H if WANTT is .TRUE..
*          1 <= ILO <= max(1,IHI); IHI <= N.
*
*  A       (global input/output) DOUBLE PRECISION array, dimension
*          (DESCA(LLD_),*)
*          On entry, the upper Hessenberg matrix A.
*          On exit, if WANTT is .TRUE., A is upper quasi-triangular in
*          rows and columns ILO:IHI, with any 2-by-2 or larger diagonal
*          blocks not yet in standard form. If WANTT is .FALSE., the
*          contents of A are unspecified on exit.
*
*  DESCA   (global and local input) INTEGER array of dimension DLEN_.
*          The array descriptor for the distributed matrix A.
*
*  WR      (global replicated output) DOUBLE PRECISION array,
*                                                         dimension (N)
*  WI      (global replicated output) DOUBLE PRECISION array,
*                                                         dimension (N)
*          The real and imaginary parts, respectively, of the computed
*          eigenvalues ILO to IHI are stored in the corresponding
*          elements of WR and WI. If two eigenvalues are computed as a
*          complex conjugate pair, they are stored in consecutive
*          elements of WR and WI, say the i-th and (i+1)th, with
*          WI(i) > 0 and WI(i+1) < 0. If WANTT is .TRUE., the
*          eigenvalues are stored in the same order as on the diagonal
*          of the Schur form returned in A.  A may be returned with
*          larger diagonal blocks until the next release.
*
*  ILOZ    (global input) INTEGER
*  IHIZ    (global input) INTEGER
*          Specify the rows of Z to which transformations must be
*          applied if WANTZ is .TRUE..
*          1 <= ILOZ <= ILO; IHI <= IHIZ <= N.
*
*  Z       (global input/output) DOUBLE PRECISION array.
*          If WANTZ is .TRUE., on entry Z must contain the current
*          matrix Z of transformations accumulated by PDHSEQR, and on
*          exit Z has been updated; transformations are applied only to
*          the submatrix Z(ILOZ:IHIZ,ILO:IHI).
*          If WANTZ is .FALSE., Z is not referenced.
*
*  DESCZ   (global and local input) INTEGER array of dimension DLEN_.
*          The array descriptor for the distributed matrix Z.
*
*  T       (local workspace) DOUBLE PRECISION array, dimension LDT*NW.
*
*  LDT     (local input) INTEGER
*          The leading dimension of the array T.
*          LDT >= IHI-ILO+1.
*
*  V       (local workspace) DOUBLE PRECISION array, dimension LDV*NW.
*          Holds the NH-by-NH orthogonal factor of the local Schur
*          decomposition; it is always addressed with leading
*          dimension LDV.
*
*  LDV     (local input) INTEGER
*          The leading dimension of the array V.
*          LDV >= IHI-ILO+1.
*
*  WORK    (local workspace) DOUBLE PRECISION array, dimension LWORK.
*
*  LWORK   (local input) INTEGER
*          The dimension of the work array WORK.
*          LWORK >= IHI-ILO+1.
*          WORK(LWORK) is a local array and LWORK is assumed big enough.
*          Typically LWORK >= 4*LDS*LDS if this routine is called by
*          PDLAQR1. (LDS = 385, see PDLAQR1)
*
*  INFO    (global output) INTEGER
*          < 0: parameter number -INFO incorrect or inconsistent;
*          = 0: successful exit;
*          > 0: PDLAQR4 failed to compute all the eigenvalues ILO to IHI
*               in a total of 30*(IHI-ILO+1) iterations; if INFO = i,
*               elements i+1:ihi of WR and WI contain those eigenvalues
*               which have been successfully computed.
*          PDLAQR4 itself performs no argument checking; a nonzero
*          value returned by the local LAPACK solver is shifted by
*          ILO-1 before it is returned.
*
*  ================================================================
*  Implemented by
*        Meiyue Shao, Department of Computing Science and HPC2N,
*        Umea University, Sweden
*
*  ================================================================
*  References:
*        B. Kagstrom, D. Kressner, and M. Shao,
*        On Aggressive Early Deflation in Parallel Variants of the QR
*        Algorithm.
*        Para 2010, to appear.
*
*  ================================================================
*     .. Parameters ..
      INTEGER            BLOCK_CYCLIC_2D, CSRC_, CTXT_, DLEN_, DTYPE_,
     $                   LLD_, MB_, M_, NB_, N_, RSRC_
      PARAMETER          ( BLOCK_CYCLIC_2D = 1, DLEN_ = 9, DTYPE_ = 1,
     $                     CTXT_ = 2, M_ = 3, N_ = 4, MB_ = 5, NB_ = 6,
     $                     RSRC_ = 7, CSRC_ = 8, LLD_ = 9 )
      DOUBLE PRECISION   ZERO, ONE
      PARAMETER          ( ZERO = 0.0D+0, ONE = 1.0D+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            CONTXT, HBL, I, I1, I2, IAFIRST, ICOL, ICOL1,
     $                   ICOL2, II, IROW, IROW1, IROW2, ITMP1, ITMP2,
     $                   IERR, J, JAFIRST, JJ, K, L, LDA, LDZ, LLDTMP,
     $                   MYCOL, MYROW, NODE, NPCOL, NPROW, NH, NMIN, NZ,
     $                   HSTEP, VSTEP, KKROW, KKCOL, KLN, LTOP, LEFT,
     $                   RIGHT, UP, DOWN, D1, D2
*     ..
*     .. Local Arrays ..
      INTEGER            DESCT( 9 ), DESCV( 9 ), DESCWH( 9 ),
     $                   DESCWV( 9 )
*     ..
*     .. External Functions ..
      INTEGER            NUMROC, ILAENV
      EXTERNAL           NUMROC, ILAENV
*     ..
*     .. External Subroutines ..
      EXTERNAL           BLACS_GRIDINFO, INFOG2L, DLASET,
     $                   DLAHQR, DLAQR4, DESCINIT, PDGEMM, PDGEMR2D,
     $                   DGEMM, DLAMOV, DGESD2D, DGERV2D,
     $                   DGEBS2D, DGEBR2D, IGEBS2D, IGEBR2D
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX, MIN, MOD
*     ..
*     .. Executable Statements ..
*
      INFO = 0
*
*     Quick return if the matrix or the active block is empty.
*
      NH = IHI - ILO + 1
      NZ = IHIZ - ILOZ + 1
      IF( N.EQ.0 .OR. NH.EQ.0 )
     $   RETURN
*
*     NODE (IAFIRST,JAFIRST) OWNS A(1,1)
*
      HBL = DESCA( MB_ )
      CONTXT = DESCA( CTXT_ )
      LDA = DESCA( LLD_ )
      IAFIRST = DESCA( RSRC_ )
      JAFIRST = DESCA( CSRC_ )
      LDZ = DESCZ( LLD_ )
      CALL BLACS_GRIDINFO( CONTXT, NPROW, NPCOL, MYROW, MYCOL )
      NODE = MYROW*NPCOL + MYCOL
*
*     Neighbouring process coordinates, with wrap-around.  Note that
*     LEFT = MYCOL iff NPCOL = 1 and UP = MYROW iff NPROW = 1; the
*     2x2-mesh case below uses this to detect a one-dimensional grid.
*
      LEFT = MOD( MYCOL+NPCOL-1, NPCOL )
      RIGHT = MOD( MYCOL+1, NPCOL )
      UP = MOD( MYROW+NPROW-1, NPROW )
      DOWN = MOD( MYROW+1, NPROW )
*
*     I1 and I2 are the indices of the first row and last column of A
*     to which transformations must be applied.  Only LTOP (the first
*     row of the vertical slab of A) is referenced by the update code
*     below.
*
      I = IHI
      L = ILO
      IF( WANTT ) THEN
         I1 = 1
         I2 = N
         LTOP = 1
      ELSE
         I1 = L
         I2 = I
         LTOP = L
      END IF
*
*     Copy the diagonal block to local and call LAPACK.
*     T and V are described as NH-by-NH matrices made of a single
*     block located on process (II,JJ), the owner of A(ILO,ILO).
*     Processes outside process row II pass a leading dimension of 1.
*
      CALL INFOG2L( ILO, ILO, DESCA, NPROW, NPCOL, MYROW, MYCOL,
     $     IROW, ICOL, II, JJ )
      IF ( MYROW .EQ. II ) THEN
         CALL DESCINIT( DESCT, NH, NH, NH, NH, II, JJ, CONTXT,
     $        LDT, IERR )
         CALL DESCINIT( DESCV, NH, NH, NH, NH, II, JJ, CONTXT,
     $        LDV, IERR )
      ELSE
         CALL DESCINIT( DESCT, NH, NH, NH, NH, II, JJ, CONTXT,
     $        1, IERR )
         CALL DESCINIT( DESCV, NH, NH, NH, NH, II, JJ, CONTXT,
     $        1, IERR )
      END IF
      CALL PDGEMR2D( NH, NH, A, ILO, ILO, DESCA, T, 1, 1, DESCT,
     $     CONTXT )
      IF ( MYROW .EQ. II .AND. MYCOL .EQ. JJ ) THEN
*
*        The owner computes T = V**T * T * V locally, starting from
*        V = I, and then broadcasts V and INFO to every process.
*
         CALL DLASET( 'All', NH, NH, ZERO, ONE, V, LDV )
         NMIN = ILAENV( 12, 'DLAQR3', 'SV', NH, 1, NH, LWORK )
         IF( NH .GT. NMIN ) THEN
            CALL DLAQR4( .TRUE., .TRUE., NH, 1, NH, T, LDT, WR( ILO ),
     $           WI( ILO ), 1, NH, V, LDV, WORK, LWORK, INFO )
*           Clean up the scratch used by DLAQR4.
*           (Zeroes every entry of T below the first subdiagonal.)
            CALL DLASET( 'L', NH-2, NH-2, ZERO, ZERO, T( 3, 1 ), LDT )
         ELSE
            CALL DLAHQR( .TRUE., .TRUE., NH, 1, NH, T, LDT, WR( ILO ),
     $           WI( ILO ), 1, NH, V, LDV, INFO )
         END IF
         CALL DGEBS2D( CONTXT, 'All', ' ', NH, NH, V, LDV )
         CALL IGEBS2D( CONTXT, 'All', ' ', 1, 1, INFO, 1 )
      ELSE
         CALL DGEBR2D( CONTXT, 'All', ' ', NH, NH, V, LDV, II, JJ )
         CALL IGEBR2D( CONTXT, 'All', ' ', 1, 1, INFO, 1, II, JJ )
      END IF
*
*     Convert a failure index local to the block into a global index.
*
      IF( INFO .NE. 0 ) INFO = INFO+ILO-1
*
*     Copy the local matrix back to the diagonal block.
*
      CALL PDGEMR2D( NH, NH, T, 1, 1, DESCT, A, ILO, ILO, DESCA,
     $     CONTXT )
*
*     Update T and Z.
*
      IF( MOD( ILO-1, HBL )+NH .LE. HBL ) THEN
*
*        Simplest case: the diagonal block is located on one processor.
*        Call DGEMM directly to perform the update.
*
*        HSTEP (VSTEP) is the number of slab columns (rows) whose
*        product with V fits in WORK at once.
*
         HSTEP = LWORK / NH
         VSTEP = HSTEP
*
         IF( WANTT ) THEN
*
*           Update horizontal slab in A.
*           A(ILO:IHI,IHI+1:N) := V**T * A(ILO:IHI,IHI+1:N), done on
*           the local columns ICOL:ICOL1 of the owning process row.
*
            CALL INFOG2L( ILO, I+1, DESCA, NPROW, NPCOL, MYROW,
     $           MYCOL, IROW, ICOL, II, JJ )
            IF( MYROW .EQ. II ) THEN
               ICOL1 = NUMROC( N, HBL, MYCOL, JAFIRST, NPCOL )
               DO 10 KKCOL = ICOL, ICOL1, HSTEP
                  KLN = MIN( HSTEP, ICOL1-KKCOL+1 )
                  CALL DGEMM( 'T', 'N', NH, KLN, NH, ONE, V,
     $                 LDV, A( IROW+(KKCOL-1)*LDA ), LDA, ZERO, WORK,
     $                 NH )
                  CALL DLAMOV( 'A', NH, KLN, WORK, NH,
     $                 A( IROW+(KKCOL-1)*LDA ), LDA )
   10          CONTINUE
            END IF
*
*           Update vertical slab in A.
*           A(LTOP:ILO-1,ILO:IHI) := A(LTOP:ILO-1,ILO:IHI) * V, done
*           on the local rows IROW:IROW1 of the owning process column.
*           IROW1 is decremented when this process does not own
*           global row ILO-1.
*
            CALL INFOG2L( LTOP, ILO, DESCA, NPROW, NPCOL, MYROW,
     $           MYCOL, IROW, ICOL, II, JJ )
            IF( MYCOL .EQ. JJ ) THEN
               CALL INFOG2L( ILO-1, ILO, DESCA, NPROW, NPCOL,
     $              MYROW, MYCOL, IROW1, ICOL1, ITMP1, ITMP2 )
               IF( MYROW .NE. ITMP1 ) IROW1 = IROW1-1
               DO 20 KKROW = IROW, IROW1, VSTEP
                  KLN = MIN( VSTEP, IROW1-KKROW+1 )
                  CALL DGEMM( 'N', 'N', KLN, NH, NH, ONE,
     $                 A( KKROW+(ICOL-1)*LDA ), LDA, V, LDV, ZERO,
     $                 WORK, KLN )
                  CALL DLAMOV( 'A', KLN, NH, WORK, KLN,
     $                 A( KKROW+(ICOL-1)*LDA ), LDA )
   20          CONTINUE
            END IF
         END IF
*
*        Update vertical slab in Z.
*        Z(ILOZ:IHIZ,ILO:IHI) := Z(ILOZ:IHIZ,ILO:IHI) * V.
*
         IF( WANTZ ) THEN
            CALL INFOG2L( ILOZ, ILO, DESCZ, NPROW, NPCOL, MYROW,
     $           MYCOL, IROW, ICOL, II, JJ )
            IF( MYCOL .EQ. JJ ) THEN
               CALL INFOG2L( IHIZ, ILO, DESCZ, NPROW, NPCOL,
     $              MYROW, MYCOL, IROW1, ICOL1, ITMP1, ITMP2 )
               IF( MYROW .NE. ITMP1 ) IROW1 = IROW1-1
               DO 30 KKROW = IROW, IROW1, VSTEP
                  KLN = MIN( VSTEP, IROW1-KKROW+1 )
                  CALL DGEMM( 'N', 'N', KLN, NH, NH, ONE,
     $                 Z( KKROW+(ICOL-1)*LDZ ), LDZ, V, LDV, ZERO,
     $                 WORK, KLN )
                  CALL DLAMOV( 'A', KLN, NH, WORK, KLN,
     $                 Z( KKROW+(ICOL-1)*LDZ ), LDZ )
   30          CONTINUE
            END IF
         END IF
*
      ELSE IF( MOD( ILO-1, HBL )+NH .LE. 2*HBL ) THEN
*
*        More complicated case: the diagonal block lay on a 2x2
*        processor mesh.
*        Call DGEMM locally and communicate by pair.
*
*        D1 is the number of rows/columns of the block that fall in
*        the first distribution block, D2 the number in the second.
*        V is used in the partitioned form
*              ( V11  V12 )   V11 is D1-by-D1,
*              ( V21  V22 )   V22 is D2-by-D2.
*
         D1 = HBL - MOD( ILO-1, HBL )
         D2 = NH - D1
         HSTEP = LWORK / NH
         VSTEP = HSTEP
*
         IF( WANTT ) THEN
*
*           Update horizontal slab in A.
*
            CALL INFOG2L( ILO, I+1, DESCA, NPROW, NPCOL, MYROW,
     $           MYCOL, IROW, ICOL, II, JJ )
            IF( MYROW .EQ. UP ) THEN
*
*              Only one process row (UP wraps around to MYROW), so
*              all NH rows of the slab are local: apply V**T with a
*              single DGEMM.  V is stored with leading dimension LDV
*              (not NH), exactly as in every other reference to V.
*
               IF( MYROW .EQ. II ) THEN
                  ICOL1 = NUMROC( N, HBL, MYCOL, JAFIRST, NPCOL )
                  DO 40 KKCOL = ICOL, ICOL1, HSTEP
                     KLN = MIN( HSTEP, ICOL1-KKCOL+1 )
                     CALL DGEMM( 'T', 'N', NH, KLN, NH, ONE, V,
     $                    LDV, A( IROW+(KKCOL-1)*LDA ), LDA, ZERO,
     $                    WORK, NH )
                     CALL DLAMOV( 'A', NH, KLN, WORK, NH,
     $                    A( IROW+(KKCOL-1)*LDA ), LDA )
   40             CONTINUE
               END IF
            ELSE
               IF( MYROW .EQ. II ) THEN
*
*                 This process holds the first D1 rows of the slab.
*                 It forms V12**T * A1 for the process below, sends
*                 it, receives V21**T * A2 from below, and adds its
*                 own V11**T * A1 before storing the D1 rows.
*
                  ICOL1 = NUMROC( N, HBL, MYCOL, JAFIRST, NPCOL )
                  DO 50 KKCOL = ICOL, ICOL1, HSTEP
                     KLN = MIN( HSTEP, ICOL1-KKCOL+1 )
                     CALL DGEMM( 'T', 'N', D2, KLN, D1, ONE,
     $                    V( 1, D1+1 ), LDV, A( IROW+(KKCOL-1)*LDA ),
     $                    LDA, ZERO, WORK( D1+1 ), NH )
                     CALL DGESD2D( CONTXT, D2, KLN, WORK( D1+1 ),
     $                    NH, DOWN, MYCOL )
                     CALL DGERV2D( CONTXT, D1, KLN, WORK, NH, DOWN,
     $                    MYCOL )
                     CALL DGEMM( 'T', 'N', D1, KLN, D1, ONE,
     $                    V, LDV, A( IROW+(KKCOL-1)*LDA ), LDA, ONE,
     $                    WORK, NH )
                     CALL DLAMOV( 'A', D1, KLN, WORK, NH,
     $                    A( IROW+(KKCOL-1)*LDA ), LDA )
   50             CONTINUE
               ELSE IF( UP .EQ. II ) THEN
*
*                 This process holds the last D2 rows of the slab.
*                 It forms V21**T * A2 for the process above, sends
*                 it, receives V12**T * A1 from above, and adds its
*                 own V22**T * A2 before storing the D2 rows.
*
                  ICOL1 = NUMROC( N, HBL, MYCOL, JAFIRST, NPCOL )
                  DO 60 KKCOL = ICOL, ICOL1, HSTEP
                     KLN = MIN( HSTEP, ICOL1-KKCOL+1 )
                     CALL DGEMM( 'T', 'N', D1, KLN, D2, ONE,
     $                    V( D1+1, 1 ), LDV, A( IROW+(KKCOL-1)*LDA ),
     $                    LDA, ZERO, WORK, NH )
                     CALL DGESD2D( CONTXT, D1, KLN, WORK, NH, UP,
     $                    MYCOL )
                     CALL DGERV2D( CONTXT, D2, KLN, WORK( D1+1 ),
     $                    NH, UP, MYCOL )
                     CALL DGEMM( 'T', 'N', D2, KLN, D2, ONE,
     $                    V( D1+1, D1+1 ), LDV,
     $                    A( IROW+(KKCOL-1)*LDA ), LDA, ONE,
     $                    WORK( D1+1 ), NH )
                     CALL DLAMOV( 'A', D2, KLN, WORK( D1+1 ), NH,
     $                    A( IROW+(KKCOL-1)*LDA ), LDA )
   60             CONTINUE
               END IF
            END IF
*
*           Update vertical slab in A.
*
            CALL INFOG2L( LTOP, ILO, DESCA, NPROW, NPCOL, MYROW,
     $           MYCOL, IROW, ICOL, II, JJ )
            IF( MYCOL .EQ. LEFT ) THEN
*
*              Only one process column: all NH columns are local.
*
               IF( MYCOL .EQ. JJ ) THEN
                  CALL INFOG2L( ILO-1, ILO, DESCA, NPROW, NPCOL,
     $                 MYROW, MYCOL, IROW1, ICOL1, ITMP1, ITMP2 )
                  IF( MYROW .NE. ITMP1 ) IROW1 = IROW1-1
                  DO 70 KKROW = IROW, IROW1, VSTEP
                     KLN = MIN( VSTEP, IROW1-KKROW+1 )
                     CALL DGEMM( 'N', 'N', KLN, NH, NH, ONE,
     $                    A( KKROW+(ICOL-1)*LDA ), LDA, V, LDV,
     $                    ZERO, WORK, KLN )
                     CALL DLAMOV( 'A', KLN, NH, WORK, KLN,
     $                    A( KKROW+(ICOL-1)*LDA ), LDA )
   70             CONTINUE
               END IF
            ELSE
               IF( MYCOL .EQ. JJ ) THEN
*
*                 This process holds the first D1 columns.  It sends
*                 A1 * V12 to the right, receives A2 * V21 from the
*                 right and adds A1 * V11.
*
                  CALL INFOG2L( ILO-1, ILO, DESCA, NPROW, NPCOL,
     $                 MYROW, MYCOL, IROW1, ICOL1, ITMP1, ITMP2 )
                  IF( MYROW .NE. ITMP1 ) IROW1 = IROW1-1
                  DO 80 KKROW = IROW, IROW1, VSTEP
                     KLN = MIN( VSTEP, IROW1-KKROW+1 )
                     CALL DGEMM( 'N', 'N', KLN, D2, D1, ONE,
     $                    A( KKROW+(ICOL-1)*LDA ), LDA, V( 1, D1+1 ),
     $                    LDV, ZERO, WORK( 1+D1*KLN ), KLN )
                     CALL DGESD2D( CONTXT, KLN, D2, WORK( 1+D1*KLN ),
     $                    KLN, MYROW, RIGHT )
                     CALL DGERV2D( CONTXT, KLN, D1, WORK, KLN, MYROW,
     $                    RIGHT )
                     CALL DGEMM( 'N', 'N', KLN, D1, D1, ONE,
     $                    A( KKROW+(ICOL-1)*LDA ), LDA, V, LDV, ONE,
     $                    WORK, KLN )
                     CALL DLAMOV( 'A', KLN, D1, WORK, KLN,
     $                    A( KKROW+(ICOL-1)*LDA ), LDA )
   80             CONTINUE
               ELSE IF ( LEFT .EQ. JJ ) THEN
*
*                 This process holds the last D2 columns.  It sends
*                 A2 * V21 to the left, receives A1 * V12 from the
*                 left and adds A2 * V22.
*
                  CALL INFOG2L( ILO-1, ILO, DESCA, NPROW, NPCOL,
     $                 MYROW, MYCOL, IROW1, ICOL1, ITMP1, ITMP2 )
                  IF( MYROW .NE. ITMP1 ) IROW1 = IROW1-1
                  DO 90 KKROW = IROW, IROW1, VSTEP
                     KLN = MIN( VSTEP, IROW1-KKROW+1 )
                     CALL DGEMM( 'N', 'N', KLN, D1, D2, ONE,
     $                    A( KKROW+(ICOL-1)*LDA ), LDA, V( D1+1, 1 ),
     $                    LDV, ZERO, WORK, KLN )
                     CALL DGESD2D( CONTXT, KLN, D1, WORK, KLN, MYROW,
     $                    LEFT )
                     CALL DGERV2D( CONTXT, KLN, D2, WORK( 1+D1*KLN ),
     $                    KLN, MYROW, LEFT )
                     CALL DGEMM( 'N', 'N', KLN, D2, D2, ONE,
     $                    A( KKROW+(ICOL-1)*LDA ), LDA, V( D1+1, D1+1 ),
     $                    LDV, ONE, WORK( 1+D1*KLN ), KLN )
                     CALL DLAMOV( 'A', KLN, D2, WORK( 1+D1*KLN ), KLN,
     $                    A( KKROW+(ICOL-1)*LDA ), LDA )
   90             CONTINUE
               END IF
            END IF
         END IF
*
*        Update vertical slab in Z.
*        Same scheme as the vertical slab in A, applied to rows
*        ILOZ:IHIZ of Z.
*
         IF( WANTZ ) THEN
            CALL INFOG2L( ILOZ, ILO, DESCZ, NPROW, NPCOL, MYROW,
     $           MYCOL, IROW, ICOL, II, JJ )
            IF( MYCOL .EQ. LEFT ) THEN
               IF( MYCOL .EQ. JJ ) THEN
                  CALL INFOG2L( IHIZ, ILO, DESCZ, NPROW, NPCOL,
     $                 MYROW, MYCOL, IROW1, ICOL1, ITMP1, ITMP2 )
                  IF( MYROW .NE. ITMP1 ) IROW1 = IROW1-1
                  DO 100 KKROW = IROW, IROW1, VSTEP
                     KLN = MIN( VSTEP, IROW1-KKROW+1 )
                     CALL DGEMM( 'N', 'N', KLN, NH, NH, ONE,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ, V, LDV, ZERO,
     $                    WORK, KLN )
                     CALL DLAMOV( 'A', KLN, NH, WORK, KLN,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ )
  100             CONTINUE
               END IF
            ELSE
               IF( MYCOL .EQ. JJ ) THEN
                  CALL INFOG2L( IHIZ, ILO, DESCZ, NPROW, NPCOL,
     $                 MYROW, MYCOL, IROW1, ICOL1, ITMP1, ITMP2 )
                  IF( MYROW .NE. ITMP1 ) IROW1 = IROW1-1
                  DO 110 KKROW = IROW, IROW1, VSTEP
                     KLN = MIN( VSTEP, IROW1-KKROW+1 )
                     CALL DGEMM( 'N', 'N', KLN, D2, D1, ONE,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ, V( 1, D1+1 ),
     $                    LDV, ZERO, WORK( 1+D1*KLN ), KLN )
                     CALL DGESD2D( CONTXT, KLN, D2, WORK( 1+D1*KLN ),
     $                    KLN, MYROW, RIGHT )
                     CALL DGERV2D( CONTXT, KLN, D1, WORK, KLN, MYROW,
     $                    RIGHT )
                     CALL DGEMM( 'N', 'N', KLN, D1, D1, ONE,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ, V, LDV, ONE,
     $                    WORK, KLN )
                     CALL DLAMOV( 'A', KLN, D1, WORK, KLN,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ )
  110             CONTINUE
               ELSE IF( LEFT .EQ. JJ ) THEN
                  CALL INFOG2L( IHIZ, ILO, DESCZ, NPROW, NPCOL,
     $                 MYROW, MYCOL, IROW1, ICOL1, ITMP1, ITMP2 )
                  IF( MYROW .NE. ITMP1 ) IROW1 = IROW1-1
                  DO 120 KKROW = IROW, IROW1, VSTEP
                     KLN = MIN( VSTEP, IROW1-KKROW+1 )
                     CALL DGEMM( 'N', 'N', KLN, D1, D2, ONE,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ, V( D1+1, 1 ),
     $                    LDV, ZERO, WORK, KLN )
                     CALL DGESD2D( CONTXT, KLN, D1, WORK, KLN, MYROW,
     $                    LEFT )
                     CALL DGERV2D( CONTXT, KLN, D2, WORK( 1+D1*KLN ),
     $                    KLN, MYROW, LEFT )
                     CALL DGEMM( 'N', 'N', KLN, D2, D2, ONE,
     $                    Z( KKROW+(ICOL-1)*LDZ ), LDZ,
     $                    V( D1+1, D1+1 ), LDV, ONE, WORK( 1+D1*KLN ),
     $                    KLN )
                     CALL DLAMOV( 'A', KLN, D2, WORK( 1+D1*KLN ),
     $                    KLN, Z( KKROW+(ICOL-1)*LDZ ), LDZ )
  120             CONTINUE
               END IF
            END IF
         END IF
*
      ELSE
*
*        Most complicated case: the diagonal block lay across the border
*        of the processor mesh.
*        Treat V as a distributed matrix and call PDGEMM.
*
*        DESCV is rebuilt so that V is an NH-by-NH single-block matrix
*        with source process (0,0); DESCWH/DESCWV describe WORK as
*        the distributed product buffer with block size LWORK/NH.
*
         HSTEP = LWORK / NH * NPCOL
         VSTEP = LWORK / NH * NPROW
         LLDTMP = NUMROC( NH, NH, MYROW, 0, NPROW )
         LLDTMP = MAX( 1, LLDTMP )
         CALL DESCINIT( DESCV, NH, NH, NH, NH, 0, 0, CONTXT,
     $        LLDTMP, IERR )
         CALL DESCINIT( DESCWH, NH, HSTEP, NH, LWORK / NH, 0, 0,
     $        CONTXT, LLDTMP, IERR )
*
         IF( WANTT ) THEN
*
*           Update horizontal slab in A.
*
            DO 130 KKCOL = I+1, N, HSTEP
               KLN = MIN( HSTEP, N-KKCOL+1 )
               CALL PDGEMM( 'T', 'N', NH, KLN, NH, ONE, V, 1, 1,
     $              DESCV, A, ILO, KKCOL, DESCA, ZERO, WORK, 1, 1,
     $              DESCWH )
               CALL PDGEMR2D( NH, KLN, WORK, 1, 1, DESCWH, A,
     $              ILO, KKCOL, DESCA, CONTXT )
  130       CONTINUE
*
*           Update vertical slab in A.
*
            DO 140 KKROW = LTOP, ILO-1, VSTEP
               KLN = MIN( VSTEP, ILO-KKROW )
               LLDTMP = NUMROC( KLN, LWORK / NH, MYROW, 0, NPROW )
               LLDTMP = MAX( 1, LLDTMP )
               CALL DESCINIT( DESCWV, KLN, NH, LWORK / NH, NH, 0, 0,
     $              CONTXT, LLDTMP, IERR )
               CALL PDGEMM( 'N', 'N', KLN, NH, NH, ONE, A, KKROW,
     $              ILO, DESCA, V, 1, 1, DESCV, ZERO, WORK, 1, 1,
     $              DESCWV )
               CALL PDGEMR2D( KLN, NH, WORK, 1, 1, DESCWV, A, KKROW,
     $              ILO, DESCA, CONTXT )
  140       CONTINUE
         END IF
*
*        Update vertical slab in Z.
*
         IF( WANTZ ) THEN
            DO 150 KKROW = ILOZ, IHIZ, VSTEP
               KLN = MIN( VSTEP, IHIZ-KKROW+1 )
               LLDTMP = NUMROC( KLN, LWORK / NH, MYROW, 0, NPROW )
               LLDTMP = MAX( 1, LLDTMP )
               CALL DESCINIT( DESCWV, KLN, NH, LWORK / NH, NH, 0, 0,
     $              CONTXT, LLDTMP, IERR )
               CALL PDGEMM( 'N', 'N', KLN, NH, NH, ONE, Z, KKROW,
     $              ILO, DESCZ, V, 1, 1, DESCV, ZERO, WORK, 1, 1,
     $              DESCWV )
               CALL PDGEMR2D( KLN, NH, WORK, 1, 1, DESCWV, Z,
     $              KKROW, ILO, DESCZ, CONTXT )
  150       CONTINUE
         END IF
      END IF
*
*     END OF PDLAQR4
*
      END

descinit
subroutine descinit(desc, m, n, mb, nb, irsrc, icsrc, ictxt, lld, info)
Definition descinit.f:3

infog2l
subroutine infog2l(grindx, gcindx, desc, nprow, npcol, myrow, mycol, lrindx, lcindx, rsrc, csrc)
Definition infog2l.f:3

max
#define max(A, B)
Definition pcgemr.c:180

min
#define min(A, B)
Definition pcgemr.c:181

pdlaqr4
subroutine pdlaqr4(wantt, wantz, n, ilo, ihi, a, desca, wr, wi, iloz, ihiz, z, descz, t, ldt, v, ldv, work, lwork, info)
Definition pdlaqr4.f:4