*  d1/d46/pslacp2_8f_source.html

      SUBROUTINE pslacp2( UPLO, M, N, A, IA, JA, DESCA, B, IB, JB,

     $                     DESCB )

*

*  -- ScaLAPACK auxiliary routine (version 2.0.2) --

*     Univ. of Tennessee, Univ. of California Berkeley, Univ. of Colorado Denver

*     May 1 2012

*

*     .. Scalar Arguments ..

      CHARACTER          UPLO

      INTEGER            IA, IB, JA, JB, M, N

*     ..

*     .. Array Arguments ..

      INTEGER            DESCA( * ), DESCB( * )

      REAL               A( * ), B( * )

*     ..

*

*  Purpose

*  =======

*

*  PSLACP2 copies all or part of a distributed matrix A to another

*  distributed matrix B.  No communication is performed, PSLACP2

*  performs a local copy sub( B ) := sub( A ), where sub( A ) denotes

*  A(IA:IA+M-1,JA:JA+N-1) and sub( B ) denotes B(IB:IB+M-1,JB:JB+N-1).

*  PSLACP2 requires that only one dimension of the matrix operands is

*  distributed.

*

*  More precisely, data is only copied when at least one of the

*  following holds (the first one is tested first):

*     N <= NB_A - MOD( JA-1, NB_A ), i.e. the columns of sub( A ) lie

*                                    within a single column block;

*     M <= MB_A - MOD( IA-1, MB_A ), i.e. the rows of sub( A ) lie

*                                    within a single row block.

*  If neither condition holds, the routine returns without copying

*  anything and without reporting an error.

*

*  Notes

*  =====

*

*  Each global data object is described by an associated description

*  vector.  This vector stores the information required to establish

*  the mapping between an object element and its corresponding process

*  and memory location.

*

*  Let A be a generic term for any 2D block cyclically distributed

*  array.

*  Such a global array has an associated description vector DESCA.

*  In the following comments, the character _ should be read as

*  "of the global array".

*

*  NOTATION        STORED IN      EXPLANATION

*  --------------- -------------- --------------------------------------

*  DTYPE_A(global) DESCA( DTYPE_ )The descriptor type.  In this case,

*                                 DTYPE_A = 1.

*  CTXT_A (global) DESCA( CTXT_ ) The BLACS context handle, indicating

*                                 the BLACS process grid A is distribu-

*                                 ted over. The context itself is glo-

*                                 bal, but the handle (the integer

*                                 value) may vary.

*  M_A    (global) DESCA( M_ )    The number of rows in the global

*                                 array A.

*  N_A    (global) DESCA( N_ )    The number of columns in the global

*                                 array A.

*  MB_A   (global) DESCA( MB_ )   The blocking factor used to distribute

*                                 the rows of the array.

*  NB_A   (global) DESCA( NB_ )   The blocking factor used to distribute

*                                 the columns of the array.

*  RSRC_A (global) DESCA( RSRC_ ) The process row over which the first

*                                 row of the array A is distributed.

*  CSRC_A (global) DESCA( CSRC_ ) The process column over which the

*                                 first column of the array A is

*                                 distributed.

*  LLD_A  (local)  DESCA( LLD_ )  The leading dimension of the local

*                                 array.  LLD_A >= MAX(1,LOCr(M_A)).

*

*  Let K be the number of rows or columns of a distributed matrix,

*  and assume that its process grid has dimension p x q.

*  LOCr( K ) denotes the number of elements of K that a process

*  would receive if K were distributed over the p processes of its

*  process column.

*  Similarly, LOCc( K ) denotes the number of elements of K that a

*  process would receive if K were distributed over the q processes of

*  its process row.

*  The values of LOCr() and LOCc() may be determined via a call to the

*  ScaLAPACK tool function, NUMROC:

*          LOCr( M ) = NUMROC( M, MB_A, MYROW, RSRC_A, NPROW ),

*          LOCc( N ) = NUMROC( N, NB_A, MYCOL, CSRC_A, NPCOL ).

*  An upper bound for these quantities may be computed by:

*          LOCr( M ) <= ceil( ceil(M/MB_A)/NPROW )*MB_A

*          LOCc( N ) <= ceil( ceil(N/NB_A)/NPCOL )*NB_A

*

*  Arguments

*  =========

*

*  UPLO    (global input) CHARACTER

*          Specifies the part of the distributed matrix sub( A ) to be

*          copied:

*          = 'U':   Upper triangular part is copied; the strictly

*                   lower triangular part of sub( A ) is not referenced;

*          = 'L':   Lower triangular part is copied; the strictly

*                   upper triangular part of sub( A ) is not referenced;

*          Otherwise:  All of the matrix sub( A ) is copied.

*

*  M       (global input) INTEGER

*          The number of rows to be operated on, i.e. the number of

*          rows of the distributed submatrix sub( A ). M >= 0.

*

*  N       (global input) INTEGER

*          The number of columns to be operated on, i.e. the number of

*          columns of the distributed submatrix sub( A ). N >= 0.

*

*  A       (local input) REAL pointer into the local memory

*          to an array of dimension (LLD_A, LOCc(JA+N-1) ). This array

*          contains the local pieces of the distributed matrix sub( A )

*          to be copied from.

*

*  IA      (global input) INTEGER

*          The row index in the global array A indicating the first

*          row of sub( A ).

*

*  JA      (global input) INTEGER

*          The column index in the global array A indicating the

*          first column of sub( A ).

*

*  DESCA   (global and local input) INTEGER array of dimension DLEN_.

*          The array descriptor for the distributed matrix A.

*

*  B       (local output) REAL pointer into the local memory

*          to an array of dimension (LLD_B, LOCc(JB+N-1) ). This array

*          contains on exit the local pieces of the distributed matrix

*          sub( B ) set as follows:

*

*          if UPLO = 'U', B(IB+i-1,JB+j-1) = A(IA+i-1,JA+j-1),

*                         1<=i<=j, 1<=j<=N;

*          if UPLO = 'L', B(IB+i-1,JB+j-1) = A(IA+i-1,JA+j-1),

*                         j<=i<=M, 1<=j<=N;

*          otherwise,     B(IB+i-1,JB+j-1) = A(IA+i-1,JA+j-1),

*                         1<=i<=M, 1<=j<=N.

*

*  IB      (global input) INTEGER

*          The row index in the global array B indicating the first

*          row of sub( B ).

*

*  JB      (global input) INTEGER

*          The column index in the global array B indicating the

*          first column of sub( B ).

*

*  DESCB   (global and local input) INTEGER array of dimension DLEN_.

*          The array descriptor for the distributed matrix B.

*          NOTE(review): apart from what INFOG2L reads from it, only

*          DESCB( LLD_ ) is used by this routine; the BLACS context

*          and the blocking factors are taken from DESCA.  This

*          presumably requires B to live on the same process grid and

*          to be blocked/aligned like A -- confirm against callers.

*

*  =====================================================================

*

*     .. Parameters ..

*     Positions of the entries inside a descriptor vector.  Only

*     CTXT_, MB_, NB_ and LLD_ are referenced in this routine.

      INTEGER            BLOCK_CYCLIC_2D, CSRC_, CTXT_, DLEN_, DTYPE_,

     $                   lld_, mb_, m_, nb_, n_, rsrc_

      parameter( block_cyclic_2d = 1, dlen_ = 9, dtype_ = 1,

     $                     ctxt_ = 2, m_ = 3, n_ = 4, mb_ = 5, nb_ = 6,

     $                     rsrc_ = 7, csrc_ = 8, lld_ = 9 )

*     ..

*     .. Local Scalars ..

      INTEGER            HEIGHT, IACOL, IAROW, IBASE, IBCOL, IBROW,

     $                   icoffa, iia, iiaa, iib, iibb, iibega, iibegb,

     $                   iienda, iinxta, iinxtb, ileft, iright, iroffa,

     $                   itop, jja, jjaa, jjb, jjbb, jjbega, jjbegb,

     $                   jjenda, jjnxta, jjnxtb, lda, ldb, mba, mp,

     $                   mpaa, mycol, mydist, myrow, nba, npcol, nprow,

     $                   nq, nqaa, wide

*     ..

*     .. External Subroutines ..

      EXTERNAL           blacs_gridinfo, infog2l, slamov

*     ..

*     .. External Functions ..

      LOGICAL            LSAME

      INTEGER            ICEIL, NUMROC

      EXTERNAL           iceil, lsame, numroc

*     ..

*     .. Intrinsic Functions ..

      INTRINSIC          max, min, mod

*     ..

*     .. Executable Statements ..

*

*     Quick return if there is nothing to copy

*

      IF( m.EQ.0 .OR. n.EQ.0 )

     $   RETURN

*

*     Get grid parameters (from the BLACS context of A only)

*

      CALL blacs_gridinfo( desca( ctxt_ ), nprow, npcol, myrow, mycol )

*

*     Local starting indices (IIA,JJA) and (IIB,JJB) of sub( A ) and

*     sub( B ), and the process coordinates (IAROW,IACOL) and

*     (IBROW,IBCOL) that go with them.  IBROW and IBCOL are not used

*     afterwards: ownership tests below rely on IAROW/IACOL only.

*

      CALL infog2l( ia, ja, desca, nprow, npcol, myrow, mycol, iia, jja,

     $              iarow, iacol )

      CALL infog2l( ib, jb, descb, nprow, npcol, myrow, mycol, iib, jjb,

     $              ibrow, ibcol )

*

*     IROFFA and ICOFFA are the offsets of row IA and column JA inside

*     their row block (size MBA) and column block (size NBA) of A.

*

      mba    = desca( mb_ )

      nba    = desca( nb_ )

      lda    = desca( lld_ )

      iroffa = mod( ia-1, mba )

      icoffa = mod( ja-1, nba )

      ldb    = descb( lld_ )

*

      IF( n.LE.( nba-icoffa ) ) THEN

*

*        It is assumed that the local columns JJA:JJA+N-1 of the matrix

*        A are in the same process column (IACOL).

*

*                         N

*                JJA             JJA+N-1

*         /      ---------------------    \

*   IROFFA|      |                   |    |

*         \      |...................|    |          ( IAROW )

*           IIA  |x                  |    |   MBA = DESCA( MB_ )

*                | x                 |    |

*                |--x----------------|    /

*                |   x               |

*                |    x              |        ITOP

*                |     x             |          |

*                |      x            |      /-------\

*                |-------x-----------|      |-------x-----------|

*                |        x          |      |        x          |

*                |         x         |      |         x         |

*                |          x        |      |          x        |

*                |           x       |      |           x       |

*                |------------x------|      |------------x------|

*                |             x     |      \____________/

*                |              x    |            |

*                |               x   |          IBASE

*                |                x  |

*                |-----------------x-|          Local picture

*                |                  x|

*                |                   |

*                |                   |

*                |                   |

*                |-------------------|

*                |                   |

*                .                   .

*                .                   .

*                .      (IACOL)      .

*

*        Only the processes of column IACOL take part in the copy.

*

         IF( mycol.EQ.iacol ) THEN

*

*           MP = number of local rows of sub( A ).  NUMROC is called

*           with M+IROFFA rows, so on process row IAROW the IROFFA

*           rows counted in front of IA are subtracted again.

*

            mp = numroc( m+iroffa, mba, myrow, iarow, nprow )

            IF( mp.LE.0 )

     $         RETURN

            IF( myrow.EQ.iarow )

     $         mp = mp - iroffa

*

*           MYDIST = distance, in process rows, from IAROW to MYROW.

*           ITOP = MYDIST*MBA-IROFFA is used below as the offset

*           (relative to JJA/JJB) of the column at which the diagonal

*           of sub( A ) enters the current local row block; it is

*           advanced by NPROW*MBA for every further local block.

*

            mydist = mod( myrow-iarow+nprow, nprow )

            itop   = mydist * mba - iroffa

*

            IF( lsame( uplo, 'U' ) ) THEN

*

*              Upper case.  IIBEGA:IINXTA are the local rows of A in

*              the current row block (IIENDA is the last local row of

*              sub( A )); IIBEGB:IINXTB are the matching rows of B.

*

               itop   = max( 0, itop )

               iibega = iia

               iienda = iia + mp - 1

               iinxta = min( iceil( iibega, mba ) * mba, iienda )

               iibegb = iib

               iinxtb = iibegb + iinxta - iibega

*

*              For every local row block, copy with UPLO the last

*              N-ITOP columns of that block, then move to the next

*              block.  The loop ends as soon as ITOP >= N.

*

   10          CONTINUE

               IF( ( n-itop ).GT.0 ) THEN

                  CALL slamov( uplo, iinxta-iibega+1, n-itop,

     $                         a( iibega+(jja+itop-1)*lda ), lda,

     $                         b( iibegb+(jjb+itop-1)*ldb ), ldb )

                  mydist = mydist + nprow

                  itop   = mydist * mba - iroffa

                  iibega = iinxta + 1

                  iinxta = min( iinxta+mba, iienda )

                  iibegb = iinxtb + 1

                  iinxtb = iibegb + iinxta - iibega

                  GO TO 10

               END IF

*

            ELSE IF( lsame( uplo, 'L' ) ) THEN

*

*              Lower case.  (IIAA,JJAA) and (IIBB,JJBB) are running

*              local positions in A and B, MPAA the number of local

*              rows still to be handled.  ITOP and IBASE (both clamped

*              to N) delimit the columns crossed by the diagonal in

*              the current row block, see the local picture above.

*

               mpaa  = mp

               iiaa  = iia

               jjaa  = jja

               iibb  = iib

               jjbb  = jjb

               ibase = min( itop + mba, n )

               itop  = min( max( 0, itop ), n )

*

*              For every local row block: the ITOP-JJAA+JJA columns

*              starting at JJAA are copied in full for the MPAA

*              remaining rows, then the HEIGHT columns starting at

*              offset ITOP are copied with UPLO.  Afterwards HEIGHT

*              rows are skipped and JJAA is moved to offset IBASE.

*              The loop ends once JJAA has passed column JJA+N-1.

*

   20          CONTINUE

               IF( jjaa.LE.( jja+n-1 ) ) THEN

                  height = ibase - itop

                  CALL slamov( 'All', mpaa, itop-jjaa+jja,

     $                         a( iiaa+(jjaa-1)*lda ), lda,

     $                         b( iibb+(jjbb-1)*ldb ), ldb )

                  CALL slamov( uplo, mpaa, height,

     $                         a( iiaa+(jja+itop-1)*lda ), lda,

     $                         b( iibb+(jjb+itop-1)*ldb ), ldb )

                  mpaa   = max( 0, mpaa - height )

                  iiaa   = iiaa + height

                  jjaa   = jja  + ibase

                  iibb   = iibb + height

                  jjbb   = jjb  + ibase

                  mydist = mydist + nprow

                  itop   = mydist * mba - iroffa

                  ibase  = min( itop + mba, n )

                  itop   = min( itop, n )

                  GO TO 20

               END IF

*

            ELSE

*

*              Full copy of the MP local rows and N columns

*

               CALL slamov( 'All', mp, n, a( iia+(jja-1)*lda ),

     $                      lda, b( iib+(jjb-1)*ldb ), ldb )

*

            END IF

*

         END IF

*

      ELSE IF( m.LE.( mba-iroffa ) ) THEN

*

*        It is assumed that the local rows IIA:IIA+M-1 of the matrix A

*        are in the same process row (IAROW).

*

*            ICOFFA

*             / \JJA

*        IIA  ------------------ ....            --------

*             | .x  |    |    |                 / |    | \

*             | . x |    |    |            ILEFT| |    | |

*             | .  x     |    |                 | |    | |

*             | .   x    |    |                 \ x    | |

*             | .   |x   |    |                   |x   | | IRIGHT

*             | .   | x  |    |                   | x  | |

*    (IAROW)  | .   |  x |    |                   |  x | |

*             | .   |   x|    |                   |   x| |

*             | .   |    x    |                   |    x /

*             | .   |    |x   |                   |    |

*             | .   |    | x  |                   |    |

*             | .   |    |  x |                   |    |

*             | .   |    |   x|                   |    |

*    IIA+M-1  ------------------ ....            -------

*              NB_A

*             (IACOL)                          Local picture

*

*        Only the processes of row IAROW take part in the copy.

*

         IF( myrow.EQ.iarow ) THEN

*

*           NQ = number of local columns of sub( A ).  NUMROC is

*           called with N+ICOFFA columns, so on process column IACOL

*           the ICOFFA columns counted in front of JA are subtracted

*           again.

*

            nq = numroc( n+icoffa, nba, mycol, iacol, npcol )

            IF( nq.LE.0 )

     $         RETURN

            IF( mycol.EQ.iacol )

     $         nq = nq - icoffa

*

*           MYDIST = distance, in process columns, from IACOL to

*           MYCOL.  ILEFT = MYDIST*NBA-ICOFFA is used below as the

*           offset (relative to IIA/IIB) of the row at which the

*           diagonal of sub( A ) enters the current local column

*           block; it is advanced by NPCOL*NBA for every further

*           local block.

*

            mydist = mod( mycol-iacol+npcol, npcol )

            ileft  = mydist * nba - icoffa

*

            IF( lsame( uplo, 'L' ) ) THEN

*

*              Lower case.  JJBEGA:JJNXTA are the local columns of A

*              in the current column block (JJENDA is the last local

*              column of sub( A )); JJBEGB:JJNXTB are the matching

*              columns of B.

*

               ileft  = max( 0, ileft )

               jjbega = jja

               jjenda = jja + nq - 1

               jjnxta = min( iceil( jjbega, nba ) * nba, jjenda )

               jjbegb = jjb

               jjnxtb = jjbegb + jjnxta - jjbega

*

*              For every local column block, copy with UPLO the last

*              M-ILEFT rows of that block, then move to the next

*              block.  The loop ends as soon as ILEFT >= M.

*

   30          CONTINUE

               IF( ( m-ileft ).GT.0 ) THEN

                  CALL slamov( uplo, m-ileft, jjnxta-jjbega+1,

     $                         a( iia+ileft+(jjbega-1)*lda ), lda,

     $                         b( iib+ileft+(jjbegb-1)*ldb ), ldb )

                  mydist = mydist + npcol

                  ileft  = mydist * nba - icoffa

                  jjbega = jjnxta +1

                  jjnxta = min( jjnxta+nba, jjenda )

                  jjbegb = jjnxtb +1

                  jjnxtb = jjbegb + jjnxta - jjbega

                  GO TO 30

               END IF

*

            ELSE IF( lsame( uplo, 'U' ) ) THEN

*

*              Upper case.  (IIAA,JJAA) and (IIBB,JJBB) are running

*              local positions in A and B, NQAA the number of local

*              columns still to be handled.  ILEFT and IRIGHT (both

*              clamped to M) delimit the rows crossed by the diagonal

*              in the current column block, see the local picture

*              above.

*

               nqaa   = nq

               iiaa   = iia

               jjaa   = jja

               iibb   = iib

               jjbb   = jjb

               iright = min( ileft + nba, m )

               ileft  = min( max( 0, ileft ), m )

*

*              For every local column block: the ILEFT-IIAA+IIA rows

*              starting at IIAA are copied in full for the NQAA

*              remaining columns, then the WIDE rows starting at

*              offset ILEFT are copied with UPLO.  Afterwards WIDE

*              columns are skipped and IIAA is moved to offset IRIGHT.

*              The loop ends once IIAA has passed row IIA+M-1.

*

   40          CONTINUE

               IF( iiaa.LE.( iia+m-1 ) ) THEN

                  wide = iright - ileft

                  CALL slamov( 'All', ileft-iiaa+iia, nqaa,

     $                         a( iiaa+(jjaa-1)*lda ), lda,

     $                         b( iibb+(jjbb-1)*ldb ), ldb )

                  CALL slamov( uplo, wide, nqaa,

     $                         a( iia+ileft+(jjaa-1)*lda ), lda,

     $                         b( iib+ileft+(jjbb-1)*ldb ), ldb )

                  nqaa   = max( 0, nqaa - wide )

                  iiaa   = iia  + iright

                  jjaa   = jjaa + wide

                  iibb   = iib  + iright

                  jjbb   = jjbb + wide

                  mydist = mydist + npcol

                  ileft  = mydist * nba - icoffa

                  iright = min( ileft + nba, m )

                  ileft  = min( ileft, m )

                  GO TO 40

               END IF

*

            ELSE

*

*              Full copy of the M rows and NQ local columns

*

               CALL slamov( 'All', m, nq, a( iia+(jja-1)*lda ),

     $                      lda, b( iib+(jjb-1)*ldb ), ldb )

*

            END IF

*

         END IF

*

*     Neither dimension of sub( A ) fits in a single block: nothing

*     is copied in that case.

*

      END IF

*

      RETURN

*

*     End of PSLACP2

*

      END