*  d0/d17/pblastim_8f_source.html

      SUBROUTINE pvdimchk( ICTXT, NOUT, N, MATRIX, IX, JX, DESCX, INCX,
     $                     INFO )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      CHARACTER*1        MATRIX
      INTEGER            ICTXT, INCX, INFO, IX, JX, N, NOUT
*     ..
*     .. Array Arguments ..
      INTEGER            DESCX( * )
*     ..
*
*  Purpose
*  =======
*
*  PVDIMCHK validates the test dimensions of the N-entry vector
*  sub( X ) that starts at X( IX, JX ) against the global sizes held
*  in DESCX.  When a parameter is invalid or the parameters disagree,
*  a short diagnostic is printed and INFO is returned non-zero.
*
*  The checks performed are:
*
*     N < 0    always an error.
*     N = 0    DESCX( M_ ) and DESCX( N_ ) must be non-negative.
*     N > 0    IX <= DESCX( M_ ) and JX <= DESCX( N_ ), and moreover
*              if INCX = DESCX( M_ ):  JX+N-1 <= DESCX( N_ ),
*              else if INCX = 1     :  IX+N-1 <= DESCX( M_ ).
*
*  Notes
*  =====
*
*  Every 2D block-cyclicly distributed matrix comes with a description
*  vector holding what is needed to map a matrix entry to its owning
*  process and memory location.  Below, the character _ reads "of the
*  distributed matrix"; A stands for any such matrix and DESCA for its
*  description vector:
*
*  NOTATION         STORED IN       EXPLANATION
*  ---------------- --------------- ------------------------------------
*  DTYPE_A (global) DESCA( DTYPE_ ) Descriptor type.
*  CTXT_A  (global) DESCA( CTXT_  ) BLACS context handle of the NPROW x
*                                   NPCOL process grid A is distributed
*                                   over.  The context is global, the
*                                   handle (integer value) may vary.
*  M_A     (global) DESCA( M_     ) Number of rows of A, M_A >= 0.
*  N_A     (global) DESCA( N_     ) Number of columns of A, N_A >= 0.
*  IMB_A   (global) DESCA( IMB_   ) Number of rows of the upper left
*                                   block of A, IMB_A > 0.
*  INB_A   (global) DESCA( INB_   ) Number of columns of the upper left
*                                   block of A, INB_A > 0.
*  MB_A    (global) DESCA( MB_    ) Blocking factor distributing the
*                                   last M_A-IMB_A rows, MB_A > 0.
*  NB_A    (global) DESCA( NB_    ) Blocking factor distributing the
*                                   last N_A-INB_A columns, NB_A > 0.
*  RSRC_A  (global) DESCA( RSRC_  ) Process row over which the first
*                                   row of A is distributed,
*                                   NPROW > RSRC_A >= 0.
*  CSRC_A  (global) DESCA( CSRC_  ) Process column over which the first
*                                   column of A is distributed,
*                                   NPCOL > CSRC_A >= 0.
*  LLD_A   (local)  DESCA( LLD_   ) Leading dimension of the local
*                                   array storing the local blocks:
*                                   IF( Lc( 1, N_A ) > 0 )
*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )
*                                   ELSE
*                                      LLD_A >= 1.
*
*  Lr( IA, K ) is the number of rows the process of row coordinate
*  MYROW ( 0 <= MYROW < NPROW ) would receive if the K rows
*  A( IA:IA+K-1, : ) were distributed over NPROW processes.  Likewise
*  Lc( JA, K ) is the number of columns the process MYCOL
*  ( 0 <= MYCOL < NPCOL ) would receive if the K columns
*  A( :, JA:JA+K-1 ) were distributed over NPCOL processes.  Both may
*  be determined via the function PB_NUMROC:
*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )
*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )
*
*  Arguments
*  =========
*
*  ICTXT   (local input) INTEGER
*          BLACS context handle indicating the global context of the
*          operation.  The context itself is global, the value of
*          ICTXT is local.
*
*  NOUT    (global input) INTEGER
*          Unit number for the output file: 6 is the screen, 0 is
*          stderr.  NOUT is only defined for process 0.
*
*  N       (global input) INTEGER
*          Length of sub( X ) used in the range checks.  A negative
*          value is reported as an error.
*
*  MATRIX  (global input) CHARACTER*1
*          One character identifier of the matrix, echoed in the
*          diagnostics.
*
*  IX      (global input) INTEGER
*          Global row index of X pointing to the beginning of
*          sub( X ).
*
*  JX      (global input) INTEGER
*          Global column index of X pointing to the beginning of
*          sub( X ).
*
*  DESCX   (global and local input) INTEGER array
*          Array descriptor of dimension DLEN_ for the matrix X.  Only
*          the entries M_ and N_ are read here.
*
*  INCX    (global input) INTEGER
*          Global increment for the elements of X.  Only 1 and M_X are
*          supported in this version; INCX must not be zero.  Here,
*          INCX = DESCX( M_ ) selects the column-extent check and
*          INCX = 1 the row-extent check.
*
*  INFO    (global output) INTEGER
*          On exit, zero when no error has been detected, non-zero
*          otherwise.  The value returned is the result of combining
*          the per-process flags with IGSUM2D.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            BLOCK_CYCLIC_2D_INB, DLEN_
      INTEGER            DTYPE_, CTXT_, M_, N_, IMB_, INB_, MB_, NB_
      INTEGER            RSRC_, CSRC_, LLD_
      PARAMETER          ( BLOCK_CYCLIC_2D_INB = 2, DLEN_ = 11 )
      PARAMETER          ( DTYPE_ = 1, CTXT_ = 2, M_ = 3, N_ = 4 )
      PARAMETER          ( IMB_ = 5, INB_ = 6, MB_ = 7, NB_ = 8 )
      PARAMETER          ( RSRC_ = 9, CSRC_ = 10, LLD_ = 11 )
*     ..
*     .. Local Scalars ..
      INTEGER            MYCOL, MYROW, NPCOL, NPROW
*     ..
*     .. External Subroutines ..
      EXTERNAL           BLACS_GRIDINFO, IGSUM2D
*     ..
*     .. Executable Statements ..
*
      INFO = 0
      CALL BLACS_GRIDINFO( ICTXT, NPROW, NPCOL, MYROW, MYCOL )
*
      IF( N.LT.0 ) THEN
*
*        A negative length is never acceptable
*
         INFO = 1
*
      ELSE IF( N.EQ.0 ) THEN
*
*        Empty vector: only the global sizes are looked at
*
         IF( DESCX( M_ ).LT.0 .OR. DESCX( N_ ).LT.0 )
     $      INFO = 1
*
      ELSE IF( INCX.EQ.DESCX( M_ ) ) THEN
*
*        INCX = M_X: the N entries must fit in columns JX:JX+N-1
*
         IF( DESCX( N_ ).LT.( JX+N-1 ) .OR. IX.GT.DESCX( M_ ) .OR.
     $       JX.GT.DESCX( N_ ) )
     $      INFO = 1
*
      ELSE IF( INCX.EQ.1 ) THEN
*
*        INCX = 1 (and M_X is not 1): the N entries must fit in rows
*        IX:IX+N-1
*
         IF( DESCX( M_ ).LT.( IX+N-1 ) .OR. IX.GT.DESCX( M_ ) .OR.
     $       JX.GT.DESCX( N_ ) )
     $      INFO = 1
*
      ELSE
*
*        Any other increment: only the starting entry is checked
*
         IF( IX.GT.DESCX( M_ ) .OR. JX.GT.DESCX( N_ ) )
     $      INFO = 1
*
      END IF
*
*     Check all processes for an error
*
      CALL IGSUM2D( ICTXT, 'All', ' ', 1, 1, INFO, 1, -1, 0 )
*
*     Only the process of coordinates (0,0) prints the diagnostic
*
      IF( INFO.NE.0 .AND. MYROW.EQ.0 .AND. MYCOL.EQ.0 ) THEN
         WRITE( NOUT, FMT = 9999 ) MATRIX
         WRITE( NOUT, FMT = 9998 ) N, MATRIX, IX, MATRIX, JX, MATRIX,
     $                             INCX
         WRITE( NOUT, FMT = 9997 ) MATRIX, DESCX( M_ ), MATRIX,
     $                             DESCX( N_ )
         WRITE( NOUT, FMT = * )
      END IF
*
 9999 FORMAT( 'Incompatible arguments for matrix ', A1, ':' )
 9998 FORMAT( 'N = ', I6, ', I', A1, ' = ', I6, ', J', A1, ' = ',
     $        I6, ',INC', A1, ' = ', I6 )
 9997 FORMAT( 'DESC', A1, '( M_ ) = ', I6, ', DESC', A1, '( N_ ) = ',
     $        I6, '.' )
*
      RETURN
*
*     End of PVDIMCHK
*
      END


      SUBROUTINE pmdimchk( ICTXT, NOUT, M, N, MATRIX, IA, JA, DESCA,
     $                     INFO )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      CHARACTER*1        MATRIX
      INTEGER            ICTXT, INFO, IA, JA, M, N, NOUT
*     ..
*     .. Array Arguments ..
      INTEGER            DESCA( * )
*     ..
*
*  Purpose
*  =======
*
*  PMDIMCHK validates the test dimensions of the M-by-N submatrix
*  sub( A ) that starts at A( IA, JA ) against the global sizes held
*  in DESCA.  When a parameter is invalid or the parameters disagree,
*  a short diagnostic is printed and INFO is returned non-zero.
*
*  The checks performed are:
*
*     M < 0 or N < 0    always an error.
*     M = 0 or N = 0    DESCA( M_ ) and DESCA( N_ ) must be
*                       non-negative.
*     otherwise         IA+M-1 <= DESCA( M_ ) and
*                       JA+N-1 <= DESCA( N_ ).
*
*  Notes
*  =====
*
*  Every 2D block-cyclicly distributed matrix comes with a description
*  vector holding what is needed to map a matrix entry to its owning
*  process and memory location.  Below, the character _ reads "of the
*  distributed matrix"; A stands for any such matrix and DESCA for its
*  description vector:
*
*  NOTATION         STORED IN       EXPLANATION
*  ---------------- --------------- ------------------------------------
*  DTYPE_A (global) DESCA( DTYPE_ ) Descriptor type.
*  CTXT_A  (global) DESCA( CTXT_  ) BLACS context handle of the NPROW x
*                                   NPCOL process grid A is distributed
*                                   over.  The context is global, the
*                                   handle (integer value) may vary.
*  M_A     (global) DESCA( M_     ) Number of rows of A, M_A >= 0.
*  N_A     (global) DESCA( N_     ) Number of columns of A, N_A >= 0.
*  IMB_A   (global) DESCA( IMB_   ) Number of rows of the upper left
*                                   block of A, IMB_A > 0.
*  INB_A   (global) DESCA( INB_   ) Number of columns of the upper left
*                                   block of A, INB_A > 0.
*  MB_A    (global) DESCA( MB_    ) Blocking factor distributing the
*                                   last M_A-IMB_A rows, MB_A > 0.
*  NB_A    (global) DESCA( NB_    ) Blocking factor distributing the
*                                   last N_A-INB_A columns, NB_A > 0.
*  RSRC_A  (global) DESCA( RSRC_  ) Process row over which the first
*                                   row of A is distributed,
*                                   NPROW > RSRC_A >= 0.
*  CSRC_A  (global) DESCA( CSRC_  ) Process column over which the first
*                                   column of A is distributed,
*                                   NPCOL > CSRC_A >= 0.
*  LLD_A   (local)  DESCA( LLD_   ) Leading dimension of the local
*                                   array storing the local blocks:
*                                   IF( Lc( 1, N_A ) > 0 )
*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )
*                                   ELSE
*                                      LLD_A >= 1.
*
*  Lr( IA, K ) is the number of rows the process of row coordinate
*  MYROW ( 0 <= MYROW < NPROW ) would receive if the K rows
*  A( IA:IA+K-1, : ) were distributed over NPROW processes.  Likewise
*  Lc( JA, K ) is the number of columns the process MYCOL
*  ( 0 <= MYCOL < NPCOL ) would receive if the K columns
*  A( :, JA:JA+K-1 ) were distributed over NPCOL processes.  Both may
*  be determined via the function PB_NUMROC:
*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )
*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )
*
*  Arguments
*  =========
*
*  ICTXT   (local input) INTEGER
*          BLACS context handle indicating the global context of the
*          operation.  The context itself is global, the value of
*          ICTXT is local.
*
*  NOUT    (global input) INTEGER
*          Unit number for the output file: 6 is the screen, 0 is
*          stderr.  NOUT is only defined for process 0.
*
*  M       (global input) INTEGER
*          Number of rows of sub( A ) used in the range checks.  A
*          negative value is reported as an error.
*
*  N       (global input) INTEGER
*          Number of columns of sub( A ) used in the range checks.  A
*          negative value is reported as an error.
*
*  MATRIX  (global input) CHARACTER*1
*          One character identifier of the matrix, echoed in the
*          diagnostics.
*
*  IA      (global input) INTEGER
*          Global row index of A pointing to the beginning of
*          sub( A ).
*
*  JA      (global input) INTEGER
*          Global column index of A pointing to the beginning of
*          sub( A ).
*
*  DESCA   (global and local input) INTEGER array
*          Array descriptor of dimension DLEN_ for the matrix A.  Only
*          the entries M_ and N_ are read here.
*
*  INFO    (global output) INTEGER
*          On exit, zero when no error has been detected, non-zero
*          otherwise.  The value returned is the result of combining
*          the per-process flags with IGSUM2D.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            BLOCK_CYCLIC_2D_INB, DLEN_
      INTEGER            DTYPE_, CTXT_, M_, N_, IMB_, INB_, MB_, NB_
      INTEGER            RSRC_, CSRC_, LLD_
      PARAMETER          ( BLOCK_CYCLIC_2D_INB = 2, DLEN_ = 11 )
      PARAMETER          ( DTYPE_ = 1, CTXT_ = 2, M_ = 3, N_ = 4 )
      PARAMETER          ( IMB_ = 5, INB_ = 6, MB_ = 7, NB_ = 8 )
      PARAMETER          ( RSRC_ = 9, CSRC_ = 10, LLD_ = 11 )
*     ..
*     .. Local Scalars ..
      INTEGER            MYCOL, MYROW, NPCOL, NPROW
*     ..
*     .. External Subroutines ..
      EXTERNAL           BLACS_GRIDINFO, IGSUM2D
*     ..
*     .. Executable Statements ..
*
      INFO = 0
      CALL BLACS_GRIDINFO( ICTXT, NPROW, NPCOL, MYROW, MYCOL )
*
      IF( M.LT.0 .OR. N.LT.0 ) THEN
*
*        A negative extent is never acceptable
*
         INFO = 1
*
      ELSE IF( M.EQ.0 .OR. N.EQ.0 ) THEN
*
*        Empty submatrix: only the global sizes are looked at
*
         IF( DESCA( M_ ).LT.0 .OR. DESCA( N_ ).LT.0 )
     $      INFO = 1
*
      ELSE
*
*        sub( A ) must not extend past the last row or column of A
*
         IF( DESCA( M_ ).LT.( IA+M-1 ) .OR.
     $       DESCA( N_ ).LT.( JA+N-1 ) )
     $      INFO = 1
*
      END IF
*
*     Check all processes for an error
*
      CALL IGSUM2D( ICTXT, 'All', ' ', 1, 1, INFO, 1, -1, 0 )
*
*     Only the process of coordinates (0,0) prints the diagnostic
*
      IF( INFO.NE.0 .AND. MYROW.EQ.0 .AND. MYCOL.EQ.0 ) THEN
         WRITE( NOUT, FMT = 9999 ) MATRIX
         WRITE( NOUT, FMT = 9998 ) M, N, MATRIX, IA, MATRIX, JA
         WRITE( NOUT, FMT = 9997 ) MATRIX, DESCA( M_ ), MATRIX,
     $                             DESCA( N_ )
         WRITE( NOUT, FMT = * )
      END IF
*
 9999 FORMAT( 'Incompatible arguments for matrix ', A1, ':' )
 9998 FORMAT( 'M = ', I6, ', N = ', I6, ', I', A1, ' = ', I6,
     $        ', J', A1, ' = ', I6 )
 9997 FORMAT( 'DESC', A1, '( M_ ) = ', I6, ', DESC', A1, '( N_ ) = ',
     $        I6, '.' )
*
      RETURN
*
*     End of PMDIMCHK
*
      END


      SUBROUTINE pvdescchk( ICTXT, NOUT, MATRIX, DESCX, DTX, MX, NX,
     $                      IMBX, INBX, MBX, NBX, RSRCX, CSRCX, INCX,
     $                      MPX, NQX, IPREX, IMIDX, IPOSTX, IGAP,
     $                      GAPMUL, INFO )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      CHARACTER*1        MATRIX
      INTEGER            CSRCX, DTX, GAPMUL, ICTXT, IGAP, IMBX, IMIDX,
     $                   INBX, INCX, INFO, IPOSTX, IPREX, MBX, MPX, MX,
     $                   NBX, NOUT, NQX, NX, RSRCX
*     ..
*     .. Array Arguments ..
      INTEGER            DESCX( * )
*     ..
*
*  Purpose
*  =======
*
*  PVDESCCHK checks the validity of the input test parameters of a
*  distributed vector operand and, when they are all valid, computes
*  MPX, NQX and the guard zone sizes and calls PB_DESCINIT2 to set the
*  descriptor DESCX.  For each invalid parameter found, an error
*  message is displayed and a non-zero error code is returned in INFO.
*
*  The local outputs MPX, NQX, IPREX, IMIDX and IPOSTX, as well as
*  DESCX, are left untouched when the parameter validation fails.
*
*  Notes
*  =====
*
*  Every 2D block-cyclicly distributed matrix comes with a description
*  vector holding what is needed to map a matrix entry to its owning
*  process and memory location.  Below, the character _ reads "of the
*  distributed matrix"; A stands for any such matrix and DESCA for its
*  description vector:
*
*  NOTATION         STORED IN       EXPLANATION
*  ---------------- --------------- ------------------------------------
*  DTYPE_A (global) DESCA( DTYPE_ ) Descriptor type.
*  CTXT_A  (global) DESCA( CTXT_  ) BLACS context handle of the NPROW x
*                                   NPCOL process grid A is distributed
*                                   over.  The context is global, the
*                                   handle (integer value) may vary.
*  M_A     (global) DESCA( M_     ) Number of rows of A, M_A >= 0.
*  N_A     (global) DESCA( N_     ) Number of columns of A, N_A >= 0.
*  IMB_A   (global) DESCA( IMB_   ) Number of rows of the upper left
*                                   block of A, IMB_A > 0.
*  INB_A   (global) DESCA( INB_   ) Number of columns of the upper left
*                                   block of A, INB_A > 0.
*  MB_A    (global) DESCA( MB_    ) Blocking factor distributing the
*                                   last M_A-IMB_A rows, MB_A > 0.
*  NB_A    (global) DESCA( NB_    ) Blocking factor distributing the
*                                   last N_A-INB_A columns, NB_A > 0.
*  RSRC_A  (global) DESCA( RSRC_  ) Process row over which the first
*                                   row of A is distributed,
*                                   NPROW > RSRC_A >= 0.
*  CSRC_A  (global) DESCA( CSRC_  ) Process column over which the first
*                                   column of A is distributed,
*                                   NPCOL > CSRC_A >= 0.
*  LLD_A   (local)  DESCA( LLD_   ) Leading dimension of the local
*                                   array storing the local blocks:
*                                   IF( Lc( 1, N_A ) > 0 )
*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )
*                                   ELSE
*                                      LLD_A >= 1.
*
*  Lr( IA, K ) is the number of rows the process of row coordinate
*  MYROW ( 0 <= MYROW < NPROW ) would receive if the K rows
*  A( IA:IA+K-1, : ) were distributed over NPROW processes.  Likewise
*  Lc( JA, K ) is the number of columns the process MYCOL
*  ( 0 <= MYCOL < NPCOL ) would receive if the K columns
*  A( :, JA:JA+K-1 ) were distributed over NPCOL processes.  Both may
*  be determined via the function PB_NUMROC:
*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )
*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )
*
*  Arguments
*  =========
*
*  ICTXT   (local input) INTEGER
*          BLACS context handle indicating the global context of the
*          operation.  The context itself is global, the value of
*          ICTXT is local.
*
*  NOUT    (global input) INTEGER
*          Unit number for the output file: 6 is the screen, 0 is
*          stderr.  NOUT is only defined for process 0.
*
*  MATRIX  (global input) CHARACTER*1
*          One character identifier of the matrix, echoed in the
*          diagnostics.
*
*  DESCX   (global output) INTEGER array
*          Array of dimension DLEN_.  DESCX is the array descriptor to
*          be set; it is passed to PB_DESCINIT2 once all parameters
*          have been validated.
*
*  DTX     (global input) INTEGER
*          The descriptor type.  In this version, DTX must be
*          BLOCK_CYCLIC_2D_INB (= 2).
*
*  MX      (global input) INTEGER
*          Number of rows in the matrix.  MX must be at least zero.
*
*  NX      (global input) INTEGER
*          Number of columns in the matrix.  NX must be at least zero.
*
*  IMBX    (global input) INTEGER
*          Row blocking factor used to distribute the first IMBX rows
*          of the matrix.  IMBX must be at least one.
*
*  INBX    (global input) INTEGER
*          Column blocking factor used to distribute the first INBX
*          columns of the matrix.  INBX must be at least one.
*
*  MBX     (global input) INTEGER
*          Row blocking factor used to distribute the rows of the
*          matrix.  MBX must be at least one.
*
*  NBX     (global input) INTEGER
*          Column blocking factor used to distribute the columns of
*          the matrix.  NBX must be at least one.
*
*  RSRCX   (global input) INTEGER
*          Process row in which the first row of the matrix resides.
*          When RSRCX is -1, the matrix is row replicated, otherwise
*          RSRCX must be at least zero and strictly less than NPROW.
*
*  CSRCX   (global input) INTEGER
*          Process column in which the first column of the matrix
*          resides.  When CSRCX is -1, the matrix is column replicated,
*          otherwise CSRCX must be at least zero and strictly less
*          than NPCOL.
*
*  INCX    (global input) INTEGER
*          Global vector increment.  INCX must be one or MX.
*
*  MPX     (local output) INTEGER
*          On successful exit, MPX is Lr( 1, MX ).
*
*  NQX     (local output) INTEGER
*          On successful exit, NQX is Lc( 1, NX ).
*
*  IPREX   (local output) INTEGER
*          On successful exit, the size of the guard zone to put
*          before the start of the local padded array, computed as
*          MAX( GAPMUL*NBX, MPX ).
*
*  IMIDX   (local output) INTEGER
*          On successful exit, the ldx-gap of the guard zone to put
*          after each column of the local padded array; set to IGAP.
*
*  IPOSTX  (local output) INTEGER
*          On successful exit, the size of the guard zone to put
*          after the local padded array, computed as
*          MAX( GAPMUL*NBX, NQX ).
*
*  IGAP    (global input) INTEGER
*          Size of the ldx-gap.
*
*  GAPMUL  (global input) INTEGER
*          Constant factor controlling the size of the pre- and post
*          guard zones.
*
*  INFO    (global output) INTEGER
*          On exit, zero when no error has been detected, non-zero
*          otherwise.  The value returned is the result of combining
*          the per-process flags with IGSUM2D.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            BLOCK_CYCLIC_2D_INB, CSRC_, CTXT_, DLEN_,
     $                   DTYPE_, IMB_, INB_, LLD_, MB_, M_, NB_, N_,
     $                   RSRC_
      PARAMETER          ( BLOCK_CYCLIC_2D_INB = 2, DLEN_ = 11,
     $                   DTYPE_ = 1, CTXT_ = 2, M_ = 3, N_ = 4,
     $                   IMB_ = 5, INB_ = 6, MB_ = 7, NB_ = 8,
     $                   RSRC_ = 9, CSRC_ = 10, LLD_ = 11 )
*     ..
*     .. Local Scalars ..
      LOGICAL            IAMROOT
      INTEGER            LLDX, MYCOL, MYROW, NPCOL, NPROW
*     ..
*     .. External Subroutines ..
      EXTERNAL           BLACS_GRIDINFO, IGSUM2D, PB_DESCINIT2
*     ..
*     .. External Functions ..
      INTEGER            PB_NUMROC
      EXTERNAL           PB_NUMROC
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX
*     ..
*     .. Executable Statements ..
*
      INFO = 0
      CALL BLACS_GRIDINFO( ICTXT, NPROW, NPCOL, MYROW, MYCOL )
*
*     Only the process of coordinates (0,0) prints diagnostics
*
      IAMROOT = MYROW.EQ.0 .AND. MYCOL.EQ.0
*
*     Verify descriptor type DTYPE_
*
      IF( DTX.NE.BLOCK_CYCLIC_2D_INB ) THEN
         IF( IAMROOT )
     $      WRITE( NOUT, FMT = 9999 ) MATRIX, 'DTYPE', MATRIX, DTX,
     $                                BLOCK_CYCLIC_2D_INB
         INFO = 1
      END IF
*
*     Verify global matrix dimensions (M_,N_) are correct, i.e. not
*     negative (zero is accepted)
*
      IF( MX.LT.0 ) THEN
         IF( IAMROOT )
     $      WRITE( NOUT, FMT = 9998 ) MATRIX, 'M', MATRIX, MX
         INFO = 1
      ELSE IF( NX.LT.0 ) THEN
         IF( IAMROOT )
     $      WRITE( NOUT, FMT = 9997 ) MATRIX, 'N', MATRIX, NX
         INFO = 1
      END IF
*
*     Verify if blocking factors (IMB_, INB_) are correct
*
      IF( IMBX.LT.1 ) THEN
         IF( IAMROOT )
     $      WRITE( NOUT, FMT = 9996 ) MATRIX, 'IMB', MATRIX, IMBX
         INFO = 1
      ELSE IF( INBX.LT.1 ) THEN
         IF( IAMROOT )
     $      WRITE( NOUT, FMT = 9995 ) MATRIX, 'INB', MATRIX, INBX
         INFO = 1
      END IF
*
*     Verify if blocking factors (MB_, NB_) are correct
*
      IF( MBX.LT.1 ) THEN
         IF( IAMROOT )
     $      WRITE( NOUT, FMT = 9994 ) MATRIX, 'MB', MATRIX, MBX
         INFO = 1
      ELSE IF( NBX.LT.1 ) THEN
         IF( IAMROOT )
     $      WRITE( NOUT, FMT = 9993 ) MATRIX, 'NB', MATRIX, NBX
         INFO = 1
      END IF
*
*     Verify if origin process coordinates (RSRC_, CSRC_) are valid;
*     -1 is accepted and denotes replication
*
      IF( RSRCX.LT.-1 .OR. RSRCX.GE.NPROW ) THEN
         IF( IAMROOT ) THEN
            WRITE( NOUT, FMT = 9992 ) MATRIX
            WRITE( NOUT, FMT = 9990 ) 'RSRC', MATRIX, RSRCX, NPROW
         END IF
         INFO = 1
      ELSE IF( CSRCX.LT.-1 .OR. CSRCX.GE.NPCOL ) THEN
         IF( IAMROOT ) THEN
            WRITE( NOUT, FMT = 9991 ) MATRIX
            WRITE( NOUT, FMT = 9990 ) 'CSRC', MATRIX, CSRCX, NPCOL
         END IF
         INFO = 1
      END IF
*
*     Check input increment value
*
      IF( INCX.NE.1 .AND. INCX.NE.MX ) THEN
         IF( IAMROOT ) THEN
            WRITE( NOUT, FMT = 9989 ) MATRIX
            WRITE( NOUT, FMT = 9988 ) 'INC', MATRIX, INCX, MATRIX, MX
         END IF
         INFO = 1
      END IF
*
*     Check all processes for an error
*
      CALL IGSUM2D( ICTXT, 'All', ' ', 1, 1, INFO, 1, -1, 0 )
*
      IF( INFO.NE.0 ) THEN
*
*        Invalid parameters: report and leave the outputs unset
*
         IF( IAMROOT ) THEN
            WRITE( NOUT, FMT = 9987 ) MATRIX
            WRITE( NOUT, FMT = * )
         END IF
*
      ELSE
*
*        Compute local testing leading dimension
*
         MPX    = PB_NUMROC( MX, 1, IMBX, MBX, MYROW, RSRCX, NPROW )
         NQX    = PB_NUMROC( NX, 1, INBX, NBX, MYCOL, CSRCX, NPCOL )
         IPREX  = MAX( GAPMUL*NBX, MPX )
         IMIDX  = IGAP
         IPOSTX = MAX( GAPMUL*NBX, NQX )
         LLDX   = MAX( 1, MPX ) + IMIDX
*
         CALL PB_DESCINIT2( DESCX, MX, NX, IMBX, INBX, MBX, NBX, RSRCX,
     $                      CSRCX, ICTXT, LLDX, INFO )
*
*        Check all processes for an error
*
         CALL IGSUM2D( ICTXT, 'All', ' ', 1, 1, INFO, 1, -1, 0 )
*
         IF( INFO.NE.0 .AND. IAMROOT ) THEN
            WRITE( NOUT, FMT = 9987 ) MATRIX
            WRITE( NOUT, FMT = * )
         END IF
*
      END IF
*
*     Formats 9998 and 9997 are issued for negative dimensions only,
*     hence the bound they report is 0.
*
 9999 FORMAT( 2X, '>> Invalid matrix ', A1, ' descriptor type ', A5, A1,
     $        ': ', I6, ' should be ', I3, '.' )
 9998 FORMAT( 2X, '>> Invalid matrix ', A1, ' row dimension ', A1, A1,
     $        ': ', I6, ' should be at least 0.' )
 9997 FORMAT( 2X, '>> Invalid matrix ', A1, ' column dimension ', A1,
     $        A1, ': ', I6, ' should be at least 0.' )
 9996 FORMAT( 2X, '>> Invalid matrix ', A1, ' first row block size ',
     $        A3, A1, ': ', I6, ' should be at least 1.' )
 9995 FORMAT( 2X, '>> Invalid matrix ', A1, ' first column block size ',
     $        A3, A1,': ', I6, ' should be at least 1.' )
 9994 FORMAT( 2X, '>> Invalid matrix ', A1, ' row block size ', A2, A1,
     $        ': ', I6, ' should be at least 1.' )
 9993 FORMAT( 2X, '>> Invalid matrix ', A1, ' column block size ', A2,
     $        A1,': ', I6, ' should be at least 1.' )
 9992 FORMAT( 2X, '>> Invalid matrix ', A1, ' row process source:' )
 9991 FORMAT( 2X, '>> Invalid matrix ', A1, ' column process source:' )
 9990 FORMAT( 2X, '>> ', A4, A1, '= ', I6, ' should be >= -1 and < ',
     $        I6, '.' )
 9989 FORMAT( 2X, '>> Invalid vector ', A1, ' increment:' )
 9988 FORMAT( 2X, '>> ', A3, A1, '= ', I6, ' should be 1 or M', A1,
     $        ' = ', I6, '.' )
 9987 FORMAT( 2X, '>> Invalid matrix ', A1, ' descriptor: going on to ',
     $        'next test case.' )
*
      RETURN
*
*     End of PVDESCCHK
*
      END


      SUBROUTINE PMDESCCHK( ICTXT, NOUT, MATRIX, DESCA, DTA, MA, NA,
     $                      IMBA, INBA, MBA, NBA, RSRCA, CSRCA, MPA,
     $                      NQA, IPREA, IMIDA, IPOSTA, IGAP, GAPMUL,
     $                      INFO )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      CHARACTER*1        MATRIX
      INTEGER            CSRCA, DTA, GAPMUL, ICTXT, IGAP, IMBA, IMIDA,
     $                   INBA, INFO, IPOSTA, IPREA, MA, MBA, MPA, NA,
     $                   NBA, NOUT, NQA, RSRCA
*     ..
*     .. Array Arguments ..
      INTEGER            DESCA( * )
*     ..
*
*  Purpose
*  =======
*
*  PMDESCCHK  checks  the validity of the input test parameters and ini-
*  tializes  the  descriptor DESCA and the scalar variables MPA, NQA. In
*  case  of  an  invalid parameter, this routine displays error messages
*  and returns a non-zero error code in INFO.
*
*  Messages are written by the process of coordinates (0,0) only.  When
*  a parameter check fails, DESCA, MPA, NQA, IPREA, IMIDA and IPOSTA are
*  not assigned.  Within each of the pairs (MA,NA), (IMBA,INBA),
*  (MBA,NBA) and (RSRCA,CSRCA) only the first invalid value is reported.
*
*  Notes
*  =====
*
*  A description  vector  is associated with each 2D block-cyclicly dis-
*  tributed matrix.  This  vector  stores  the  information  required to
*  establish the  mapping  between a  matrix entry and its corresponding
*  process and memory location.
*
*  In  the  following  comments,   the character _  should  be  read  as
*  "of  the  distributed  matrix".  Let  A  be a generic term for any 2D
*  block cyclicly distributed matrix.  Its description vector is DESCA:
*
*  NOTATION         STORED IN       EXPLANATION
*  ---------------- --------------- ------------------------------------
*  DTYPE_A (global) DESCA( DTYPE_ ) The descriptor type.
*  CTXT_A  (global) DESCA( CTXT_  ) The BLACS context handle, indicating
*                                   the NPROW x NPCOL BLACS process grid
*                                   A  is distributed over.  The context
*                                   itself  is  global,  but  the handle
*                                   (the integer value) may vary.
*  M_A     (global) DESCA( M_     ) The  number of rows in the distribu-
*                                   ted matrix A, M_A >= 0.
*  N_A     (global) DESCA( N_     ) The number of columns in the distri-
*                                   buted matrix A, N_A >= 0.
*  IMB_A   (global) DESCA( IMB_   ) The number of rows of the upper left
*                                   block of the matrix A, IMB_A > 0.
*  INB_A   (global) DESCA( INB_   ) The  number  of columns of the upper
*                                   left   block   of   the   matrix  A,
*                                   INB_A > 0.
*  MB_A    (global) DESCA( MB_    ) The blocking factor used to  distri-
*                                   bute the last  M_A-IMB_A rows of  A,
*                                   MB_A > 0.
*  NB_A    (global) DESCA( NB_    ) The blocking factor used to  distri-
*                                   bute the last  N_A-INB_A  columns of
*                                   A, NB_A > 0.
*  RSRC_A  (global) DESCA( RSRC_  ) The process row over which the first
*                                   row of the matrix  A is distributed,
*                                   NPROW > RSRC_A >= 0.
*  CSRC_A  (global) DESCA( CSRC_  ) The  process  column  over which the
*                                   first  column of  A  is distributed.
*                                   NPCOL > CSRC_A >= 0.
*  LLD_A   (local)  DESCA( LLD_   ) The  leading  dimension of the local
*                                   array  storing  the  local blocks of
*                                   the distributed matrix A,
*                                   IF( Lc( 1, N_A ) > 0 )
*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )
*                                   ELSE
*                                      LLD_A >= 1.
*
*  Let K be the number of  rows of a matrix A starting at the global in-
*  dex IA,i.e, A( IA:IA+K-1, : ). Lr( IA, K ) denotes the number of rows
*  that the process of row coordinate MYROW ( 0 <= MYROW < NPROW ) would
*  receive if these K rows were distributed over NPROW processes.  If  K
*  is the number of columns of a matrix  A  starting at the global index
*  JA, i.e, A( :, JA:JA+K-1, : ), Lc( JA, K ) denotes the number  of co-
*  lumns that the process MYCOL ( 0 <= MYCOL < NPCOL ) would  receive if
*  these K columns were distributed over NPCOL processes.
*
*  The values of Lr() and Lc() may be determined via a call to the func-
*  tion PB_NUMROC:
*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )
*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )
*
*  Arguments
*  =========
*
*  ICTXT   (local input) INTEGER
*          On entry,  ICTXT  specifies the BLACS context handle, indica-
*          ting the global  context of the operation. The context itself
*          is global, but the value of ICTXT is local.
*
*  NOUT    (global input) INTEGER
*          On entry, NOUT specifies the unit number for the output file.
*          When NOUT is 6, output to screen,  when  NOUT is 0, output to
*          stderr. NOUT is only defined for process 0.
*
*  MATRIX  (global input) CHARACTER*1
*          On entry,  MATRIX  specifies the one character matrix identi-
*          fier.
*
*  DESCA   (global output) INTEGER array
*          On entry, DESCA  is an array of dimension DLEN_. DESCA is the
*          array descriptor to be set.
*
*  DTA     (global input) INTEGER
*          On entry, DTA  specifies  the  descriptor type. In this  ver-
*          sion, DTA must be BLOCK_CYCLIC_2D_INB.
*
*  MA      (global input) INTEGER
*          On entry, MA  specifies the number of rows in the matrix.  MA
*          must be at least zero.
*
*  NA      (global input) INTEGER
*          On  entry,  NA specifies the number of columns in the matrix.
*          NA must be at least zero.
*
*  IMBA    (global input) INTEGER
*          On entry, IMBA specifies the row blocking factor used to dis-
*          tribute  the  first  IMBA rows of the matrix. IMBA must be at
*          least one.
*
*  INBA    (global input) INTEGER
*          On entry,  INBA  specifies the column blocking factor used to
*          distribute  the  first  INBA columns of the matrix. INBA must
*          be at least one.
*
*  MBA     (global input) INTEGER
*          On entry, MBA  specifies the row blocking factor used to dis-
*          tribute the rows of the matrix. MBA must be at least one.
*
*  NBA     (global input) INTEGER
*          On entry, NBA  specifies  the  column blocking factor used to
*          distribute  the  columns  of the matrix. NBA must be at least
*          one.
*
*  RSRCA   (global input) INTEGER
*          On entry, RSRCA  specifies the process row in which the first
*          row  of  the  matrix resides. When RSRCA is -1, the matrix is
*          row replicated,  otherwise  RSRCA  must  be at least zero and
*          strictly less than NPROW.
*
*  CSRCA   (global input) INTEGER
*          On entry,  CSRCA  specifies  the  process column in which the
*          first column of the matrix resides.  When  CSRCA  is -1,  the
*          matrix is column replicated, otherwise CSRCA must be at least
*          zero and strictly less than NPCOL.
*
*  MPA     (local output) INTEGER
*          On exit, MPA is Lr( 1, MA ).
*
*  NQA     (local output) INTEGER
*          On exit, NQA is Lc( 1, NA ).
*
*  IPREA   (local output) INTEGER
*          On exit,  IPREA  specifies  the size of the guard zone to put
*          before the start of the local padded array.
*
*  IMIDA   (local output) INTEGER
*          On exit,  IMIDA  specifies  the  lda-gap of the guard zone to
*          put after each column of the local padded array.
*
*  IPOSTA  (local output) INTEGER
*          On exit,  IPOSTA  specifies the size of the guard zone to put
*          after the local padded array.
*
*  IGAP    (global input) INTEGER
*          On entry, IGAP specifies the size of the lda-gap.
*
*  GAPMUL  (global input) INTEGER
*          On entry,  GAPMUL  is  a constant factor controlling the size
*          of the pre- and post guardzone.
*
*  INFO    (global output) INTEGER
*          On exit,  when  INFO  is  zero,  no  error has been detected,
*          otherwise an error has been detected.  INFO  is combined over
*          the  process  grid  with  IGSUM2D,  so only test it against
*          zero.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            BLOCK_CYCLIC_2D_INB, CSRC_, CTXT_, DLEN_,
     $                   DTYPE_, IMB_, INB_, LLD_, MB_, M_, NB_, N_,
     $                   RSRC_
      PARAMETER          ( BLOCK_CYCLIC_2D_INB = 2, DLEN_ = 11,
     $                   DTYPE_ = 1, CTXT_ = 2, M_ = 3, N_ = 4,
     $                   IMB_ = 5, INB_ = 6, MB_ = 7, NB_ = 8,
     $                   RSRC_ = 9, CSRC_ = 10, LLD_ = 11 )
*     ..
*     .. Local Scalars ..
      INTEGER            LLDA, MYCOL, MYROW, NPCOL, NPROW
*     ..
*     .. External Subroutines ..
      EXTERNAL           BLACS_GRIDINFO, IGSUM2D, PB_DESCINIT2
*     ..
*     .. External Functions ..
      INTEGER            PB_NUMROC
      EXTERNAL           PB_NUMROC
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX
*     ..
*     .. Executable Statements ..
*
      INFO = 0
      CALL BLACS_GRIDINFO( ICTXT, NPROW, NPCOL, MYROW, MYCOL )
*
*     Verify descriptor type DTYPE_
*
      IF( DTA.NE.BLOCK_CYCLIC_2D_INB ) THEN
         IF( MYROW.EQ.0 .AND. MYCOL.EQ.0 )
     $      WRITE( NOUT, FMT = 9999 ) MATRIX, 'DTYPE', MATRIX, DTA,
     $                                BLOCK_CYCLIC_2D_INB
         INFO = 1
      END IF
*
*     Verify global matrix dimensions (M_,N_) are correct.  Zero is a
*     legal dimension; only negative values are rejected.
*
      IF( MA.LT.0 ) THEN
         IF( MYROW.EQ.0 .AND. MYCOL.EQ.0 )
     $      WRITE( NOUT, FMT = 9998 ) MATRIX, 'M', MATRIX, MA
         INFO = 1
      ELSE IF( NA.LT.0 ) THEN
         IF( MYROW.EQ.0 .AND. MYCOL.EQ.0 )
     $      WRITE( NOUT, FMT = 9997 ) MATRIX, 'N', MATRIX, NA
         INFO = 1
      END IF
*
*     Verify if blocking factors (IMB_, INB_) are correct
*
      IF( IMBA.LT.1 ) THEN
         IF( MYROW.EQ.0 .AND. MYCOL.EQ.0 )
     $      WRITE( NOUT, FMT = 9996 ) MATRIX, 'IMB', MATRIX, IMBA
         INFO = 1
      ELSE IF( INBA.LT.1 ) THEN
         IF( MYROW.EQ.0 .AND. MYCOL.EQ.0 )
     $      WRITE( NOUT, FMT = 9995 ) MATRIX, 'INB', MATRIX, INBA
         INFO = 1
      END IF
*
*     Verify if blocking factors (MB_, NB_) are correct
*
      IF( MBA.LT.1 ) THEN
         IF( MYROW.EQ.0 .AND. MYCOL.EQ.0 )
     $      WRITE( NOUT, FMT = 9994 ) MATRIX, 'MB', MATRIX, MBA
         INFO = 1
      ELSE IF( NBA.LT.1 ) THEN
         IF( MYROW.EQ.0 .AND. MYCOL.EQ.0 )
     $      WRITE( NOUT, FMT = 9993 ) MATRIX, 'NB', MATRIX, NBA
         INFO = 1
      END IF
*
*     Verify if origin process coordinates (RSRC_, CSRC_) are valid;
*     -1 is accepted in addition to the grid coordinates.
*
      IF( RSRCA.LT.-1 .OR. RSRCA.GE.NPROW ) THEN
         IF( MYROW.EQ.0 .AND. MYCOL.EQ.0 ) THEN
            WRITE( NOUT, FMT = 9992 ) MATRIX
            WRITE( NOUT, FMT = 9990 ) 'RSRC', MATRIX, RSRCA, NPROW
         END IF
         INFO = 1
      ELSE IF( CSRCA.LT.-1 .OR. CSRCA.GE.NPCOL ) THEN
         IF( MYROW.EQ.0 .AND. MYCOL.EQ.0 ) THEN
            WRITE( NOUT, FMT = 9991 ) MATRIX
            WRITE( NOUT, FMT = 9990 ) 'CSRC', MATRIX, CSRCA, NPCOL
         END IF
         INFO = 1
      END IF
*
*     Check all processes for an error
*
      CALL IGSUM2D( ICTXT, 'All', ' ', 1, 1, INFO, 1, -1, 0 )
*
      IF( INFO.NE.0 ) THEN
*
         IF( MYROW.EQ.0 .AND. MYCOL.EQ.0 ) THEN
            WRITE( NOUT, FMT = 9989 ) MATRIX
            WRITE( NOUT, FMT = * )
         END IF
*
      ELSE
*
*        Compute local testing leading dimension:  the local row count
*        (at least 1) plus the lda-gap IGAP.
*
         MPA    = PB_NUMROC( MA, 1, IMBA, MBA, MYROW, RSRCA, NPROW )
         NQA    = PB_NUMROC( NA, 1, INBA, NBA, MYCOL, CSRCA, NPCOL )
         IPREA  = MAX( GAPMUL*NBA, MPA )
         IMIDA  = IGAP
         IPOSTA = MAX( GAPMUL*NBA, NQA )
         LLDA   = MAX( 1, MPA ) + IMIDA
*
         CALL PB_DESCINIT2( DESCA, MA, NA, IMBA, INBA, MBA, NBA, RSRCA,
     $                      CSRCA, ICTXT, LLDA, INFO )
*
*        Check all processes for an error
*
         CALL IGSUM2D( ICTXT, 'All', ' ', 1, 1, INFO, 1, -1, 0 )
*
         IF( INFO.NE.0 ) THEN
            IF( MYROW.EQ.0 .AND. MYCOL.EQ.0 ) THEN
               WRITE( NOUT, FMT = 9989 ) MATRIX
               WRITE( NOUT, FMT = * )
            END IF
         END IF
*
      END IF
*
 9999 FORMAT( 2X, '>> Invalid matrix ', A1, ' descriptor type ', A5, A1,
     $        ': ', I6, ' should be ', I3, '.' )
 9998 FORMAT( 2X, '>> Invalid matrix ', A1, ' row dimension ', A1, A1,
     $        ': ', I6, ' should be at least 0.' )
 9997 FORMAT( 2X, '>> Invalid matrix ', A1, ' column dimension ', A1,
     $        A1, ': ', I6, ' should be at least 0.' )
 9996 FORMAT( 2X, '>> Invalid matrix ', A1, ' first row block size ',
     $        A3, A1, ': ', I6, ' should be at least 1.' )
 9995 FORMAT( 2X, '>> Invalid matrix ', A1, ' first column block size ',
     $        A3, A1,': ', I6, ' should be at least 1.' )
 9994 FORMAT( 2X, '>> Invalid matrix ', A1, ' row block size ', A2, A1,
     $        ': ', I6, ' should be at least 1.' )
 9993 FORMAT( 2X, '>> Invalid matrix ', A1, ' column block size ', A2,
     $        A1,': ', I6, ' should be at least 1.' )
 9992 FORMAT( 2X, '>> Invalid matrix ', A1, ' row process source:' )
 9991 FORMAT( 2X, '>> Invalid matrix ', A1, ' column process source:' )
 9990 FORMAT( 2X, '>> ', A4, A1, '= ', I6, ' should be >= -1 and < ',
     $        I6, '.' )
 9989 FORMAT( 2X, '>> Invalid matrix ', A1, ' descriptor: going on to ',
     $        'next test case.' )
*
      RETURN
*
*     End of PMDESCCHK
*
      END


      DOUBLE PRECISION FUNCTION PDOPBL2( SUBNAM, M, N, KKL, KKU )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      CHARACTER*7        SUBNAM
      INTEGER            KKL, KKU, M, N
*     ..
*
*  Purpose
*  =======
*
*  PDOPBL2  returns an approximate floating point operation count for
*  the Level 2 PBLAS routine named SUBNAM, given the sizes M and N and
*  the band widths KKL and KKU.
*
*  The result is zero when M <= 0, when SUBNAM does not start with
*  'PS', 'PD', 'PC' or 'PZ', and when the rest of the name matches none
*  of the operations handled below.
*
*  Arguments
*  =========
*
*  SUBNAM  (input) CHARACTER*7
*          On entry, SUBNAM specifies the name of the subroutine.
*          Character 2 is read as the precision,  characters 3-4 as the
*          matrix type and characters 5-7 as the operation.
*
*  M       (input) INTEGER
*          On entry,  M  specifies the number of rows of the coefficient
*          matrix.  M must be at least zero.
*
*  N       (input) INTEGER
*          On entry,  N  specifies  the number of columns of the coeffi-
*          cient matrix. If the matrix  is  square (such  as  in a solve
*          routine) then N is the number of right hand sides. N  must be
*          at least zero.
*
*  KKL     (input) INTEGER
*          On entry,  KKL  specifies the lower band width of the coeffi-
*          cient matrix. The value used is max( 0, min( M-1, KKL ) ).
*
*  KKU     (input) INTEGER
*          On entry,  KKU  specifies the upper band width of the coeffi-
*          cient matrix. The value used is max( 0, min( N-1, KKU ) ).
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, SIX, TWO, ZERO
      PARAMETER          ( ONE = 1.0D+0, SIX = 6.0D+0, TWO = 2.0D+0,
     $                   ZERO = 0.0D+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            GENL, SYMM, TBND, TRIA
      CHARACTER*1        PREC
      CHARACTER*2        MTYP
      CHARACTER*3        OPER
      DOUBLE PRECISION   BWL, BWU, FADD, FMUL, RK, RM, RN
*     ..
*     .. External Functions ..
      LOGICAL            LSAME, LSAMEN
      EXTERNAL           LSAME, LSAMEN
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          DBLE, MAX, MIN
*     ..
*     .. Executable Statements ..
*
*     Nothing to count for an empty problem or a foreign routine name
*
      PDOPBL2 = ZERO
      IF( M.LE.0 )
     $   RETURN
      IF( .NOT.( LSAMEN( 2, SUBNAM, 'PS' ) .OR.
     $           LSAMEN( 2, SUBNAM, 'PD' ) .OR.
     $           LSAMEN( 2, SUBNAM, 'PC' ) .OR.
     $           LSAMEN( 2, SUBNAM, 'PZ' ) ) )
     $   RETURN
*
*     Split the routine name into precision, matrix type, operation
*
      PREC = SUBNAM( 2: 2 )
      MTYP = SUBNAM( 3: 4 )
      OPER = SUBNAM( 5: 7 )
*
*     Problem sizes and clamped band widths as double precision values
*
      RM = DBLE( M )
      RN = DBLE( N )
      BWL = MAX( 0, MIN( M-1, KKL ) )
      BWU = MAX( 0, MIN( N-1, KKU ) )
      RK = BWL
      FMUL = ZERO
      FADD = ZERO
*
*     Matrix type classes shared by several operations
*
      GENL = LSAMEN( 2, MTYP, 'GE' )
      SYMM = LSAMEN( 2, MTYP, 'SY' ) .OR. LSAMEN( 2, MTYP, 'SP' ) .OR.
     $       LSAMEN( 2, MTYP, 'HE' ) .OR. LSAMEN( 2, MTYP, 'HP' )
      TRIA = LSAMEN( 2, MTYP, 'TR' ) .OR. LSAMEN( 2, MTYP, 'TP' )
      TBND = LSAMEN( 2, MTYP, 'TB' )
*
      IF( LSAMEN( 3, OPER, 'MV ' ) ) THEN
*
*        Matrix-vector multiply routines
*
         IF( GENL ) THEN
*
            FMUL = RM * ( RN + ONE )
            FADD = RM * RN
*
         ELSE IF( LSAMEN( 2, MTYP, 'GB' ) ) THEN
*
*           Assume M <= N + KL and KL < M
*                  N <= M + KU and KU < N
*           so that the zero sections are triangles.
*
            FMUL = RM * ( RN + ONE ) -
     $             ( RM - ONE - BWL ) * ( RM - BWL ) / TWO -
     $             ( RN - ONE - BWU ) * ( RN - BWU ) / TWO
            FADD = RM * ( RN + ONE ) -
     $             ( RM - ONE - BWL ) * ( RM - BWL ) / TWO -
     $             ( RN - ONE - BWU ) * ( RN - BWU ) / TWO
*
         ELSE IF( SYMM ) THEN
*
            FMUL = RM * ( RM + ONE )
            FADD = RM * RM
*
         ELSE IF( LSAMEN( 2, MTYP, 'SB' ) .OR.
     $            LSAMEN( 2, MTYP, 'HB' ) ) THEN
*
            FMUL = RM * ( RM + ONE ) - ( RM - ONE - RK ) * ( RM - RK )
            FADD = RM * RM - ( RM - ONE - RK ) * ( RM - RK )
*
         ELSE IF( TRIA ) THEN
*
            FMUL = RM * ( RM + ONE ) / TWO
            FADD = ( RM - ONE ) * RM / TWO
*
         ELSE IF( TBND ) THEN
*
            FMUL = RM * ( RM + ONE ) / TWO -
     $             ( RM - RK - ONE ) * ( RM - RK ) / TWO
            FADD = ( RM - ONE ) * RM / TWO -
     $             ( RM - RK - ONE ) * ( RM - RK ) / TWO
*
         END IF
*
      ELSE IF( LSAMEN( 3, OPER, 'SV ' ) ) THEN
*
*        Matrix solve routines
*
         IF( TRIA ) THEN
*
            FMUL = RM * ( RM + ONE ) / TWO
            FADD = ( RM - ONE ) * RM / TWO
*
         ELSE IF( TBND ) THEN
*
            FMUL = RM * ( RM + ONE ) / TWO -
     $             ( RM - RK - ONE ) * ( RM - RK ) / TWO
            FADD = ( RM - ONE ) * RM / TWO -
     $             ( RM - RK - ONE ) * ( RM - RK ) / TWO
*
         END IF
*
      ELSE IF( LSAMEN( 3, OPER, 'R  ' ) ) THEN
*
*        Rank-one updates
*
         IF( GENL ) THEN
*
            FMUL = RM * RN + MIN( RM, RN )
            FADD = RM * RN
*
         ELSE IF( SYMM ) THEN
*
            FMUL = RM * ( RM + ONE ) / TWO + RM
            FADD = RM * ( RM + ONE ) / TWO
*
         END IF
*
      ELSE IF( LSAMEN( 3, OPER, 'RC ' ) .OR.
     $         LSAMEN( 3, OPER, 'RU ' ) ) THEN
*
*        Rank-one updates, conjugated and unconjugated variants
*
         IF( GENL ) THEN
*
            FMUL = RM * RN + MIN( RM, RN )
            FADD = RM * RN
*
         END IF
*
      ELSE IF( LSAMEN( 3, OPER, 'R2 ' ) ) THEN
*
*        Rank-two updates
*
         IF( SYMM ) THEN
*
            FMUL = RM * ( RM + ONE ) + TWO * RM
            FADD = RM * ( RM + ONE )
*
         END IF
*
      END IF
*
*     Total operation count:  precision codes other than 'S' and 'D'
*     are weighted 6 per multiply and 2 per add,  'S' and 'D' count 1
*     for each.
*
      IF( .NOT.( LSAME( PREC, 'S' ) .OR. LSAME( PREC, 'D' ) ) ) THEN
         PDOPBL2 = SIX * FMUL + TWO * FADD
      ELSE
         PDOPBL2 = FMUL + FADD
      END IF
*
      RETURN
*
*     End of PDOPBL2
*
      END


      DOUBLE PRECISION FUNCTION PDOPBL3( SUBNAM, M, N, K )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      CHARACTER*7        SUBNAM
      INTEGER            K, M, N
*     ..
*
*  Purpose
*  =======
*
*  PDOPBL3  computes  an  approximation  of the number of floating point
*  operations performed by a subroutine SUBNAM with the  given values of
*  the parameters M, N and K.
*
*  This version counts operations for the Level 3 PBLAS.
*
*  The result is zero when M <= 0, when SUBNAM does not start with
*  'PS', 'PD', 'PC' or 'PZ', and when the rest of the name matches none
*  of the operations handled below.
*
*  Arguments
*  =========
*
*  SUBNAM  (input) CHARACTER*7
*          On entry, SUBNAM specifies the name of the subroutine.
*          Character 2 is read as the precision,  characters 3-4 as the
*          matrix type and characters 5-7 as the operation.
*
*  M       (input) INTEGER
*  N       (input) INTEGER
*  K       (input) INTEGER
*          On entry, M, N, and K  contain parameter  values  used by the
*          Level 3 PBLAS.  The output matrix is always M x N or N x N if
*          symmetric,  but  K  has different uses in different contexts.
*          For example, in the matrix-matrix multiply routine,  we  have
*          C = A * B where  C is M x N,  A is M x K, and  B is K x N. In
*          PxSYMM, PxHEMM, PxTRMM, and PxTRSM,  K  indicates whether the
*          matrix  A is applied on the left or right. If K <= 0, the ma-
*          trix is applied on the left, and if K > 0, on  the  right. In
*          PxTRADD, K  indicates  whether the matrix C is upper or lower
*          triangular. If K <= 0, the  matrix C is upper triangular, and
*          lower triangular otherwise.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, SIX, TWO, ZERO
      PARAMETER          ( ONE = 1.0D+0, SIX = 6.0D+0, TWO = 2.0D+0,
     $                   ZERO = 0.0D+0 )
*     ..
*     .. Local Scalars ..
      CHARACTER*1        C1
      CHARACTER*2        C2
      CHARACTER*3        C3
      DOUBLE PRECISION   ADDS, EK, EM, EN, MULTS
*     ..
*     .. External Functions ..
      LOGICAL            LSAME, LSAMEN
      EXTERNAL           LSAME, LSAMEN
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          DBLE
*     ..
*     .. Executable Statements ..
*
*     Quick return if possible
*
      IF( M.LE.0 .OR. .NOT.( LSAMEN( 2, SUBNAM, 'PS' ) .OR.
     $    LSAMEN( 2, SUBNAM, 'PD' ) .OR. LSAMEN( 2, SUBNAM, 'PC' )
     $   .OR. LSAMEN( 2, SUBNAM, 'PZ' ) ) )
     $     THEN
         PDOPBL3 = ZERO
         RETURN
      END IF
*
*     C1 = precision, C2 = matrix type, C3 = operation
*
      C1 = SUBNAM( 2: 2 )
      C2 = SUBNAM( 3: 4 )
      C3 = SUBNAM( 5: 7 )
      MULTS = ZERO
      ADDS  = ZERO
      EM = DBLE( M )
      EN = DBLE( N )
      EK = DBLE( K )
*
*     ----------------------
*     Matrix-matrix products
*        assume beta = 1
*     ----------------------
*
      IF( LSAMEN( 3, C3, 'MM ' ) ) THEN
*
         IF( LSAMEN( 2, C2, 'GE' ) ) THEN
*
            MULTS = EM * EK * EN
            ADDS  = EM * EK * EN
*
         ELSE IF( LSAMEN( 2, C2, 'SY' ) .OR.
     $            LSAMEN( 2, C2, 'HE' ) ) THEN
*
*           IF K <= 0, assume A multiplies B on the left.
*
            IF( K.LE.0 ) THEN
               MULTS = EM * EM * EN
               ADDS  = EM * EM * EN
            ELSE
               MULTS = EM * EN * EN
               ADDS  = EM * EN * EN
            END IF
*
         ELSE IF( LSAMEN( 2, C2, 'TR' ) ) THEN
*
*           IF K <= 0, assume A multiplies B on the left.
*
            IF( K.LE.0 ) THEN
               MULTS = EN * EM * ( EM + ONE ) / TWO
               ADDS  = EN * EM * ( EM - ONE ) / TWO
            ELSE
               MULTS = EM * EN * ( EN + ONE ) / TWO
               ADDS  = EM * EN * ( EN - ONE ) / TWO
            END IF
*
         END IF
*
*     ------------------------------------------------
*     Rank-K update of a symmetric or Hermitian matrix
*     ------------------------------------------------
*
      ELSE IF( LSAMEN( 3, C3, 'RK ' ) ) THEN
*
         IF( LSAMEN( 2, C2, 'SY' ) .OR.
     $       LSAMEN( 2, C2, 'HE' ) ) THEN
*
            MULTS = EK * EM *( EM + ONE ) / TWO
            ADDS  = EK * EM *( EM + ONE ) / TWO
         END IF
*
*     -------------------------------------------------
*     Rank-2K update of a symmetric or Hermitian matrix
*     -------------------------------------------------
*
      ELSE IF( LSAMEN( 3, C3, 'R2K' ) ) THEN
*
*        C2 holds two characters, so compare exactly two:  LSAMEN
*        returns .FALSE. whenever the requested length exceeds the
*        length of either string, which would make the Hermitian
*        case unreachable.
*
         IF( LSAMEN( 2, C2, 'SY' ) .OR.
     $       LSAMEN( 2, C2, 'HE' ) ) THEN
*
            MULTS = EK * EM * EM
            ADDS  = EK * EM * EM + EM
         END IF
*
*     -----------------------------------------
*     Solving system with many right hand sides
*     -----------------------------------------
*
      ELSE IF( LSAMEN( 4, SUBNAM( 3:6 ), 'TRSM' ) ) THEN
*
*        IF K <= 0, assume A is applied on the left.
*
         IF( K.LE.0 ) THEN
            MULTS = EN * EM * ( EM + ONE ) / TWO
            ADDS  = EN * EM * ( EM - ONE ) / TWO
         ELSE
            MULTS = EM * EN * ( EN + ONE ) / TWO
            ADDS  = EM * EN * ( EN - ONE ) / TWO
         END IF
*
*     ---------------------------
*     Matrix (transpose) Addition
*     ---------------------------
*
      ELSE IF( LSAMEN( 3, C3, 'ADD' ) ) THEN
*
         IF( LSAMEN( 2, C2, 'GE' ) ) THEN
*
            MULTS = TWO * EM * EN
            ADDS  = EM * EN
*
         ELSE IF( LSAMEN( 2, C2, 'TR' ) ) THEN
*
*           IF K <= 0, assume C is upper triangular.
*
            IF( K.LE.0 ) THEN
               IF( M.LE.N ) THEN
                  MULTS = EM * ( TWO * EN - EM + ONE )
                  ADDS  = EM * ( EM + ONE ) / TWO + EM * ( EN - EM )
               ELSE
                  MULTS = EN * ( EN + ONE )
                  ADDS  = EN * ( EN + ONE ) / TWO
               END IF
            ELSE
               IF( M.GE.N ) THEN
                  MULTS = EN * ( TWO * EM - EN + ONE )
                  ADDS  = EN * ( EN + ONE ) / TWO + EN * ( EM - EN )
               ELSE
                  MULTS = EM * ( EM + ONE )
                  ADDS  = EM * ( EM + ONE ) / TWO
               END IF
            END IF
*
         END IF
*
      END IF
*
*     ------------------------------------------------
*     Compute the total number of operations.
*     For real and double precision routines, count
*        1 for each multiply and 1 for each add.
*     For complex and complex*16 routines, count
*        6 for each multiply and 2 for each add.
*     ------------------------------------------------
*
      IF( LSAME( C1, 'S' ) .OR. LSAME( C1, 'D' ) ) THEN
*
         PDOPBL3 = MULTS + ADDS
*
      ELSE
*
         PDOPBL3 = SIX * MULTS + TWO * ADDS
*
      END IF
*
      RETURN
*
*     End of PDOPBL3
*
      END


      SUBROUTINE PXERBLA( ICTXT, SRNAME, INFO )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            ICTXT, INFO
      CHARACTER*(*)      SRNAME
*     ..
*
*  Purpose
*  =======
*
*  PXERBLA is an error handler for the ScaLAPACK routines.  It is called
*  by a ScaLAPACK routine if an input parameter has an invalid value.
*  It prints one line on the default output unit giving the process
*  coordinates returned by BLACS_GRIDINFO,  the routine name and the
*  position of the offending parameter,  and then returns.  Installers
*  may consider modifying this routine in order to call system-specific
*  exception-handling facilities.
*
*  Arguments
*  =========
*
*  ICTXT   (local input) INTEGER
*          On entry,  ICTXT  specifies the BLACS context handle, indica-
*          ting the global  context of the operation. The context itself
*          is global, but the value of ICTXT is local.
*
*  SRNAME  (global input) CHARACTER*(*)
*          On entry, SRNAME specifies the name of the routine which  is
*          calling PXERBLA.
*
*  INFO    (global input) INTEGER
*          On entry, INFO  specifies the position of the invalid parame-
*          ter in the parameter list of the calling routine.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            GCOLS, GROWS, PCOL, PROW
*     ..
*     .. External Subroutines ..
      EXTERNAL           BLACS_GRIDINFO
*     ..
*     .. Executable Statements ..
*
*     Grid shape (unused here) and this process' coordinates
*
      CALL BLACS_GRIDINFO( ICTXT, GROWS, GCOLS, PROW, PCOL )
*
*     Report who complained, about which routine and which argument
*
      WRITE( *, FMT = 9000 ) PROW, PCOL, SRNAME, INFO
*
      RETURN
*
 9000 FORMAT( '{', I5, ',', I5, '}:  On entry to ', A,
     $        ' parameter number ', I4, ' had an illegal value' )
*
*     End of PXERBLA
*
      END


      LOGICAL          FUNCTION LSAME( CA, CB )
*
*  -- LAPACK auxiliary routine (version 2.1) --
*     Univ. of Tennessee, Univ. of California Berkeley, NAG Ltd.,
*     Courant Institute, Argonne National Lab, and Rice University
*     September 30, 1994
*
*     .. Scalar Arguments ..
      CHARACTER          CA, CB
*     ..
*
*  Purpose
*  =======
*
*  LSAME returns .TRUE. if CA is the same letter as CB regardless of
*  case, and .FALSE. otherwise.
*
*  Arguments
*  =========
*
*  CA      (input) CHARACTER*1
*  CB      (input) CHARACTER*1
*          CA and CB specify the single characters to be compared.
*
* =====================================================================
*
*     .. Intrinsic Functions ..
      INTRINSIC          ICHAR
*     ..
*     .. Local Scalars ..
      INTEGER            KA, KB, ZREF
*     ..
*     .. Executable Statements ..
*
*     Identical characters need no further work
*
      LSAME = CA.EQ.CB
      IF( .NOT.LSAME ) THEN
*
*        The code of 'Z' identifies the character set.  'Z' is used
*        rather than 'A' so that ASCII can be detected on Prime
*        machines, on which ICHAR returns a value with bit 8 set:
*        ICHAR('A') on Prime machines returns 193, which is the same
*        as ICHAR('A') on an EBCDIC machine.
*
         ZREF = ICHAR( 'Z' )
         KA = ICHAR( CA )
         KB = ICHAR( CB )
*
         IF( ZREF.EQ.90 .OR. ZREF.EQ.122 ) THEN
*
*           ASCII:  fold the lower case range 97-122 onto upper case
*
            IF( KA.GE.97 .AND. KA.LE.122 ) KA = KA - 32
            IF( KB.GE.97 .AND. KB.LE.122 ) KB = KB - 32
*
         ELSE IF( ZREF.EQ.233 .OR. ZREF.EQ.169 ) THEN
*
*           EBCDIC:  lower case letters occupy three separate ranges,
*           each of which sits 64 below its upper case counterpart
*
            IF( ( KA.GE.129 .AND. KA.LE.137 ) .OR.
     $          ( KA.GE.145 .AND. KA.LE.153 ) .OR.
     $          ( KA.GE.162 .AND. KA.LE.169 ) ) KA = KA + 64
            IF( ( KB.GE.129 .AND. KB.LE.137 ) .OR.
     $          ( KB.GE.145 .AND. KB.LE.153 ) .OR.
     $          ( KB.GE.162 .AND. KB.LE.169 ) ) KB = KB + 64
*
         ELSE IF( ZREF.EQ.218 .OR. ZREF.EQ.250 ) THEN
*
*           ASCII on Prime machines:  the ASCII codes plus 128
*
            IF( KA.GE.225 .AND. KA.LE.250 ) KA = KA - 32
            IF( KB.GE.225 .AND. KB.LE.250 ) KB = KB - 32
*
         END IF
*
*        Compare the case-folded codes
*
         LSAME = KA.EQ.KB
      END IF
*
      RETURN
*
*     End of LSAME
*
      END


      LOGICAL          FUNCTION lsamen( N, CA, CB )
*
*  -- LAPACK auxiliary routine (version 2.1) --
*     Univ. of Tennessee, Univ. of California Berkeley, NAG Ltd.,
*     Courant Institute, Argonne National Lab, and Rice University
*     September 30, 1994
*
*     .. Scalar Arguments ..
      CHARACTER*( * )    CA, CB
      INTEGER            N
*     ..
*
*  Purpose
*  =======
*
*  LSAMEN compares the leading N characters of CA with the leading N
*  characters of CB, position by position, by means of LSAME (which
*  ignores the case of letters).  The result is .TRUE. when every one
*  of the N pairs matches and .FALSE. as soon as one pair differs.
*
*  The result is also .FALSE. when LEN( CA ) or LEN( CB ) is smaller
*  than N; no character is accessed in that case.  When N is less
*  than one nothing is compared and the result is .TRUE..
*
*  Arguments
*  =========
*
*  N       (input) INTEGER
*          The number of leading characters of CA and CB to compare.
*
*  CA      (input) CHARACTER*(*)
*  CB      (input) CHARACTER*(*)
*          The two character strings.  Only their first N characters
*          are ever accessed.
*
* =====================================================================
*
*     .. Local Scalars ..
      INTEGER            K
*     ..
*     .. External Functions ..
      LOGICAL            lsame
      EXTERNAL           lsame
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          LEN
*     ..
*     .. Executable Statements ..
*
*     Assume a mismatch until all N positions have been checked.
*
      lsamen = .FALSE.
*
      IF( LEN( CA ).GE.N .AND. LEN( CB ).GE.N ) THEN
*
*        Both strings are long enough: leave with .FALSE. at the
*        first pair of characters LSAME reports as different.
*
         DO 10 K = 1, N
            IF( .NOT.lsame( CA( K: K ), CB( K: K ) ) )
     $         RETURN
   10    CONTINUE
*
         lsamen = .TRUE.
*
      END IF
*
      RETURN
*
*     End of LSAMEN
*
      END


      SUBROUTINE icopy( N, SX, INCX, SY, INCY )
*
*  -- LAPACK auxiliary test routine (version 2.1) --
*     Univ. of Tennessee, Univ. of California Berkeley, NAG Ltd.,
*     Courant Institute, Argonne National Lab, and Rice University
*     February 29, 1992
*
*     .. Scalar Arguments ..
      INTEGER            INCX, INCY, N
*     ..
*     .. Array Arguments ..
      INTEGER            SX( * ), SY( * )
*     ..
*
*  Purpose
*  =======
*
*  ICOPY copies N entries of the integer vector SX into the integer
*  vector SY.  When both increments are equal to one, the copy is
*  carried out by a loop unrolled seven times, preceded by a short
*  loop handling the MOD( N, 7 ) leading entries.  Any other pair of
*  increments is handled by a single strided loop.  The routine does
*  nothing when N is not positive.
*
*  Arguments
*  =========
*
*  N       (input) INTEGER
*          The number of entries to copy.
*
*  SX      (input) INTEGER array, dimension (1+(N-1)*abs(INCX))
*          The source vector.
*
*  INCX    (input) INTEGER
*          The spacing between consecutive entries of SX.  A negative
*          value makes the traversal start at 1+(N-1)*abs(INCX) and
*          walk towards the first array element.
*
*  SY      (output) INTEGER array, dimension (1+(N-1)*abs(INCY))
*          The destination vector.
*
*  INCY    (input) INTEGER
*          The spacing between consecutive entries of SY.  A negative
*          value makes the traversal start at 1+(N-1)*abs(INCY) and
*          walk towards the first array element.
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            K, KX, KY, NHEAD
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MOD
*     ..
*     .. Executable Statements ..
*
      IF( N.GT.0 ) THEN
*
         IF( INCX.NE.1 .OR. INCY.NE.1 ) THEN
*
*           At least one increment differs from one: strided copy.
*           With a negative increment the walk starts from the far
*           end of the corresponding array.
*
            KX = 1
            KY = 1
            IF( INCX.LT.0 )
     $         KX = 1 - ( N-1 )*INCX
            IF( INCY.LT.0 )
     $         KY = 1 - ( N-1 )*INCY
*
            DO 10 K = 1, N
               SY( KY ) = SX( KX )
               KX = KX + INCX
               KY = KY + INCY
   10       CONTINUE
*
         ELSE
*
*           Both increments are one.  Copy the MOD( N, 7 ) leading
*           entries one at a time ...
*
            NHEAD = MOD( N, 7 )
            DO 20 K = 1, NHEAD
               SY( K ) = SX( K )
   20       CONTINUE
*
*           ... then the remaining entries seven per iteration.  The
*           loop below is not entered when N is smaller than seven.
*
            DO 30 K = NHEAD + 1, N, 7
               SY( K )   = SX( K )
               SY( K+1 ) = SX( K+1 )
               SY( K+2 ) = SX( K+2 )
               SY( K+3 ) = SX( K+3 )
               SY( K+4 ) = SX( K+4 )
               SY( K+5 ) = SX( K+5 )
               SY( K+6 ) = SX( K+6 )
   30       CONTINUE
*
         END IF
*
      END IF
*
      RETURN
*
*     End of ICOPY
*
      END


      INTEGER FUNCTION pb_noabort( CINFO )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            CINFO
*     ..
*
*  Purpose
*  =======
*
*  PB_NOABORT  hands the  info  parameter  of  a  PBLAS  routine to the
*  tester and tells the  PBLAS  error handler whether it should refrain
*  from aborting on erroneous input arguments.
*
*  The value of  CINFO  is stored in the variable  INFO  of the  common
*  block  /INFOC/.  The function value is  0  when the logical  ABRTFLG
*  of the common block /PBERRORC/ is .TRUE., and 1 otherwise.
*
*  Notes
*  =====
*
*  This  routine  is  necessary because of the CRAY C fortran interface
*  and  the  fact  that  the usual PBLAS error handler routine has been
*  initially written in C.
*
*  Arguments
*  =========
*
*  CINFO   (input) INTEGER
*          The info value to be recorded in /INFOC/.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Common Blocks ..
      INTEGER            INFO, NBLOG, NOUT
      LOGICAL            ABRTFLG
      COMMON             /INFOC/INFO, NBLOG
      COMMON             /PBERRORC/NOUT, ABRTFLG
*     ..
*     .. Executable Statements ..
*
*     Record the error code for the tester.
*
      INFO = CINFO
*
*     Return 1 unless the abort flag is raised, in which case return 0.
*
      pb_noabort = 1
      IF( ABRTFLG )
     $   pb_noabort = 0
*
      RETURN
*
*     End of PB_NOABORT
*
      END


      SUBROUTINE pb_infog2l( I, J, DESC, NPROW, NPCOL, MYROW, MYCOL, II,
     $                       JJ, PROW, PCOL )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            I, II, J, JJ, MYCOL, MYROW, NPCOL, NPROW, PCOL,
     $                   PROW
*     ..
*     .. Array Arguments ..
      INTEGER            DESC( * )
*     ..
*
*  Purpose
*  =======
*
*  PB_INFOG2L  computes  the  local  starting  indexes  II, JJ  of the
*  submatrix whose first entry has the global indexes  I, J,  as  seen
*  by the process of coordinates  MYROW, MYCOL.  It also  returns  the
*  grid coordinates PROW, PCOL of the process owning the global  entry
*  I, J.
*
*  The row and the column directions are handled  independently,  with
*  the same algorithm:  ( I, IMB, MB, RSRC, NPROW, MYROW )  yields  II
*  and PROW, and ( J, INB, NB, CSRC, NPCOL, MYCOL ) yields JJ and PCOL.
*
*  Notes
*  =====
*
*  A description vector is associated with each 2D block-cyclicly dis-
*  tributed matrix.  It stores the information required  to  establish
*  the mapping between a matrix entry and its corresponding process and
*  memory location.  Below, the character _ should be read as  "of the
*  distributed matrix", A being a generic  name  for  such  a  matrix,
*  described by DESCA:
*
*  NOTATION         STORED IN       EXPLANATION
*  ---------------- --------------- -----------------------------------
*  DTYPE_A (global) DESCA( DTYPE_ ) The descriptor type.
*  CTXT_A  (global) DESCA( CTXT_  ) The BLACS context handle of the
*                                   NPROW x NPCOL process grid  A  is
*                                   distributed over.  The context is
*                                   global, the handle value may vary.
*  M_A     (global) DESCA( M_     ) The number of rows of A, M_A >= 0.
*  N_A     (global) DESCA( N_     ) The number of columns of A,
*                                   N_A >= 0.
*  IMB_A   (global) DESCA( IMB_   ) The number of rows of the upper
*                                   left block of A, IMB_A > 0.
*  INB_A   (global) DESCA( INB_   ) The number of columns of the upper
*                                   left block of A, INB_A > 0.
*  MB_A    (global) DESCA( MB_    ) The blocking factor used for the
*                                   last M_A-IMB_A rows of A, MB_A > 0.
*  NB_A    (global) DESCA( NB_    ) The blocking factor used for the
*                                   last N_A-INB_A columns of A,
*                                   NB_A > 0.
*  RSRC_A  (global) DESCA( RSRC_  ) The process row over which the
*                                   first row of A is distributed,
*                                   NPROW > RSRC_A >= 0.
*  CSRC_A  (global) DESCA( CSRC_  ) The process column over which the
*                                   first column of A is distributed,
*                                   NPCOL > CSRC_A >= 0.
*  LLD_A   (local)  DESCA( LLD_   ) The leading dimension of the local
*                                   array storing the local blocks of
*                                   A,
*                                   IF( Lc( 1, N_A ) > 0 )
*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )
*                                   ELSE
*                                      LLD_A >= 1.
*
*  Lr( IA, K )  is the number of rows that the process of row coordi-
*  nate MYROW ( 0 <= MYROW < NPROW ) would receive if the K rows  of A
*  starting at the global index IA were distributed over NPROW process
*  rows.  Lc( JA, K ) is the analogous quantity for K columns starting
*  at the global index JA, the process column  MYCOL  and  NPCOL  pro-
*  cess columns.  Both may be obtained from the function PB_NUMROC:
*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )
*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )
*
*  Arguments
*  =========
*
*  I       (global input) INTEGER
*          The global starting row index of the submatrix. I must be
*          at least one.
*
*  J       (global input) INTEGER
*          The global starting column index of the submatrix. J must
*          be at least one.
*
*  DESC    (global and local input) INTEGER array
*          The array descriptor of the underlying matrix.  It is first
*          passed to  PB_DESCTRANS,  and the  DLEN_  entries  of  the
*          descriptor returned by that routine are the ones used here.
*
*  NPROW   (global input) INTEGER
*          The total number of process rows over which the matrix is
*          distributed.  NPROW must be at least one.
*
*  NPCOL   (global input) INTEGER
*          The total number of process columns over which the matrix
*          is distributed.  NPCOL must be at least one.
*
*  MYROW   (local input) INTEGER
*          The row coordinate of the process whose local index  II is
*          determined.  MYROW must be at least zero and strictly less
*          than NPROW.
*
*  MYCOL   (local input) INTEGER
*          The column coordinate of the process whose local index  JJ
*          is determined.  MYCOL must be at least zero and  strictly
*          less than NPCOL.
*
*  II      (local output) INTEGER
*          The local starting row index of the submatrix. On exit, II
*          is at least one.
*
*  JJ      (local output) INTEGER
*          The local starting column index of the submatrix. On exit,
*          JJ is at least one.
*
*  PROW    (global output) INTEGER
*          The row coordinate of the process that possesses the first
*          row of the submatrix.  On exit, PROW is -1 if the converted
*          RSRC_ entry is -1, and at least zero and strictly less than
*          NPROW otherwise.
*
*  PCOL    (global output) INTEGER
*          The column coordinate of the process  that  possesses  the
*          first column of the submatrix.  On exit, PCOL is -1 if the
*          converted CSRC_ entry is -1, and at least zero and strictly
*          less than NPCOL otherwise.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            BLOCK_CYCLIC_2D_INB, CSRC_, CTXT_, DLEN_,
     $                   DTYPE_, IMB_, INB_, LLD_, MB_, M_, NB_, N_,
     $                   RSRC_
      PARAMETER          ( BLOCK_CYCLIC_2D_INB = 2, DLEN_ = 11,
     $                   DTYPE_ = 1, CTXT_ = 2, M_ = 3, N_ = 4,
     $                   IMB_ = 5, INB_ = 6, MB_ = 7, NB_ = 8,
     $                   RSRC_ = 9, CSRC_ = 10, LLD_ = 11 )
*     ..
*     .. Local Scalars ..
*
*     The same scalars serve the row pass and then the column pass:
*       FIRST   size of the first block (IMB_ or INB_ entry)
*       BLKSZ   blocking factor (MB_ or NB_ entry)
*       SRC     source process coordinate (RSRC_ or CSRC_ entry)
*       OFFSET  global index counted from the end of the first block
*       NBLK    number of blocks, past the first one, up to and
*               including the block holding the global index
*       KFULL   NBLK divided by the number of processes, clamped to
*               be non-negative
*       SHIFT   distance of this process from SRC, then reduced by
*               NBLK - KFULL * (number of processes)
*
      INTEGER            BLKSZ, FIRST, KFULL, NBLK, OFFSET, SHIFT,
     $                   SRC
*     ..
*     .. Local Arrays ..
      INTEGER            DESC2( DLEN_ )
*     ..
*     .. External Subroutines ..
      EXTERNAL           pb_desctrans
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MOD
*     ..
*     .. Executable Statements ..
*
*     Convert descriptor
*
      CALL pb_desctrans( DESC, DESC2 )
*
*     ------------------------------------------------------------------
*     Row direction: II and PROW
*     ------------------------------------------------------------------
*
      FIRST = DESC2( IMB_ )
      PROW  = DESC2( RSRC_ )
*
      IF( ( PROW.EQ.-1 ).OR.( NPROW.EQ.1 ) ) THEN
*
*        Every process row has row I
*
         II = I
*
      ELSE IF( I.LE.FIRST ) THEN
*
*        I is in range of the first block
*
         IF( MYROW.EQ.PROW ) THEN
            II = I
         ELSE
            II = 1
         END IF
*
      ELSE
*
*        I is not in the first block of the matrix: find the process
*        row owning it, moving NBLK process rows away from the source
*        with wrap-around.
*
         SRC    = PROW
         BLKSZ  = DESC2( MB_ )
         OFFSET = I - FIRST
         NBLK   = ( OFFSET - 1 ) / BLKSZ + 1
         PROW   = MOD( SRC + NBLK, NPROW )
*
         KFULL  = NBLK / NPROW
         IF( KFULL.LT.0 )
     $      KFULL = 0
*
         IF( MYROW.EQ.SRC ) THEN
*
*           This process row is the source one; its local rows begin
*           with the FIRST rows of the first block.
*
            IF( KFULL.EQ.0 .OR. KFULL*NPROW.LT.NBLK ) THEN
               II = FIRST + KFULL*BLKSZ + 1
            ELSE IF( MYROW.EQ.PROW ) THEN
               II = I + ( KFULL - NBLK )*BLKSZ
            ELSE
               II = FIRST + ( KFULL - 1 )*BLKSZ + 1
            END IF
*
         ELSE
*
*           This process row is not the source one; all its blocks
*           have BLKSZ rows.
*
            SHIFT = MYROW - SRC
            IF( SHIFT.LT.0 )
     $         SHIFT = SHIFT + NPROW
            SHIFT = SHIFT - NBLK + KFULL*NPROW
*
            IF( SHIFT.LT.0 ) THEN
               II = ( KFULL + 1 )*BLKSZ + 1
            ELSE IF( MYROW.EQ.PROW ) THEN
               II = OFFSET + ( KFULL - NBLK + 1 )*BLKSZ
            ELSE
               II = KFULL*BLKSZ + 1
            END IF
*
         END IF
*
      END IF
*
*     ------------------------------------------------------------------
*     Column direction: JJ and PCOL
*     ------------------------------------------------------------------
*
      FIRST = DESC2( INB_ )
      PCOL  = DESC2( CSRC_ )
*
      IF( ( PCOL.EQ.-1 ).OR.( NPCOL.EQ.1 ) ) THEN
*
*        Every process column has column J
*
         JJ = J
*
      ELSE IF( J.LE.FIRST ) THEN
*
*        J is in range of the first block
*
         IF( MYCOL.EQ.PCOL ) THEN
            JJ = J
         ELSE
            JJ = 1
         END IF
*
      ELSE
*
*        J is not in the first block of the matrix: find the process
*        column owning it, moving NBLK process columns away from the
*        source with wrap-around.
*
         SRC    = PCOL
         BLKSZ  = DESC2( NB_ )
         OFFSET = J - FIRST
         NBLK   = ( OFFSET - 1 ) / BLKSZ + 1
         PCOL   = MOD( SRC + NBLK, NPCOL )
*
         KFULL  = NBLK / NPCOL
         IF( KFULL.LT.0 )
     $      KFULL = 0
*
         IF( MYCOL.EQ.SRC ) THEN
*
*           This process column is the source one; its local columns
*           begin with the FIRST columns of the first block.
*
            IF( KFULL.EQ.0 .OR. KFULL*NPCOL.LT.NBLK ) THEN
               JJ = FIRST + KFULL*BLKSZ + 1
            ELSE IF( MYCOL.EQ.PCOL ) THEN
               JJ = J + ( KFULL - NBLK )*BLKSZ
            ELSE
               JJ = FIRST + ( KFULL - 1 )*BLKSZ + 1
            END IF
*
         ELSE
*
*           This process column is not the source one; all its blocks
*           have BLKSZ columns.
*
            SHIFT = MYCOL - SRC
            IF( SHIFT.LT.0 )
     $         SHIFT = SHIFT + NPCOL
            SHIFT = SHIFT - NBLK + KFULL*NPCOL
*
            IF( SHIFT.LT.0 ) THEN
               JJ = ( KFULL + 1 )*BLKSZ + 1
            ELSE IF( MYCOL.EQ.PCOL ) THEN
               JJ = OFFSET + ( KFULL - NBLK + 1 )*BLKSZ
            ELSE
               JJ = KFULL*BLKSZ + 1
            END IF
*
         END IF
*
      END IF
*
      RETURN
*
*     End of PB_INFOG2L
*
      END


      SUBROUTINE pb_ainfog2l( M, N, I, J, DESC, NPROW, NPCOL, MYROW,

     $                        MYCOL, IMB1, INB1, MP, NQ, II, JJ, PROW,

     $                        PCOL, RPROW, RPCOL )

*

*  -- PBLAS test routine (version 2.0) --

*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,

*     and University of California, Berkeley.

*     April 1, 1998

*

*     .. Scalar Arguments ..

      INTEGER            I, II, IMB1, INB1, J, JJ, M, MP, MYCOL, MYROW,

     $                   n, npcol, nprow, nq, pcol, prow, rpcol, rprow

*     ..

*     .. Array Arguments ..

      INTEGER            DESC( * )

*     ..

*

*  Purpose

*  =======

*

*  PB_AINFOG2L  computes the  starting  local row and column indexes II,

*  JJ  corresponding to  the  submatrix  starting  globally at the entry

*  pointed by I,  J. This routine returns the coordinates in the grid of

*  the  process owning  the  matrix entry of global indexes I, J, namely

*  PROW  and  PCOL. In addition, this routine computes the quantities MP

*  and  NQ,  which are respectively the local number of rows and columns

*  owned by the process of coordinate  MYROW, MYCOL corresponding to the

*  global submatrix A(I:I+M-1,J:J+N-1).  Finally, the size  of the first

*  partial block and the relative process coordinates  are also returned

*  respectively in IMB1, INB1 and RPROW, RPCOL.

*

*  Notes

*  =====

*

*  A description  vector  is associated with each 2D block-cyclicly dis-

*  tributed matrix.  This  vector  stores  the  information  required to

*  establish the  mapping  between a  matrix entry and its corresponding

*  process and memory location.

*

*  In  the  following  comments,   the character _  should  be  read  as

*  "of  the  distributed  matrix".  Let  A  be a generic term for any 2D

*  block cyclicly distributed matrix.  Its description vector is DESCA:

*

*  NOTATION         STORED IN       EXPLANATION

*  ---------------- --------------- ------------------------------------

*  DTYPE_A (global) DESCA( DTYPE_ ) The descriptor type.

*  CTXT_A  (global) DESCA( CTXT_  ) The BLACS context handle, indicating

*                                   the NPROW x NPCOL BLACS process grid

*                                   A  is distributed over.  The context

*                                   itself  is  global,  but  the handle

*                                   (the integer value) may vary.

*  M_A     (global) DESCA( M_     ) The  number of rows in the distribu-

*                                   ted matrix A, M_A >= 0.

*  N_A     (global) DESCA( N_     ) The number of columns in the distri-

*                                   buted matrix A, N_A >= 0.

*  IMB_A   (global) DESCA( IMB_   ) The number of rows of the upper left

*                                   block of the matrix A, IMB_A > 0.

*  INB_A   (global) DESCA( INB_   ) The  number  of columns of the upper

*                                   left   block   of   the   matrix  A,

*                                   INB_A > 0.

*  MB_A    (global) DESCA( MB_    ) The blocking factor used to  distri-

*                                   bute the last  M_A-IMB_A rows of  A,

*                                   MB_A > 0.

*  NB_A    (global) DESCA( NB_    ) The blocking factor used to  distri-

*                                   bute the last  N_A-INB_A  columns of

*                                   A, NB_A > 0.

*  RSRC_A  (global) DESCA( RSRC_  ) The process row over which the first

*                                   row of the matrix  A is distributed,

*                                   NPROW > RSRC_A >= 0.

*  CSRC_A  (global) DESCA( CSRC_  ) The  process  column  over which the

*                                   first  column of  A  is distributed.

*                                   NPCOL > CSRC_A >= 0.

*  LLD_A   (local)  DESCA( LLD_   ) The  leading  dimension of the local

*                                   array  storing  the  local blocks of

*                                   the distributed matrix A,

*                                   IF( Lc( 1, N_A ) > 0 )

*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )

*                                   ELSE

*                                      LLD_A >= 1.

*

*  Let K be the number of  rows of a matrix A starting at the global in-

*  dex IA,i.e, A( IA:IA+K-1, : ). Lr( IA, K ) denotes the number of rows

*  that the process of row coordinate MYROW ( 0 <= MYROW < NPROW ) would

*  receive if these K rows were distributed over NPROW processes.  If  K

*  is the number of columns of a matrix  A  starting at the global index

*  JA, i.e, A( :, JA:JA+K-1, : ), Lc( JA, K ) denotes the number  of co-

*  lumns that the process MYCOL ( 0 <= MYCOL < NPCOL ) would  receive if

*  these K columns were distributed over NPCOL processes.

*

*  The values of Lr() and Lc() may be determined via a call to the func-

*  tion PB_NUMROC:

*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )

*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )

*

*  Arguments

*  =========

*

*  M       (global input) INTEGER

*          On entry, M specifies the global number of rows of the subma-

*          trix. M must be at least zero.

*

*  N       (global input) INTEGER

*          On entry, N specifies  the  global  number  of columns of the

*          submatrix. N must be at least zero.

*

*  I       (global input) INTEGER

*          On entry, I  specifies  the  global starting row index of the

*          submatrix. I must be at least one.

*

*  J       (global input) INTEGER

*          On entry, J  specifies  the global starting column  index  of

*          the submatrix. J must be at least one.

*

*  DESC    (global and local input) INTEGER array

*          On entry,  DESC is an integer array of dimension DLEN_.  This

*          is the array descriptor of the underlying matrix.

*

*  NPROW   (global input) INTEGER

*          On entry,  NPROW   specifies the total number of process rows

*          over which the matrix is distributed.  NPROW must be at least

*          one.

*

*  NPCOL   (global input) INTEGER

*          On entry, NPCOL specifies the total number of process columns

*          over which the matrix is distributed.  NPCOL must be at least

*          one.

*

*  MYROW   (local input) INTEGER

*          On entry,  MYROW  specifies the row coordinate of the process

*          whose local index  II  is determined.  MYROW must be at least

*          zero and strictly less than NPROW.

*

*  MYCOL   (local input) INTEGER

*          On entry,  MYCOL  specifies the column coordinate of the pro-

*          cess whose local index  JJ  is determined.  MYCOL  must be at

*          least zero and strictly less than NPCOL.

*

*  IMB1    (global output) INTEGER

*          On exit, IMB1 specifies the number of rows of the upper  left

*          block of the submatrix. On exit,  IMB1 is less or equal  than

*          M and greater or equal than MIN( 1, M ).

*

*  INB1    (global output) INTEGER

*          On exit, INB1 specifies  the number  of  columns of the upper

*          left block of the submatrix. On exit,  INB1 is  less or equal

*          than N and greater or equal than MIN( 1, N ).

*

*  MP      (local output) INTEGER

*          On exit, MP specifies the local number of rows of the  subma-

*          trix, that the processes of row coordinate MYROW own.  MP  is

*          at least zero.

*

*  NQ      (local output) INTEGER

*          On exit, NQ specifies  the  local  number  of columns  of the

*          submatrix,  that  the processes  of column  coordinate  MYCOL

*          own. NQ is at least zero.

*

*  II      (local output) INTEGER

*          On exit, II  specifies the  local  starting  row index of the

*          submatrix. On exit, II is at least one.

*

*  JJ      (local output) INTEGER

*          On exit, JJ  specifies the  local  starting  column index  of

*          the submatrix. On exit, JJ is at least one.

*

*  PROW    (global output) INTEGER

*          On exit,  PROW  specifies the row coordinate of  the  process

*          that possesses the first row of the submatrix. On exit,  PROW

*          is -1 if DESC(RSRC_)  is -1 on input, and, at least zero  and

*          strictly less than NPROW otherwise.

*

*  PCOL    (global output) INTEGER

*          On exit, PCOL  specifies the column coordinate of the process

*          that possesses the first column of the  submatrix.  On  exit,

*          PCOL is -1 if DESC(CSRC_)  is -1 on input, and, at least zero

*          and strictly less than NPCOL otherwise.

*

*  RPROW   (global output) INTEGER

*          On exit, RPROW specifies  the  relative row coordinate of the

*          process that possesses the first row  I  of the submatrix. On

*          exit, RPROW is -1 if DESC(RSRC_) is  -1  on  input,  and,  at

*          least zero and strictly less than NPROW otherwise.

*

*  RPCOL   (global output) INTEGER

*          On exit, RPCOL specifies  the  relative column  coordinate of

*          the process that possesses the first column  J  of the subma-

*          trix. On exit, RPCOL is -1 if  DESC(CSRC_)  is  -1  on input,

*          and, at least zero and strictly less than NPCOL otherwise.

*

*  -- Written on April 1, 1998 by

*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.

*

*  =====================================================================

*

*     .. Parameters ..

      INTEGER            BLOCK_CYCLIC_2D_INB, CSRC_, CTXT_, DLEN_,

     $                   DTYPE_, IMB_, INB_, LLD_, MB_, M_, NB_, N_,

     $                   RSRC_

      PARAMETER          ( BLOCK_CYCLIC_2D_INB = 2, dlen_ = 11,

     $                   dtype_ = 1, ctxt_ = 2, m_ = 3, n_ = 4,

     $                   imb_ = 5, inb_ = 6, mb_ = 7, nb_ = 8,

     $                   rsrc_ = 9, csrc_ = 10, lld_ = 11 )

*     ..

*     .. Local Scalars ..

      INTEGER            CSRC, I1, ILOCBLK, J1, M1, MB, MYDIST, N1, NB,

     $                   NBLOCKS, RSRC

*     ..

*     .. Local Arrays ..

      INTEGER            DESC2( DLEN_ )

*     ..

*     .. External Subroutines ..

      EXTERNAL           pb_desctrans

*     ..

*     .. Intrinsic Functions ..

      INTRINSIC          min

*     ..

*     .. Executable Statements ..

*

*     Convert descriptor

*

      CALL pb_desctrans( desc, desc2 )

*

      mb   = desc2( mb_ )

      imb1 = desc2( imb_ )

      rsrc = desc2( rsrc_ )

*

      IF( ( rsrc.EQ.-1 ).OR.( nprow.EQ.1 ) ) THEN

*

         ii    = i

         imb1  = imb1 - i + 1

         IF( imb1.LE.0 )

     $      imb1 = ( ( -imb1 ) / mb + 1 ) * mb + imb1

         imb1  = min( imb1, m )

         mp    = m

         prow  = rsrc

         rprow = 0

*

      ELSE

*

*        Figure out PROW, II and IMB1 first

*

         IF( i.LE.imb1 ) THEN

*

            prow = rsrc

*

            IF( myrow.EQ.prow ) THEN

               ii = i

            ELSE

               ii = 1

            END IF

*

            imb1 = imb1 - i + 1

*

         ELSE

*

            i1 = i - imb1 - 1

            nblocks = i1 / mb + 1

            prow = rsrc + nblocks

            prow = prow - ( prow / nprow ) * nprow

*

            IF( myrow.EQ.rsrc ) THEN

*

               ilocblk = nblocks / nprow

*

               IF( ilocblk.GT.0 ) THEN

                  IF( ( ilocblk*nprow ).GE.nblocks ) THEN

                     IF( myrow.EQ.prow ) THEN

                        ii = i + ( ilocblk - nblocks ) * mb

                     ELSE

                        ii = imb1 + ( ilocblk - 1 ) * mb + 1

                     END IF

                  ELSE

                     ii = imb1 + ilocblk * mb + 1

                  END IF

               ELSE

                  ii = imb1 + 1

               END IF

*

            ELSE

*

               mydist = myrow - rsrc

               IF( mydist.LT.0 )

     $            mydist = mydist + nprow

*

               ilocblk = nblocks / nprow

*

               IF( ilocblk.GT.0 ) THEN

                  mydist = mydist - nblocks + ilocblk * nprow

                  IF( mydist.LT.0 ) THEN

                     ii = ( ilocblk + 1 ) * mb + 1

                  ELSE IF( myrow.EQ.prow ) THEN

                     ii = i1 + ( ilocblk - nblocks + 1 ) * mb + 1

                  ELSE

                     ii = ilocblk * mb + 1

                  END IF

               ELSE

                  mydist = mydist - nblocks

                  IF( mydist.LT.0 ) THEN

                     ii = mb + 1

                  ELSE IF( myrow.EQ.prow ) THEN

                     ii = i1 + ( 1 - nblocks ) * mb + 1

                  ELSE

                     ii = 1

                  END IF

               END IF

            END IF

*

            imb1 = nblocks * mb - i1

*

         END IF

*

*        Figure out MP

*

         IF( m.LE.imb1 ) THEN

*

            IF( myrow.EQ.prow ) THEN

               mp = m

            ELSE

               mp = 0

            END IF

*

         ELSE

*

            m1 = m - imb1

            nblocks = m1 / mb + 1

*

            IF( myrow.EQ.prow ) THEN

               ilocblk = nblocks / nprow

               IF( ilocblk.GT.0 ) THEN

                  IF( ( nblocks - ilocblk * nprow ).GT.0 ) THEN

                     mp = imb1 + ilocblk * mb

                  ELSE

                     mp = m + mb * ( ilocblk - nblocks )

                  END IF

               ELSE

                  mp = imb1

               END IF

            ELSE

               mydist = myrow - prow

               IF( mydist.LT.0 )

     $            mydist = mydist + nprow

               ilocblk = nblocks / nprow

               IF( ilocblk.GT.0 ) THEN

                  mydist = mydist - nblocks + ilocblk * nprow

                  IF( mydist.LT.0 ) THEN

                     mp = ( ilocblk + 1 ) * mb

                  ELSE IF( mydist.GT.0 ) THEN

                     mp = ilocblk * mb

                  ELSE

                     mp = m1 + mb * ( ilocblk - nblocks + 1 )

                  END IF

               ELSE

                  mydist = mydist - nblocks

                  IF( mydist.LT.0 ) THEN

                     mp = mb

                  ELSE IF( mydist.GT.0 ) THEN

                     mp = 0

                  ELSE

                     mp = m1 + mb * ( 1 - nblocks )

                  END IF

               END IF

            END IF

*

         END IF

*

         imb1 = min( imb1, m )

         rprow = myrow - prow

         IF( rprow.LT.0 )

     $      rprow = rprow + nprow

*

      END IF

*

      nb   = desc2( nb_ )

      inb1 = desc2( inb_ )

      csrc = desc2( csrc_ )

*

      IF( ( csrc.EQ.-1 ).OR.( npcol.EQ.1 ) ) THEN

*

         jj    = j

         inb1  = inb1 - i + 1

         IF( inb1.LE.0 )

     $      inb1 = ( ( -inb1 ) / nb + 1 ) * nb + inb1

         inb1  = min( inb1, n )

         nq    = n

         pcol  = csrc

         rpcol = 0

*

      ELSE

*

*        Figure out PCOL, JJ and INB1 first

*

         IF( j.LE.inb1 ) THEN

*

            pcol = csrc

*

            IF( mycol.EQ.pcol ) THEN

               jj = j

            ELSE

               jj = 1

            END IF

*

            inb1 = inb1 - j + 1

*

         ELSE

*

            j1 = j - inb1 - 1

            nblocks = j1 / nb + 1

            pcol = csrc + nblocks

            pcol = pcol - ( pcol / npcol ) * npcol

*

            IF( mycol.EQ.csrc ) THEN

*

               ilocblk = nblocks / npcol

*

               IF( ilocblk.GT.0 ) THEN

                  IF( ( ilocblk*npcol ).GE.nblocks ) THEN

                     IF( mycol.EQ.pcol ) THEN

                        jj = j + ( ilocblk - nblocks ) * nb

                     ELSE

                        jj = inb1 + ( ilocblk - 1 ) * nb + 1

                     END IF

                  ELSE

                     jj = inb1 + ilocblk * nb + 1

                  END IF

               ELSE

                  jj = inb1 + 1

               END IF

*

            ELSE

*

               mydist = mycol - csrc

               IF( mydist.LT.0 )

     $            mydist = mydist + npcol

*

               ilocblk = nblocks / npcol

*

               IF( ilocblk.GT.0 ) THEN

                  mydist = mydist - nblocks + ilocblk * npcol

                  IF( mydist.LT.0 ) THEN

                     jj = ( ilocblk + 1 ) * nb + 1

                  ELSE IF( mycol.EQ.pcol ) THEN

                     jj = j1 + ( ilocblk - nblocks + 1 ) * nb + 1

                  ELSE

                     jj = ilocblk * nb + 1

                  END IF

               ELSE

                  mydist = mydist - nblocks

                  IF( mydist.LT.0 ) THEN

                     jj = nb + 1

                  ELSE IF( mycol.EQ.pcol ) THEN

                     jj = j1 + ( 1 - nblocks ) * nb + 1

                  ELSE

                     jj = 1

                  END IF

               END IF

            END IF

*

            inb1 = nblocks * nb - j1

*

         END IF

*

*        Figure out NQ

*

         IF( n.LE.inb1 ) THEN

*

            IF( mycol.EQ.pcol ) THEN

               nq = n

            ELSE

               nq = 0

            END IF

*

         ELSE

*

            n1 = n - inb1

            nblocks = n1 / nb + 1

*

            IF( mycol.EQ.pcol ) THEN

               ilocblk = nblocks / npcol

               IF( ilocblk.GT.0 ) THEN

                  IF( ( nblocks - ilocblk * npcol ).GT.0 ) THEN

                     nq = inb1 + ilocblk * nb

                  ELSE

                     nq = n + nb * ( ilocblk - nblocks )

                  END IF

               ELSE

                  nq = inb1

               END IF

            ELSE

               mydist = mycol - pcol

               IF( mydist.LT.0 )

     $            mydist = mydist + npcol

               ilocblk = nblocks / npcol

               IF( ilocblk.GT.0 ) THEN

                  mydist = mydist - nblocks + ilocblk * npcol

                  IF( mydist.LT.0 ) THEN

                     nq = ( ilocblk + 1 ) * nb

                  ELSE IF( mydist.GT.0 ) THEN

                     nq = ilocblk * nb

                  ELSE

                     nq = n1 + nb * ( ilocblk - nblocks + 1 )

                  END IF

               ELSE

                  mydist = mydist - nblocks

                  IF( mydist.LT.0 ) THEN

                     nq = nb

                  ELSE IF( mydist.GT.0 ) THEN

                     nq = 0

                  ELSE

                     nq = n1 + nb * ( 1 - nblocks )

                  END IF

               END IF

            END IF

*

         END IF

*

         inb1 = min( inb1, n )

         rpcol = mycol - pcol

         IF( rpcol.LT.0 )

     $      rpcol = rpcol + npcol

*

      END IF

*

      RETURN

*

*     End of PB_AINFOG2L

*


      END


      INTEGER FUNCTION pb_numroc( N, I, INB, NB, PROC, SRCPROC, NPROCS )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            I, INB, N, NB, NPROCS, PROC, SRCPROC
*     ..
*
*  Purpose
*  =======
*
*  PB_NUMROC  computes how many of the  N  consecutive rows or columns
*  starting at global index  I  are held by process  PROC.
*
*  Arguments
*  =========
*
*  N       (global input) INTEGER
*          Number of rows/columns being dealt out.  N >= 0.
*
*  I       (global input) INTEGER
*          Global index of the first row/column dealt out.  I >= 1.
*
*  INB     (global input) INTEGER
*          Size of the first block of the global matrix.  INB >= 1.
*
*  NB      (global input) INTEGER
*          Size of the blocks used to partition the rest of the
*          matrix.  NB >= 1.
*
*  PROC    (local input) INTEGER
*          Coordinate of the process whose local share is wanted,
*          0 <= PROC < NPROCS.
*
*  SRCPROC (global input) INTEGER
*          Coordinate of the process owning the first row or column
*          of the matrix.  SRCPROC = -1 means the data is replicated
*          rather than distributed, otherwise 0 <= SRCPROC < NPROCS.
*
*  NPROCS  (global input) INTEGER
*          Number of process rows or columns over which the matrix
*          is distributed.  NPROCS >= 1.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            DIST, FIRST, NBLK, NCYC, NLOC, OFFSET, OWNER,
     $                   REST
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX, MOD
*     ..
*     .. Executable Statements ..
*
      IF( SRCPROC.EQ.-1 .OR. NPROCS.EQ.1 ) THEN
*
*        Replicated data or a single process: PROC gets all N entries
*
         NLOC = N
*
      ELSE
*
*        OWNER is the process holding global index I,  FIRST  is the
*        number of entries from I to the end of the block holding I
*
         IF( I.GT.INB ) THEN
*
*           I lies beyond the first block: count the blocks to skip
*
            OFFSET = I - 1 - INB
            NBLK   = OFFSET / NB + 1
            OWNER  = MOD( SRCPROC + NBLK, NPROCS )
            FIRST  = NBLK*NB - OFFSET
         ELSE
*
*           I lies in the first block, which SRCPROC owns
*
            OWNER = SRCPROC
            FIRST = INB - I + 1
         END IF
*
*        From here on things look as if I = 1 with a first block of
*        size FIRST owned by OWNER
*
         IF( N.LE.FIRST ) THEN
*
*           Everything fits in that first block
*
            IF( PROC.EQ.OWNER ) THEN
               NLOC = N
            ELSE
               NLOC = 0
            END IF
*
         ELSE
*
*           REST entries follow the first block; NBLK counts the
*           blocks spanned so far and NCYC the complete sweeps over
*           the NPROCS processes
*
            REST = N - FIRST
            NBLK = REST / NB + 1
            NCYC = NBLK / NPROCS
*
            IF( PROC.EQ.OWNER ) THEN
*
               IF( NCYC.LE.0 ) THEN
                  NLOC = FIRST
               ELSE IF( NBLK.GT.NCYC*NPROCS ) THEN
                  NLOC = FIRST + NCYC*NB
               ELSE
                  NLOC = N + NB*( NCYC - NBLK )
               END IF
*
            ELSE
*
*              With NCYC clamped at zero the formulas below cover both
*              the "at least one sweep" and the "no sweep" situations
*
               NCYC = MAX( NCYC, 0 )
*
*              Distance from OWNER to PROC going round the processes
*
               DIST = PROC - OWNER
               IF( DIST.LT.0 )
     $            DIST = DIST + NPROCS
*
               DIST = DIST - NBLK + NCYC*NPROCS
               IF( DIST.LT.0 ) THEN
                  NLOC = ( NCYC + 1 )*NB
               ELSE IF( DIST.GT.0 ) THEN
                  NLOC = NCYC*NB
               ELSE
                  NLOC = REST + NB*( NCYC - NBLK + 1 )
               END IF
*
            END IF
*
         END IF
*
      END IF
*
      PB_NUMROC = NLOC
*
      RETURN
*
*     End of PB_NUMROC
*
      END


      SUBROUTINE pb_boot()
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*  Purpose
*  =======
*
*  PB_BOOT  zeroes the accumulated cpu and wall times of all  NTIMER
*  timers, marks every timer as not started and enables PB_TIMER.
*
*  -- Written on April 1, 1998 by
*     R. Clint Whaley, University of Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            NTIMER
      PARAMETER          ( NTIMER = 64 )
      DOUBLE PRECISION   IDLE, NOTIME
      PARAMETER          ( IDLE = -5.0D+0, NOTIME = 0.0D+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            K
*     ..
*     .. Common Blocks ..
      LOGICAL            DISABLED
      DOUBLE PRECISION   CPUSEC, CPUSTART, WALLSEC, WALLSTART
      COMMON /SLTIMER00/ CPUSEC( NTIMER ), WALLSEC( NTIMER ),
     $                   CPUSTART( NTIMER ), WALLSTART( NTIMER ),
     $                   DISABLED
*     ..
*     .. Executable Statements ..
*
*     Clear the accumulated times
*
      DO 10 K = 1, NTIMER
         CPUSEC( K )  = NOTIME
         WALLSEC( K ) = NOTIME
   10 CONTINUE
*
*     Store the "not started" flag value in every start time
*
      DO 20 K = 1, NTIMER
         CPUSTART( K )  = IDLE
         WALLSTART( K ) = IDLE
   20 CONTINUE
*
*     Calls to PB_TIMER are taken into account from now on
*
      DISABLED = .FALSE.
*
      RETURN
*
*     End of PB_BOOT
*
      END

*


      SUBROUTINE pb_timer( I )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            I
*     ..
*
*  Purpose
*  =======
*
*  PB_TIMER  is a cpu/wall  "stopwatch"  measuring seconds.  NTIMER = 64
*  independent timers are available.  Calling the routine for a timer
*  that is not running starts it; calling it again stops it and adds
*  the elapsed interval to the totals of that timer.  While the timer
*  package is disabled every call returns immediately, which allows
*  sections of code to be excluded from the timings even if they call
*  routines containing PB_TIMER calls.
*
*  Arguments
*  =========
*
*  I       (global input) INTEGER
*          On entry, I specifies the timer to start or stop.
*
*  -- Written on April 1, 1998 by
*     R. Clint Whaley, University of Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            NTIMER
      PARAMETER          ( NTIMER = 64 )
      DOUBLE PRECISION   IDLE
      PARAMETER          ( IDLE = -5.0D+0 )
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DCPUTIME00, DWALLTIME00
      EXTERNAL           DCPUTIME00, DWALLTIME00
*     ..
*     .. Common Blocks ..
      LOGICAL            DISABLED
      DOUBLE PRECISION   CPUSEC, CPUSTART, WALLSEC, WALLSTART
      COMMON /SLTIMER00/ CPUSEC( NTIMER ), WALLSEC( NTIMER ),
     $                   CPUSTART( NTIMER ), WALLSTART( NTIMER ),
     $                   DISABLED
*     ..
*     .. Executable Statements ..
*
*     Nothing is done while timing is disabled
*
      IF( .NOT.DISABLED ) THEN
*
         IF( WALLSTART( I ).NE.IDLE ) THEN
*
*           Timer I is running: stop it and accumulate the interval.
*           The wall start time doubles as the "running" indicator,
*           so only that entry is reset.
*
            CPUSEC( I )  = CPUSEC( I ) + DCPUTIME00() - CPUSTART( I )
            WALLSEC( I ) = WALLSEC( I ) + DWALLTIME00() -
     $                     WALLSTART( I )
            WALLSTART( I ) = IDLE
*
         ELSE
*
*           Timer I has not been started: record the start times
*
            WALLSTART( I ) = DWALLTIME00()
            CPUSTART( I )  = DCPUTIME00()
*
         END IF
*
      END IF
*
      RETURN
*
*     End of PB_TIMER
*
      END

*


      SUBROUTINE pb_enable()
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*  Purpose
*  =======
*
*  PB_ENABLE  switches the timer package on:  after this call  PB_TIMER
*  no longer ignores the calls made to it.  The timer values themselves
*  are left untouched.
*
*  -- Written on April 1, 1998 by
*     R. Clint Whaley, University of Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            NTIMER
      PARAMETER          ( NTIMER = 64 )
*     ..
*     .. Common Blocks ..
      LOGICAL            DISABLED
      DOUBLE PRECISION   CPUSEC, CPUSTART, WALLSEC, WALLSTART
      COMMON /SLTIMER00/ CPUSEC( NTIMER ), WALLSEC( NTIMER ),
     $                   CPUSTART( NTIMER ), WALLSTART( NTIMER ),
     $                   DISABLED
*     ..
*     .. Executable Statements ..
*
*     Clear the flag tested on entry to PB_TIMER
*
      DISABLED = .FALSE.
*
      RETURN
*
*     End of PB_ENABLE
*
      END

*


      SUBROUTINE pb_disable()
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*  Purpose
*  =======
*
*  PB_DISABLE  switches the timer package off:  after this call every
*  call to  PB_TIMER  returns without doing anything.  The timer values
*  themselves are left untouched.
*
*  -- Written on April 1, 1998 by
*     R. Clint Whaley, University of Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            NTIMER
      PARAMETER          ( NTIMER = 64 )
*     ..
*     .. Common Blocks ..
      LOGICAL            DISABLED
      DOUBLE PRECISION   CPUSEC, CPUSTART, WALLSEC, WALLSTART
      COMMON /SLTIMER00/ CPUSEC( NTIMER ), WALLSEC( NTIMER ),
     $                   CPUSTART( NTIMER ), WALLSTART( NTIMER ),
     $                   DISABLED
*     ..
*     .. Executable Statements ..
*
*     Raise the flag tested on entry to PB_TIMER
*
      DISABLED = .TRUE.
*
      RETURN
*
*     End of PB_DISABLE
*
      END

*


      DOUBLE PRECISION FUNCTION pb_inquire( TMTYPE, I )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      CHARACTER*1        TMTYPE
      INTEGER            I
*     ..
*
*  Purpose
*  =======
*
*  PB_INQUIRE  returns the wall or cpu time accumulated so far in timer
*  I.  When the requested clock reports the error value -1,  that value
*  is returned instead of the accumulated time.
*
*  Arguments
*  =========
*
*  TMTYPE  (global input) CHARACTER
*          On entry, TMTYPE selects the time to be returned:
*             = 'W': wall clock time,
*             otherwise: CPU time (the default, e.g. 'C').
*
*  I       (global input) INTEGER
*          On entry, I specifies the timer to read.
*
*  -- Written on April 1, 1998 by
*     R. Clint Whaley, University of Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            NTIMER
      PARAMETER          ( NTIMER = 64 )
      DOUBLE PRECISION   ERRFLAG
      PARAMETER          ( ERRFLAG = -1.0D+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            WALL
      DOUBLE PRECISION   PROBE
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      DOUBLE PRECISION   DCPUTIME00, DWALLTIME00
      EXTERNAL           DCPUTIME00, DWALLTIME00, LSAME
*     ..
*     .. Common Blocks ..
      LOGICAL            DISABLED
      DOUBLE PRECISION   CPUSEC, CPUSTART, WALLSEC, WALLSTART
      COMMON /SLTIMER00/ CPUSEC( NTIMER ), WALLSEC( NTIMER ),
     $                   CPUSTART( NTIMER ), WALLSTART( NTIMER ),
     $                   DISABLED
*     ..
*     .. Executable Statements ..
*
*     Read the requested clock once to see whether it is available
*
      WALL = LSAME( TMTYPE, 'W' )
      IF( WALL ) THEN
         PROBE = DWALLTIME00()
      ELSE
         PROBE = DCPUTIME00()
      END IF
*
*     A clock that is not available on this machine answers with the
*     -1 flag, which is then handed back to the caller
*
      IF( PROBE.EQ.ERRFLAG ) THEN
         PB_INQUIRE = ERRFLAG
      ELSE IF( WALL ) THEN
         PB_INQUIRE = WALLSEC( I )
      ELSE
         PB_INQUIRE = CPUSEC( I )
      END IF
*
      RETURN
*
*     End of PB_INQUIRE
*
      END

*


      SUBROUTINE pb_combine( ICTXT, SCOPE, OP, TMTYPE, N, IBEG,
     $                       TIMES )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      CHARACTER*1        OP, SCOPE, TMTYPE
      INTEGER            IBEG, ICTXT, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   TIMES( N )
*     ..
*
*  Purpose
*  =======
*
*  PB_COMBINE  copies the wall or cpu times accumulated in the N timers
*  IBEG, IBEG+1, ..., IBEG+N-1  into  TIMES  and combines these values
*  over the processes of the scope  SCOPE  with a BLACS combine
*  operation selected by  OP.  If the requested clock reports the error
*  value -1, TIMES is filled with -1 and no combine is performed.
*
*  The timer package is disabled while the routine runs; the enabled /
*  disabled state found on entry is restored on every exit path.
*
*  Arguments
*  =========
*
*  ICTXT   (local input) INTEGER
*          On entry, ICTXT specifies the BLACS context handle handed
*          to PB_TOPGET and to the BLACS combine routine.
*
*  SCOPE   (global input) CHARACTER
*          On entry, SCOPE specifies the scope of the combine.  It is
*          passed unchanged to PB_TOPGET and to the BLACS combine
*          routine (see the BLACS documentation for the legal values).
*
*  OP      (global input) CHARACTER
*          On entry, OP selects the combine operation as follows
*             = '<': DGAMN2D is used (minimum),
*             = '+': DGSUM2D is used (sum),
*             otherwise: DGAMX2D is used (maximum, e.g. '>').
*          NOTE: DGAMX2D / DGAMN2D compare absolute values according
*          to the BLACS documentation.
*
*  TMTYPE  (global input) CHARACTER
*          On entry, TMTYPE selects the times to be combined:
*             = 'W': wall clock times,
*             otherwise: CPU times (the default, e.g. 'C').
*
*  N       (global input) INTEGER
*          On entry, N specifies the number of timers to combine.
*
*  IBEG    (global input) INTEGER
*          On entry, IBEG specifies the index of the first timer to
*          combine.  Timers IBEG to IBEG+N-1 are read; no check is
*          made that they lie between 1 and NTIMER.
*
*  TIMES   (local output) DOUBLE PRECISION array of dimension N
*          On exit, TIMES( K ) holds the combined value of timer
*          IBEG+K-1, or -1 if the requested clock is not available.
*
*  -- Written on April 1, 1998 by
*     R. Clint Whaley, University of Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            NTIMER
      PARAMETER          ( NTIMER = 64 )
      DOUBLE PRECISION   ERRFLAG
      PARAMETER          ( ERRFLAG = -1.0D+0 )
*     ..
*     .. Local Scalars ..
      CHARACTER*1        TOP
      LOGICAL            AVAIL, TMPDIS
      INTEGER            I
*     ..
*     .. External Subroutines ..
      EXTERNAL           DGAMX2D, DGAMN2D, DGSUM2D, PB_TOPGET
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      DOUBLE PRECISION   DCPUTIME00, DWALLTIME00
      EXTERNAL           DCPUTIME00, DWALLTIME00, LSAME
*     ..
*     .. Common Blocks ..
      LOGICAL            DISABLED
      DOUBLE PRECISION   CPUSEC( NTIMER ), CPUSTART( NTIMER ),
     $                   WALLSEC( NTIMER ), WALLSTART( NTIMER )
      COMMON /SLTIMER00/ CPUSEC, WALLSEC, CPUSTART, WALLSTART, DISABLED
*     ..
*     .. Executable Statements ..
*
*     Disable timer for combine operation, remembering the old state
*
      TMPDIS = DISABLED
      DISABLED = .TRUE.
*
*     Copy timer information into user's times array.  AVAIL tells
*     whether the requested clock exists on this machine (a clock
*     that does not exist answers with the -1 flag).
*
      IF( LSAME( TMTYPE, 'W' ) ) THEN
         AVAIL = DWALLTIME00().NE.ERRFLAG
         IF( AVAIL ) THEN
            DO 10 I = 1, N
               TIMES( I ) = WALLSEC( IBEG + I - 1 )
   10       CONTINUE
         END IF
      ELSE
         AVAIL = DCPUTIME00().NE.ERRFLAG
         IF( AVAIL ) THEN
            DO 20 I = 1, N
               TIMES( I ) = CPUSEC( IBEG + I - 1 )
   20       CONTINUE
         END IF
      END IF
*
      IF( AVAIL ) THEN
*
*        Combine all nodes' information.  The BLACS argument lists
*        are those of the original code; RDEST = -1 presumably leaves
*        the result on every process of the scope (see BLACS docs).
*
         CALL PB_TOPGET( ICTXT, 'Combine', SCOPE, TOP )
         IF( OP.EQ.'<' ) THEN
            CALL DGAMN2D( ICTXT, SCOPE, TOP, N, 1, TIMES, N, -1, -1,
     $                    -1, -1, 0 )
         ELSE IF( OP.EQ.'+' ) THEN
            CALL DGSUM2D( ICTXT, SCOPE, TOP, N, 1, TIMES, N, -1, 0 )
         ELSE
            CALL DGAMX2D( ICTXT, SCOPE, TOP, N, 1, TIMES, N, -1, -1,
     $                    -1, -1, 0 )
         END IF
*
      ELSE
*
*        Clock not available: fill in times with the -1 flag
*
         DO 30 I = 1, N
            TIMES( I ) = ERRFLAG
   30    CONTINUE
*
      END IF
*
*     Restore the timer state on every path.  The early returns of
*     the previous version skipped this and left timing disabled.
*
      DISABLED = TMPDIS
*
      RETURN
*
*     End of PB_COMBINE
*
      END


      SUBROUTINE pb_chkmat( ICTXT, M, MPOS0, N, NPOS0, IA, JA, DESCA,
     $                      DPOS0, INFO )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            DPOS0, IA, ICTXT, INFO, JA, M, MPOS0, N, NPOS0
*     ..
*     .. Array Arguments ..
      INTEGER            DESCA( * )
*     ..
*
*  Purpose
*  =======
*
*  PB_CHKMAT  checks the validity of a descriptor vector  DESCA, the re-
*  lated global indexes  IA, JA from a local view point. If an inconsis-
*  tency is found among its parameters IA, JA and DESCA, the routine re-
*  turns an error code in INFO.
*
*  When several errors are found, the one with the smallest position
*  (argument position times 100, plus the descriptor entry if any) is
*  reported; an error already present in INFO on entry takes part in
*  that comparison.
*
*  Arguments
*  =========
*
*  ICTXT   (local input) INTEGER
*          On entry,  ICTXT  specifies the BLACS context handle, indica-
*          ting the global  context of the operation. The context itself
*          is global, but the value of ICTXT is local.
*
*  M       (global input) INTEGER
*          On entry,  M  specifies  the  number  of  rows  the submatrix
*          sub( A ).
*
*  MPOS0   (global input) INTEGER
*          On entry,  MPOS0  specifies the  position in the calling rou-
*          tine's parameter list where the formal parameter M appears.
*
*  N       (global input) INTEGER
*          On entry,  N  specifies  the  number of columns the submatrix
*          sub( A ).
*
*  NPOS0   (global input) INTEGER
*          On entry,  NPOS0  specifies the  position in the calling rou-
*          tine's parameter list where the formal parameter N appears.
*
*  IA      (global input) INTEGER
*          On entry, IA  specifies A's global row index, which points to
*          the beginning of the submatrix sub( A ).
*
*  JA      (global input) INTEGER
*          On entry, JA  specifies A's global column index, which points
*          to the beginning of the submatrix sub( A ).
*
*  DESCA   (global and local input) INTEGER array
*          On entry, DESCA  is an integer array of dimension DLEN_. This
*          is the array descriptor for the matrix A.  It is converted
*          with PB_DESCTRANS before being examined.
*
*  DPOS0   (global input) INTEGER
*          On entry,  DPOS0  specifies the  position in the calling rou-
*          tine's parameter list where the formal  parameter  DESCA  ap-
*          pears.  Note that it is assumed that  IA and JA are respecti-
*          vely 2 and 1 entries behind DESCA.
*
*  INFO    (local input/local output) INTEGER
*          = 0:  successful exit
*          < 0:  If the i-th argument is an array and the j-entry had an
*                illegal  value,  then  INFO = -(i*100+j),  if  the i-th
*                argument is a  scalar  and had an  illegal  value, then
*                INFO = -i.
*
*  -- Written on April 1, 1998 by
*     R. Clint Whaley, University of Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            BLOCK_CYCLIC_2D_INB, CSRC_, CTXT_, DLEN_,
     $                   DTYPE_, IMB_, INB_, LLD_, MB_, M_, NB_, N_,
     $                   RSRC_
      PARAMETER          ( BLOCK_CYCLIC_2D_INB = 2, DLEN_ = 11,
     $                   DTYPE_ = 1, CTXT_ = 2, M_ = 3, N_ = 4,
     $                   IMB_ = 5, INB_ = 6, MB_ = 7, NB_ = 8,
     $                   RSRC_ = 9, CSRC_ = 10, LLD_ = 11 )
      INTEGER            DESCMULT, BIGNUM
      PARAMETER          ( DESCMULT = 100, BIGNUM = DESCMULT*DESCMULT )
*     ..
*     .. Local Scalars ..
      LOGICAL            BLKOK
      INTEGER            DPOS, IAPOS, JAPOS, MP, MPOS, MYCOL, MYROW,
     $                   NPCOL, NPOS, NPROW, NQ
*     ..
*     .. Local Arrays ..
      INTEGER            DESCA2( DLEN_ )
*     ..
*     .. External Subroutines ..
      EXTERNAL           BLACS_GRIDINFO, PB_DESCTRANS
*     ..
*     .. External Functions ..
      INTEGER            PB_NUMROC
      EXTERNAL           PB_NUMROC
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX, MIN, MOD
*     ..
*     .. Executable Statements ..
*
*     Convert descriptor
*
      CALL PB_DESCTRANS( DESCA, DESCA2 )
*
*     Want to find errors with MIN( ), so if no error, set it to a big
*     number.  If there already is an error, multiply by the des-
*     criptor multiplier
*
      IF( INFO.GE.0 ) THEN
         INFO = BIGNUM
      ELSE IF( INFO.LT.-DESCMULT ) THEN
         INFO = -INFO
      ELSE
         INFO = -INFO * DESCMULT
      END IF
*
*     Figure where in parameter list each parameter was, factoring in
*     descriptor multiplier
*
      MPOS  = MPOS0 * DESCMULT
      NPOS  = NPOS0 * DESCMULT
      IAPOS = ( DPOS0 - 2 ) * DESCMULT
      JAPOS = ( DPOS0 - 1 ) * DESCMULT
      DPOS  = DPOS0 * DESCMULT
*
*     Get grid parameters
*
      CALL BLACS_GRIDINFO( ICTXT, NPROW, NPCOL, MYROW, MYCOL )
*
*     Check that matrix values make sense from local viewpoint
*
      IF( M.LT.0 )
     $   INFO = MIN( INFO, MPOS )
      IF( N.LT.0 )
     $   INFO = MIN( INFO, NPOS )
      IF( IA.LT.1 )
     $   INFO = MIN( INFO, IAPOS )
      IF( JA.LT.1 )
     $   INFO = MIN( INFO, JAPOS )
      IF( DESCA2( DTYPE_ ).NE.BLOCK_CYCLIC_2D_INB )
     $   INFO = MIN( INFO, DPOS + DTYPE_ )
      IF( DESCA2( IMB_ ).LT.1 )
     $   INFO = MIN( INFO, DPOS + IMB_ )
      IF( DESCA2( INB_ ).LT.1 )
     $   INFO = MIN( INFO, DPOS + INB_ )
      IF( DESCA2( MB_ ).LT.1 )
     $   INFO = MIN( INFO, DPOS + MB_ )
      IF( DESCA2( NB_ ).LT.1 )
     $   INFO = MIN( INFO, DPOS + NB_ )
      IF( DESCA2( RSRC_ ).LT.-1 .OR. DESCA2( RSRC_ ).GE.NPROW )
     $   INFO = MIN( INFO, DPOS + RSRC_ )
      IF( DESCA2( CSRC_ ).LT.-1 .OR. DESCA2( CSRC_ ).GE.NPCOL )
     $   INFO = MIN( INFO, DPOS + CSRC_ )
      IF( DESCA2( CTXT_ ).NE.ICTXT )
     $   INFO = MIN( INFO, DPOS + CTXT_ )
*
      IF( M.EQ.0 .OR. N.EQ.0 ) THEN
*
*        NULL matrix, relax some checks
*
         IF( DESCA2( M_ ).LT.0 )
     $      INFO = MIN( INFO, DPOS + M_ )
         IF( DESCA2( N_ ).LT.0 )
     $      INFO = MIN( INFO, DPOS + N_ )
         IF( DESCA2( LLD_ ).LT.1 )
     $      INFO = MIN( INFO, DPOS + LLD_ )
*
      ELSE
*
*        more rigorous checks for non-degenerate matrices
*
         IF( DESCA2( M_ ).LT.1 )
     $      INFO = MIN( INFO, DPOS + M_ )
         IF( DESCA2( N_ ).LT.1 )
     $      INFO = MIN( INFO, DPOS + N_ )
         IF( IA.GT.DESCA2( M_ ) )
     $      INFO = MIN( INFO, IAPOS )
         IF( JA.GT.DESCA2( N_ ) )
     $      INFO = MIN( INFO, JAPOS )
         IF( IA+M-1.GT.DESCA2( M_ ) )
     $      INFO = MIN( INFO, MPOS )
         IF( JA+N-1.GT.DESCA2( N_ ) )
     $      INFO = MIN( INFO, NPOS )
*
*        The leading dimension test needs the local sizes computed by
*        PB_NUMROC, which divides by the blocking factors.  It is
*        therefore only made when IMB_, INB_, MB_ and NB_ are all
*        valid: a zero blocking factor would otherwise cause a divi-
*        sion by zero in this very checking routine.  Skipping the
*        test cannot change INFO, because an invalid blocking factor
*        has already been recorded above at a descriptor entry
*        (5 to 8) smaller than LLD_ (11).
*
         BLKOK = DESCA2( IMB_ ).GE.1 .AND. DESCA2( MB_ ).GE.1 .AND.
     $           DESCA2( INB_ ).GE.1 .AND. DESCA2( NB_ ).GE.1
*
         IF( BLKOK ) THEN
*
            MP = PB_NUMROC( DESCA2( M_ ), 1, DESCA2( IMB_ ),
     $                      DESCA2( MB_ ), MYROW, DESCA2( RSRC_ ),
     $                      NPROW )
*
*           LLD_ may only be smaller than the local number of rows
*           when this process owns no column, and never less than 1
*
            IF( DESCA2( LLD_ ).LT.MAX( 1, MP ) ) THEN
               NQ = PB_NUMROC( DESCA2( N_ ), 1, DESCA2( INB_ ),
     $                         DESCA2( NB_ ), MYCOL, DESCA2( CSRC_ ),
     $                         NPCOL )
               IF( DESCA2( LLD_ ).LT.1 ) THEN
                  INFO = MIN( INFO, DPOS + LLD_ )
               ELSE IF( NQ.GT.0 ) THEN
                  INFO = MIN( INFO, DPOS + LLD_ )
               END IF
            END IF
*
         END IF
*
      END IF
*
*     Prepare output: set info = 0 if no error, and divide by
*     DESCMULT if error is not in a descriptor entry
*
      IF( INFO.EQ.BIGNUM ) THEN
         INFO = 0
      ELSE IF( MOD( INFO, DESCMULT ).EQ.0 ) THEN
         INFO = -( INFO / DESCMULT )
      ELSE
         INFO = -INFO
      END IF
*
      RETURN
*
*     End of PB_CHKMAT
*
      END


      SUBROUTINE pb_desctrans( DESCIN, DESCOUT )

*

*  -- PBLAS test routine (version 2.0) --

*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,

*     and University of California, Berkeley.

*     April 1, 1998

*

*     .. Array Arguments ..

      INTEGER            DESCIN( * ), DESCOUT( * )

*     ..

*

*  Purpose

*  =======

*

*  PB_DESCTRANS  converts  a  descriptor  DESCIN of type BLOCK_CYCLIC_2D

*  or   BLOCK_CYCLIC_INB_2D   into   a   descriptor   DESCOUT   of  type

*  BLOCK_CYCLIC_INB_2D.

*

*  Notes

*  =====

*

*  A description  vector  is associated with each 2D block-cyclicly dis-

*  tributed matrix.  This  vector  stores  the  information required  to

*  establish the  mapping between a matrix entry and  its  corresponding

*  process and memory location.

*

*  In  the  following  comments,  the  character _  should  be  read  as

*  "of the distributed  matrix".  Let  A  be a generic term for  any  2D

*  block cyclicly distributed matrix.  Its description vector is DESCA:

*

*  NOTATION         STORED IN        EXPLANATION

*  ---------------- ---------------  -----------------------------------

*  DTYPE_A (global) DESCA( DTYPE1_ ) The descriptor type.

*  CTXT_A  (global) DESCA( CTXT1_  ) The BLACS context handle indicating

*                                    the   NPROW x NPCOL  BLACS  process

*                                    grid  A  is  distributed  over. The

*                                    context  itself  is global, but the

*                                    handle   (the  integer  value)  may

*                                    vary.

*  M_A     (global) DESCA( M1_     ) The  number  of rows in the distri-

*                                    buted matrix A, M_A >= 0.

*  N_A     (global) DESCA( N1_     ) The  number  of columns in the dis-

*                                    tributed matrix A, N_A >= 0.

*  MB_A    (global) DESCA( MB1_    ) The blocking factor used to distri-

*                                    bute the rows of A, MB_A > 0.

*  NB_A    (global) DESCA( NB1_    ) The blocking factor used to distri-

*                                    bute the columns of A, NB_A > 0.

*  RSRC_A  (global) DESCA( RSRC1_  ) The  process  row  over  which  the

*                                    first row of the matrix  A  is dis-

*                                    tributed, NPROW > RSRC_A >= 0.

*  CSRC_A  (global) DESCA( CSRC1_  ) The process column  over  which the

*                                    first column of  A  is distributed.

*                                    NPCOL > CSRC_A >= 0.

*  LLD_A   (local)  DESCA( LLD1_   ) The leading dimension  of the local

*                                    array  storing  the local blocks of

*                                    the distributed matrix A,

*                                    IF( Lc( 1, N_A ) > 0 )

*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )

*                                    ELSE

*                                      LLD_A >= 1.

*

*  Let K be the number of  rows of a matrix A starting at the global in-

*  dex IA,i.e, A( IA:IA+K-1, : ). Lr( IA, K ) denotes the number of rows

*  that the process of row coordinate MYROW ( 0 <= MYROW < NPROW ) would

*  receive if these K rows were distributed over NPROW processes.  If  K

*  is the number of columns of a matrix  A  starting at the global index

*  JA, i.e., A( :, JA:JA+K-1 ),  Lc( JA, K )  denotes the number of co-

*  lumns that the process MYCOL ( 0 <= MYCOL < NPCOL ) would  receive if

*  these K columns were distributed over NPCOL processes.

*

*  The values of Lr() and Lc() may be determined via a call to the func-

*  tion PB_NUMROC:

*  Lr( IA, K ) = PB_NUMROC( K, IA, MB_A, MB_A, MYROW, RSRC_A, NPROW )

*  Lc( JA, K ) = PB_NUMROC( K, JA, NB_A, NB_A, MYCOL, CSRC_A, NPCOL )

*

*  A description  vector  is associated with each 2D block-cyclicly dis-

*  tributed matrix.  This  vector  stores  the  information  required to

*  establish the  mapping  between a  matrix entry and its corresponding

*  process and memory location.

*

*  In  the  following  comments,   the character _  should  be  read  as

*  "of  the  distributed  matrix".  Let  A  be a generic term for any 2D

*  block cyclicly distributed matrix.  Its description vector is DESCA:

*

*  NOTATION         STORED IN       EXPLANATION

*  ---------------- --------------- ------------------------------------

*  DTYPE_A (global) DESCA( DTYPE_ ) The descriptor type.

*  CTXT_A  (global) DESCA( CTXT_  ) The BLACS context handle, indicating

*                                   the NPROW x NPCOL BLACS process grid

*                                   A  is distributed over.  The context

*                                   itself  is  global,  but  the handle

*                                   (the integer value) may vary.

*  M_A     (global) DESCA( M_     ) The  number of rows in the distribu-

*                                   ted matrix A, M_A >= 0.

*  N_A     (global) DESCA( N_     ) The number of columns in the distri-

*                                   buted matrix A, N_A >= 0.

*  IMB_A   (global) DESCA( IMB_   ) The number of rows of the upper left

*                                   block of the matrix A, IMB_A > 0.

*  INB_A   (global) DESCA( INB_   ) The  number  of columns of the upper

*                                   left   block   of   the   matrix  A,

*                                   INB_A > 0.

*  MB_A    (global) DESCA( MB_    ) The blocking factor used to  distri-

*                                   bute the last  M_A-IMB_A rows of  A,

*                                   MB_A > 0.

*  NB_A    (global) DESCA( NB_    ) The blocking factor used to  distri-

*                                   bute the last  N_A-INB_A  columns of

*                                   A, NB_A > 0.

*  RSRC_A  (global) DESCA( RSRC_  ) The process row over which the first

*                                   row of the matrix  A is distributed,

*                                   NPROW > RSRC_A >= 0.

*  CSRC_A  (global) DESCA( CSRC_  ) The  process  column  over which the

*                                   first  column of  A  is distributed.

*                                   NPCOL > CSRC_A >= 0.

*  LLD_A   (local)  DESCA( LLD_   ) The  leading  dimension of the local

*                                   array  storing  the  local blocks of

*                                   the distributed matrix A,

*                                   IF( Lc( 1, N_A ) > 0 )

*                                      LLD_A >= MAX( 1, Lr( 1, M_A ) )

*                                   ELSE

*                                      LLD_A >= 1.

*

*  Let K be the number of  rows of a matrix A starting at the global in-

*  dex IA,i.e, A( IA:IA+K-1, : ). Lr( IA, K ) denotes the number of rows

*  that the process of row coordinate MYROW ( 0 <= MYROW < NPROW ) would

*  receive if these K rows were distributed over NPROW processes.  If  K

*  is the number of columns of a matrix  A  starting at the global index

*  JA, i.e., A( :, JA:JA+K-1 ),  Lc( JA, K )  denotes the number of co-

*  lumns that the process MYCOL ( 0 <= MYCOL < NPCOL ) would  receive if

*  these K columns were distributed over NPCOL processes.

*

*  The values of Lr() and Lc() may be determined via a call to the func-

*  tion PB_NUMROC:

*  Lr( IA, K ) = PB_NUMROC( K, IA, IMB_A, MB_A, MYROW, RSRC_A, NPROW )

*  Lc( JA, K ) = PB_NUMROC( K, JA, INB_A, NB_A, MYCOL, CSRC_A, NPCOL )

*

*  Arguments

*  =========

*

*  DESCIN  (global and local input) INTEGER array

*          On entry, DESCIN  is an array of dimension DLEN1_ or DLEN_ as

*          specified by its first entry DESCIN( DTYPE_ ).  DESCIN is the

*          source  array  descriptor of type BLOCK_CYCLIC_2D  or of type

*          BLOCK_CYCLIC_2D_INB.

*

*  DESCOUT (global and local output) INTEGER array

*          On entry, DESCOUT is an array of dimension DLEN_.  DESCOUT is

*          the target array descriptor of type BLOCK_CYCLIC_2D_INB.

*

*  -- Written on April 1, 1998 by

*     R. Clint Whaley, University of Tennessee, Knoxville 37996, USA.

*

*  =====================================================================

*

*     .. Parameters ..

      INTEGER            BLOCK_CYCLIC_2D, CSRC1_, CTXT1_, DLEN1_,

     $                   DTYPE1_, LLD1_, M1_, MB1_, N1_, NB1_, RSRC1_

      PARAMETER          ( BLOCK_CYCLIC_2D = 1, dlen1_ = 9, dtype1_ = 1,

     $                   ctxt1_ = 2, m1_ = 3, n1_ = 4, mb1_ = 5,

     $                   nb1_ = 6, rsrc1_ = 7, csrc1_ = 8, lld1_ = 9 )

      INTEGER            BLOCK_CYCLIC_2D_INB, CSRC_, CTXT_, DLEN_,

     $                   DTYPE_, IMB_, INB_, LLD_, MB_, M_, NB_, N_,

     $                   RSRC_

      PARAMETER          ( BLOCK_CYCLIC_2D_INB = 2, dlen_ = 11,

     $                   dtype_ = 1, ctxt_ = 2, m_ = 3, n_ = 4,

     $                   imb_ = 5, inb_ = 6, mb_ = 7, nb_ = 8,

     $                   rsrc_ = 9, csrc_ = 10, lld_ = 11 )

*     ..

*     .. Local Scalars ..

      INTEGER            I

*     ..

*     .. Executable Statements ..

*

      IF( descin( dtype_ ).EQ.block_cyclic_2d ) THEN

         descout( dtype_ ) = block_cyclic_2d_inb

         descout( ctxt_  ) = descin( ctxt1_ )

         descout( m_     ) = descin( m1_    )

         descout( n_     ) = descin( n1_    )

         descout( imb_   ) = descin( mb1_   )

         descout( inb_   ) = descin( nb1_   )

         descout( mb_    ) = descin( mb1_   )

         descout( nb_    ) = descin( nb1_   )

         descout( rsrc_  ) = descin( rsrc1_ )

         descout( csrc_  ) = descin( csrc1_ )

         descout( lld_   ) = descin( lld1_  )

      ELSE IF( descin( dtype_ ).EQ.block_cyclic_2d_inb ) THEN

         DO 10 i = 1, dlen_

            descout( i ) = descin( i )

   10    CONTINUE

      ELSE

         descout( dtype_ ) = descin( 1 )

         descout( ctxt_  ) = descin( 2 )

         descout( m_     ) = 0

         descout( n_     ) = 0

         descout( imb_   ) = 1

         descout( inb_   ) = 1

         descout( mb_    ) = 1

         descout( nb_    ) = 1

         descout( rsrc_  ) = 0

         descout( csrc_  ) = 0

         descout( lld_   ) = 1

      END IF

*

      RETURN

*

*     End of PB_DESCTRANS

*


      END


      SUBROUTINE pb_descset2( DESC, M, N, IMB, INB, MB, NB, RSRC, CSRC,
     $                        CTXT, LLD )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            CSRC, CTXT, IMB, INB, LLD, M, MB, N, NB, RSRC
*     ..
*     .. Array Arguments ..
      INTEGER            DESC( * )
*     ..
*
*  Purpose
*  =======
*
*  PB_DESCSET2  stores its ten scalar inputs  M, N, IMB, INB, MB, NB,
*  RSRC, CSRC, CTXT and LLD into DESC, together with the descriptor
*  type tag, producing a descriptor of type BLOCK_CYCLIC_2D_INB.
*
*  The values are copied verbatim: nothing is checked or adjusted and
*  no other routine is called.
*
*  Notes
*  =====
*
*  Layout of the descriptor written by this routine:
*
*  ENTRY           INDEX  VALUE STORED
*  --------------  -----  ---------------------------------------------
*  DESC( DTYPE_ )     1   BLOCK_CYCLIC_2D_INB ( = 2 ), the type tag.
*  DESC( CTXT_  )     2   CTXT, the BLACS context handle.
*  DESC( M_     )     3   M,    the number of rows of the matrix.
*  DESC( N_     )     4   N,    the number of columns of the matrix.
*  DESC( IMB_   )     5   IMB,  the row size of the first block.
*  DESC( INB_   )     6   INB,  the column size of the first block.
*  DESC( MB_    )     7   MB,   the row blocking factor.
*  DESC( NB_    )     8   NB,   the column blocking factor.
*  DESC( RSRC_  )     9   RSRC, the process row owning the first row.
*  DESC( CSRC_  )    10   CSRC, the process column owning the first
*                         column.
*  DESC( LLD_   )    11   LLD,  the leading dimension of the local
*                         array.
*
*  Arguments
*  =========
*
*  DESC    (global and local output) INTEGER array
*          Array of dimension at least DLEN_ ( = 11 ). On exit, its
*          first DLEN_ entries hold the descriptor laid out as shown
*          above.
*
*  M       (global input) INTEGER
*          The number of rows of the matrix.  The caller is expected
*          to pass M >= 0; this is not verified here.
*
*  N       (global input) INTEGER
*          The number of columns of the matrix.  The caller is expected
*          to pass N >= 0; this is not verified here.
*
*  IMB     (global input) INTEGER
*          The row size of the first block of the global matrix dis-
*          tribution.  Expected to be at least one (not verified).
*
*  INB     (global input) INTEGER
*          The column size of the first block of the global matrix
*          distribution.  Expected to be at least one (not verified).
*
*  MB      (global input) INTEGER
*          The row size of the blocks used to partition the matrix.
*          Expected to be at least one (not verified).
*
*  NB      (global input) INTEGER
*          The column size of the blocks used to partition the matrix.
*          Expected to be at least one (not verified).
*
*  RSRC    (global input) INTEGER
*          The row coordinate of the process that possesses the first
*          row of the matrix.  RSRC = -1 denotes replicated rather than
*          distributed data;  otherwise RSRC is expected to satisfy
*          0 <= RSRC < NPROW (not verified).
*
*  CSRC    (global input) INTEGER
*          The column coordinate of the process that possesses the
*          first column of the matrix.  CSRC = -1 denotes replicated
*          rather than distributed data;  otherwise CSRC is expected to
*          satisfy 0 <= CSRC < NPCOL (not verified).
*
*  CTXT    (local input) INTEGER
*          The BLACS context handle, indicating the global communica-
*          tion context.  The value of the handle itself is local.
*
*  LLD     (local input)  INTEGER
*          The leading dimension of the local array storing the local
*          entries of the matrix.  Expected to be at least
*          MAX( 1, Lr(1,M) ), where Lr(1,M) is the number of rows of
*          the matrix owned locally (not verified).
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
*     Descriptor type tag and descriptor length
      INTEGER            BLOCK_CYCLIC_2D_INB, DLEN_
      PARAMETER          ( BLOCK_CYCLIC_2D_INB = 2, dlen_ = 11 )
*     Positions of the individual entries inside the descriptor
      INTEGER            DTYPE_, CTXT_, M_, N_, IMB_, INB_, MB_, NB_,
     $                   RSRC_, CSRC_, LLD_
      PARAMETER          ( dtype_ = 1, ctxt_ = 2, m_ = 3, n_ = 4,
     $                   imb_ = 5, inb_ = 6, mb_ = 7, nb_ = 8,
     $                   rsrc_ = 9, csrc_ = 10, lld_ = 11 )
*     ..
*     .. Executable Statements ..
*
*     Type tag and BLACS context
*
      desc( dtype_ ) = block_cyclic_2d_inb
      desc( ctxt_  ) = ctxt
*
*     Global matrix dimensions
*
      desc( m_     ) = m
      desc( n_     ) = n
*
*     First-block sizes followed by the regular blocking factors
*
      desc( imb_   ) = imb
      desc( inb_   ) = inb
      desc( mb_    ) = mb
      desc( nb_    ) = nb
*
*     Coordinates of the process owning the first matrix entry
*
      desc( rsrc_  ) = rsrc
      desc( csrc_  ) = csrc
*
*     Leading dimension of the local array
*
      desc( lld_   ) = lld
*
*     End of PB_DESCSET2
*
      END


      SUBROUTINE pb_descinit2( DESC, M, N, IMB, INB, MB, NB, RSRC, CSRC,
     $                         CTXT, LLD, INFO )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            CSRC, CTXT, IMB, INB, INFO, LLD, M, MB, N, NB,
     $                   rsrc
*     ..
*     .. Array Arguments ..
      INTEGER            DESC( * )
*     ..
*
*  Purpose
*  =======
*
*  PB_DESCINIT2  validates its ten input arguments  M, N, IMB, INB, MB,
*  NB, RSRC, CSRC, CTXT and LLD  against the process grid attached to
*  CTXT  and uses them to initialize a descriptor vector of type
*  BLOCK_CYCLIC_2D_INB.
*
*  The descriptor is always written.  An argument that fails its check
*  is reported through INFO and PXERBLA, and a clamped value is stored
*  in its place (see the second Notes section below).
*
*  Notes
*  =====
*
*  Layout of the descriptor written by this routine:
*
*  ENTRY           INDEX  VALUE STORED
*  --------------  -----  ---------------------------------------------
*  DESC( DTYPE_ )     1   BLOCK_CYCLIC_2D_INB ( = 2 ), the type tag.
*  DESC( CTXT_  )     2   CTXT, the BLACS context handle.
*  DESC( M_     )     3   MAX( 0, M ),   number of rows.
*  DESC( N_     )     4   MAX( 0, N ),   number of columns.
*  DESC( IMB_   )     5   MAX( 1, IMB ), row size of the first block.
*  DESC( INB_   )     6   MAX( 1, INB ), column size of the first
*                         block.
*  DESC( MB_    )     7   MAX( 1, MB ),  row blocking factor.
*  DESC( NB_    )     8   MAX( 1, NB ),  column blocking factor.
*  DESC( RSRC_  )     9   MAX( -1, MIN( RSRC, NPROW-1 ) ), process row
*                         owning the first row.
*  DESC( CSRC_  )    10   MAX( -1, MIN( CSRC, NPCOL-1 ) ), process
*                         column owning the first column.
*  DESC( LLD_   )    11   MAX( LLD, LLDMIN ), leading dimension of the
*                         local array (LLDMIN is defined below).
*
*  NPROW and NPCOL are the grid dimensions returned by BLACS_GRIDINFO
*  for CTXT; MYROW and MYCOL are the coordinates of the calling process
*  returned by the same call.
*
*  When every argument preceding LLD is valid, the minimum leading
*  dimension is
*
*     IF( PB_NUMROC( N, 1, INB, NB, MYCOL, CSRC, NPCOL ) > 0 )
*        LLDMIN = MAX( 1, PB_NUMROC( M, 1, IMB, MB, MYROW, RSRC,
*                                    NPROW ) )
*     ELSE
*        LLDMIN = 1
*
*  Otherwise PB_NUMROC is not called and LLDMIN = 1.
*
*  Arguments
*  =========
*
*  DESC    (global and local output) INTEGER array
*          Array of dimension at least DLEN_ ( = 11 ). On exit, its
*          first DLEN_ entries hold the descriptor laid out as shown
*          above.
*
*  M       (global input) INTEGER
*          On entry,  M  specifies  the  number  of  rows of the matrix.
*          M must be at least zero.
*
*  N       (global input) INTEGER
*          On entry,  N  specifies  the number of columns of the matrix.
*          N must be at least zero.
*
*  IMB     (global input) INTEGER
*          On entry,  IMB  specifies  the row size of the first block of
*          the global matrix distribution. IMB must be at least one.
*
*  INB     (global input) INTEGER
*          On entry,  INB  specifies  the column size of the first block
*          of the global matrix distribution. INB must be at least one.
*
*  MB      (global input) INTEGER
*          On entry,  MB  specifies  the  row size of the blocks used to
*          partition the matrix. MB must be at least one.
*
*  NB      (global input) INTEGER
*          On entry, NB  specifies the column size of the blocks used to
*          partition the matrix. NB must be at least one.
*
*  RSRC    (global input) INTEGER
*          On entry,  RSRC  specifies  the row coordinate of the process
*          that possesses the first row of the matrix.  When  RSRC = -1,
*          the data is not  distributed but replicated,  otherwise  RSRC
*          must be at least zero and strictly less than NPROW.
*
*  CSRC    (global input) INTEGER
*          On entry,  CSRC  specifies  the column coordinate of the pro-
*          cess  that  possesses  the  first column of the matrix.  When
*          CSRC = -1, the data is not distributed but replicated, other-
*          wise CSRC must be at least zero and strictly less than NPCOL.
*
*  CTXT    (local input) INTEGER
*          On entry, CTXT specifies the BLACS context handle, indicating
*          the global  communication  context.  The value of the context
*          itself is local.  CTXT is rejected when BLACS_GRIDINFO re-
*          turns NPROW = -1 for it.
*
*  LLD     (local input)  INTEGER
*          On entry, LLD  specifies  the  leading dimension of the local
*          array storing the local entries of the matrix. LLD must be at
*          least LLDMIN as defined in the Notes above.
*
*  INFO    (local output) INTEGER
*          = 0: successful exit
*          < 0: if INFO = -i, the i-th argument had an illegal value.
*          Only the first failing check is reported. The checks are
*          made in the order  M, N, IMB, INB, MB, NB, CTXT, RSRC, CSRC
*          and finally LLD.  CTXT is tested before RSRC and CSRC be-
*          cause those two are validated against the grid dimensions
*          obtained from CTXT.
*
*  Notes
*  =====
*
*  If the routine can recover from an erroneous input argument,  it will
*  return an acceptable descriptor vector.  For example,  if LLD = 0  on
*  input, DESC( LLD_ ) will  contain  the smallest leading dimension re-
*  quired to store the specified m by n matrix, INFO will however be set
*  to -11 on exit in that case.  If an earlier argument is illegal, the
*  required leading dimension is not computed  and  DESC( LLD_ )  is set
*  to MAX( LLD, 1 ).
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            BLOCK_CYCLIC_2D_INB, CSRC_, CTXT_, DLEN_,
     $                   DTYPE_, IMB_, INB_, LLD_, MB_, M_, NB_, N_,
     $                   RSRC_
      PARAMETER          ( BLOCK_CYCLIC_2D_INB = 2, dlen_ = 11,
     $                   dtype_ = 1, ctxt_ = 2, m_ = 3, n_ = 4,
     $                   imb_ = 5, inb_ = 6, mb_ = 7, nb_ = 8,
     $                   rsrc_ = 9, csrc_ = 10, lld_ = 11 )
*     ..
*     .. Local Scalars ..
      INTEGER            LLDMIN, MP, MYCOL, MYROW, NPCOL, NPROW
*     ..
*     .. External Subroutines ..
      EXTERNAL           BLACS_GRIDINFO, PXERBLA
*     ..
*     .. External Functions ..
      INTEGER            PB_NUMROC
      EXTERNAL           PB_NUMROC
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Get grid parameters
*
      CALL blacs_gridinfo( ctxt, nprow, npcol, myrow, mycol )
*
*     Validate the arguments; only the first failure is recorded.
*     The NPROW = -1 test must precede the RSRC test:  with NPROW = -1
*     every RSRC satisfies RSRC < -1 or RSRC >= NPROW,  so testing RSRC
*     first would always report -8 and never reach the CTXT branch.
*
      info = 0
      IF( m.LT.0 ) THEN
         info = -2
      ELSE IF( n.LT.0 ) THEN
         info = -3
      ELSE IF( imb.LT.1 ) THEN
         info = -4
      ELSE IF( inb.LT.1 ) THEN
         info = -5
      ELSE IF( mb.LT.1 ) THEN
         info = -6
      ELSE IF( nb.LT.1 ) THEN
         info = -7
      ELSE IF( nprow.EQ.-1 ) THEN
         info = -10
      ELSE IF( rsrc.LT.-1 .OR. rsrc.GE.nprow ) THEN
         info = -8
      ELSE IF( csrc.LT.-1 .OR. csrc.GE.npcol ) THEN
         info = -9
      END IF
*
*     Compute minimum LLD if safe (to avoid division by 0).  LLDMIN
*     defaults to 1 so that DESC( LLD_ ) below never depends on an
*     undefined value when PB_NUMROC is skipped.
*
      lldmin = 1
      IF( info.EQ.0 ) THEN
         mp = pb_numroc( m, 1, imb, mb, myrow, rsrc, nprow )
         IF( pb_numroc( n, 1, inb, nb, mycol, csrc, npcol ).GT.0 )
     $      lldmin = max( 1, mp )
         IF( lld.LT.lldmin )
     $      info = -11
      END IF
*
*     Report the first illegal argument, if any
*
      IF( info.NE.0 )
     $   CALL pxerbla( ctxt, 'PB_DESCINIT2', -info )
*
*     Store the descriptor, clamping each entry to its legal range
*
      desc( dtype_ ) = block_cyclic_2d_inb
      desc( ctxt_  ) = ctxt
      desc( m_     ) = max( 0, m )
      desc( n_     ) = max( 0, n )
      desc( imb_   ) = max( 1, imb )
      desc( inb_   ) = max( 1, inb )
      desc( mb_    ) = max( 1, mb )
      desc( nb_    ) = max( 1, nb )
      desc( rsrc_  ) = max( -1, min( rsrc, nprow-1 ) )
      desc( csrc_  ) = max( -1, min( csrc, npcol-1 ) )
      desc( lld_   ) = max( lld, lldmin )
*
      RETURN
*
*     End of PB_DESCINIT2
*
      END


      SUBROUTINE pb_binfo( OFFD, M, N, IMB1, INB1, MB, NB, MRROW, MRCOL,

     $                     LCMT00, MBLKS, NBLKS, IMBLOC, INBLOC, LMBLOC,

     $                     LNBLOC, ILOW, LOW, IUPP, UPP )

*

*  -- PBLAS test routine (version 2.0) --

*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,

*     and University of California, Berkeley.

*     April 1, 1998

*

*     .. Scalar Arguments ..

      INTEGER            ILOW, IMB1, IMBLOC, INB1, INBLOC, IUPP, LCMT00,

     $                   LMBLOC, LNBLOC, LOW, M, MB, MBLKS, MRCOL,

     $                   mrrow, n, nb, nblks, offd, upp

*     ..

*

*  Purpose

*  =======

*

*  PB_BINFO   initializes the local information of an m by n local array

*  owned by the process of  relative  coordinates ( MRROW, MRCOL ). Note

*  that if m or n is less or equal than zero, there is no data, in which

*  case this process  does  not  need  the local information computed by

*  this routine to proceed.

*

*  Arguments

*  =========

*

*  OFFD    (global input) INTEGER

*          On entry,  OFFD  specifies the off-diagonal of the underlying

*          matrix of interest as follows:

*             OFFD = 0 specifies the main diagonal,

*             OFFD > 0 specifies lower subdiagonals, and

*             OFFD < 0 specifies upper superdiagonals.

*

*  M       (local input) INTEGER

*          On entry, M  specifies the local number of rows of the under-

*          lying matrix  owned  by the  process  of relative coordinates

*          ( MRROW, MRCOL ). M must be at least zero.

*

*  N       (local input) INTEGER

*          On entry, N  specifies the local number of columns of the un-

*          derlying matrix  owned by the process of relative coordinates

*          ( MRROW, MRCOL ). N must be at least zero.

*

*  IMB1    (global input) INTEGER

*          On input, IMB1 specifies  the global true size of  the  first

*          block of rows of the underlying global submatrix.  IMB1  must

*          be at least MIN( 1, M ).

*

*  INB1    (global input) INTEGER

*          On input, INB1 specifies  the global true size of  the  first

*          block  of  columns  of  the underlying global submatrix. INB1

*          must be at least MIN( 1, N ).

*

*  MB      (global input) INTEGER

*          On entry, MB  specifies the blocking factor used to partition

*          the rows of the matrix.  MB  must be at least one.

*

*  NB      (global input) INTEGER

*          On entry, NB  specifies the blocking factor used to partition

*          the columns of the matrix.  NB  must be at least one.

*

*  MRROW   (local input) INTEGER

*          On entry, MRROW specifies the  relative row coordinate of the

*          process that possesses these M rows. MRROW must be at least

*          zero and strictly less than NPROW.

*

*  MRCOL   (local input) INTEGER

*          On entry, MRCOL specifies  the  relative column coordinate of

*          the process that possesses these N columns. MRCOL must be at

*          least zero and strictly less than NPCOL.

*

*  LCMT00  (local output) INTEGER

*          On exit, LCMT00  is the  LCM value of the left upper block of

*          this m by n local  block owned by the process of relative co-

*          ordinates ( MRROW, MRCOL ).

*

*  MBLKS   (local output) INTEGER

*          On exit, MBLKS specifies the local number of blocks  of  rows

*          corresponding to M. MBLKS must be at least zero.

*

*  NBLKS   (local output) INTEGER

*          On exit,  NBLKS  specifies  the local number of blocks of co-

*          lumns corresponding to N. NBLKS must be at least zero.

*

*  IMBLOC  (local output) INTEGER

*          On exit, IMBLOC  specifies  the  number of rows (size) of the

*          uppest blocks of this m by n local array owned by the process

*          of relative coordinates ( MRROW, MRCOL ).  IMBLOC is at least

*          MIN( 1, M ).

*

*  INBLOC  (local output) INTEGER

*          On exit, INBLOC  specifies  the  number of columns (size) of

*          the leftmost  blocks of this m by n local array owned by the

*          process of relative coordinates ( MRROW, MRCOL ).  INBLOC is

*          at least MIN( 1, N ).

*

*  LMBLOC  (local output) INTEGER

*          On exit, LMBLOC specifies the number  of  rows  (size) of the

*          lowest blocks of this m by n local array owned by the process

*          of  relative coordinates ( MRROW, MRCOL ). LMBLOC is at least

*          MIN( 1, M ).

*

*  LNBLOC  (local output) INTEGER

*          On exit, LNBLOC specifies the number of columns (size) of the

*          rightmost  blocks of this  m by n  local  array  owned by the

*          process of  relative  coordinates ( MRROW, MRCOL ). LNBLOC is

*          at least MIN( 1, N ).

*

*  ILOW    (local output) INTEGER

*          On exit, ILOW is the lower bound characterizing the first co-

*          lumn block owning offdiagonals of  this  m by n  array.  ILOW

*          must be less or equal than zero.

*

*  LOW     (global output) INTEGER

*          On exit,  LOW  is  the  lower bound characterizing the column

*          blocks with the exception of the first  one (see ILOW) owning

*          offdiagonals of this m by n array. LOW  must be less or equal

*          than zero.

*

*  IUPP    (local output) INTEGER

*          On exit, IUPP is the upper bound characterizing the first row

*          block owning offdiagonals of this m by n array.  IUPP must be

*          greater or equal than zero.

*

*  UPP     (global output) INTEGER

*          On exit,  UPP  is  the  upper  bound  characterizing  the row

*          blocks with the exception of the first  one (see IUPP) owning

*          offdiagonals of this m by n array. UPP  must  be  greater  or

*          equal than zero.

*

*  -- Written on April 1, 1998 by

*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.

*

*  =====================================================================

*

*     .. Local Scalars ..

      INTEGER            TMP1

*     ..

*     .. Intrinsic Functions ..

      INTRINSIC          MAX, MIN

*     ..

*     .. Executable Statements ..

*

*     Initialize LOW, ILOW, UPP, IUPP, LMBLOC, LNBLOC, IMBLOC, INBLOC,

*     MBLKS, NBLKS and LCMT00.

*

      LOW = 1 - nb

      upp = mb - 1

*

      lcmt00 = offd

*

      IF( m.LE.0 .OR. n.LE.0 ) THEN

*

         IF( mrrow.GT.0 ) THEN

            iupp = mb - 1

         ELSE

            iupp = max( 0, imb1 - 1 )

         END IF

         imbloc = 0

         mblks  = 0

         lmbloc = 0

*

         IF( mrcol.GT.0 ) THEN

            ilow = 1 - nb

         ELSE

            ilow = min( 0, 1 - inb1 )

         END IF

         inbloc = 0

         nblks  = 0

         lnbloc = 0

*

         lcmt00 = lcmt00 + ( low - ilow + mrcol * nb ) -

     $            ( iupp - upp + mrrow * mb )

*

         RETURN

*

      END IF

*

      IF( mrrow.GT.0 ) THEN

*

         imbloc = min( m, mb )

         iupp   = mb - 1

         lcmt00 = lcmt00 - ( imb1 - mb + mrrow * mb )

         mblks  = ( m - 1 ) / mb + 1

         lmbloc = m - ( m / mb ) * mb

         IF( lmbloc.EQ.0 )

     $      lmbloc = mb

*

         IF( mrcol.GT.0 ) THEN

*

            inbloc = min( n, nb )

            ilow   = 1 - nb

            lcmt00 = lcmt00 + inb1 - nb + mrcol * nb

            nblks  = ( n - 1 ) / nb + 1

            lnbloc = n - ( n / nb ) * nb

            IF( lnbloc.EQ.0 )

     $         lnbloc = nb

*

         ELSE

*

            inbloc = inb1

            ilow   = 1 - inb1

            tmp1   = n - inb1

            IF( tmp1.GT.0 ) THEN

*

*              more than one block

*

               nblks = ( tmp1 - 1 ) / nb + 2

               lnbloc = tmp1 - ( tmp1 / nb ) * nb

               IF( lnbloc.EQ.0 )

     $            lnbloc = nb

*

            ELSE

*

               nblks  = 1

               lnbloc = inb1

*

            END IF

*

         END IF

*

      ELSE

*

         imbloc = imb1

         iupp = imb1 - 1

         tmp1 = m - imb1

         IF( tmp1.GT.0 ) THEN

*

*           more than one block

*

            mblks  = ( tmp1 - 1 ) / mb + 2

            lmbloc = tmp1 - ( tmp1 / mb ) * mb

            IF( lmbloc.EQ.0 )

     $         lmbloc = mb

*

         ELSE

*

            mblks  = 1

            lmbloc = imb1

*

         END IF

*

         IF( mrcol.GT.0 ) THEN

*

            inbloc = min( n, nb )

            ilow   = 1 - nb

            lcmt00 = lcmt00 + inb1 - nb + mrcol * nb

            nblks  = ( n - 1 ) / nb + 1

            lnbloc = n - ( n / nb ) * nb

            IF( lnbloc.EQ.0 )

     $         lnbloc = nb

*

         ELSE

*

            inbloc = inb1

            ilow   = 1 - inb1

            tmp1   = n - inb1

            IF( tmp1.GT.0 ) THEN

*

*              more than one block

*

               nblks  = ( tmp1 - 1 ) / nb + 2

               lnbloc = tmp1 - ( tmp1 / nb ) * nb

               IF( lnbloc.EQ.0 )

     $            lnbloc = nb

*

            ELSE

*

               nblks  = 1

               lnbloc = inb1

*

            END IF

*

         END IF

*

      END IF

*

      RETURN

*

*     End of PB_BINFO

*


      END


      INTEGER FUNCTION PILAENV( ICTXT, PREC )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      CHARACTER*1        PREC
      INTEGER            ICTXT
*     ..
*
*  Purpose
*  =======
*
*  PILAENV  is the version of the block size inquiry function  that  is
*  meant to be linked with the PBLAS testing and timing programs only.
*  The PBLAS routines call it to obtain their logical computational
*  block size; this version answers with the current value of NBLOG,
*  the second entry of the common block /INFOC/, so that different
*  logical block sizes can be tried. NBLOG is only read here, never
*  set, and neither argument is referenced.
*
*  Arguments
*  =========
*
*  ICTXT   (local input) INTEGER
*          On entry,  ICTXT  specifies the BLACS context handle, indica-
*          ting the global  context of the operation. The context itself
*          is global, but the value of ICTXT is local.  ICTXT is not re-
*          ferenced by this version of the function.
*
*  PREC    (dummy input) CHARACTER*1
*          On entry, PREC is a dummy argument. It is not referenced.
*
*  Return value
*  ============
*
*  PILAENV (local output) INTEGER
*          The value of NBLOG found in the common block /INFOC/ at the
*          time of the call.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Common Blocks ..
      INTEGER            INFO, NBLOG
      COMMON             /INFOC/INFO, NBLOG
*     ..
*     .. Executable Statements ..
*
*     The answer is whatever block size is currently stored in /INFOC/.
*
      PILAENV = NBLOG
*
*     End of PILAENV
*
      END


      SUBROUTINE PB_LOCINFO( I, INB, NB, MYROC, SRCPROC, NPROCS,
     $                       ILOCBLK, ILOCOFF, MYDIST )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            I, ILOCBLK, ILOCOFF, INB, MYDIST, MYROC, NB,
     $                   NPROCS, SRCPROC
*     ..
*
*  Purpose
*  =======
*
*  PB_LOCINFO  computes, for the process of coordinate MYROC, the local
*  block coordinate and the offset inside that block which correspond
*  to the global row or column index I, the beginning of a submatrix.
*  The first block of rows or columns has INB entries and every other
*  block has NB entries.
*
*  Arguments
*  =========
*
*  I       (global input) INTEGER
*          The global starting index in the matrix. I must be at least
*          one.
*
*  INB     (global input) INTEGER
*          The size of the first block of rows or columns of the ma-
*          trix. INB must be at least one.
*
*  NB      (global input) INTEGER
*          The size of the blocks the rows or columns of the matrix are
*          partitioned into. NB must be at least one.
*
*  MYROC   (local input) INTEGER
*          The coordinate of the process whose local information is
*          determined. MYROC is at least zero and strictly less than
*          NPROCS.
*
*  SRCPROC (global input) INTEGER
*          The coordinate of the process that possesses the first row
*          or column of the matrix. When SRCPROC is negative the data
*          is treated as replicated rather than distributed; otherwise
*          SRCPROC must be at least zero and strictly less than NPROCS.
*
*  NPROCS  (global input) INTEGER
*          The total number of process rows or columns over which the
*          submatrix is distributed. NPROCS must be at least one. It is
*          not referenced when SRCPROC is negative.
*
*  ILOCBLK (local output) INTEGER
*          On exit, the local row or column block coordinate corres-
*          ponding to the row or column I of the matrix.
*
*  ILOCOFF (local output) INTEGER
*          On exit, the offset of the row or column I inside its block
*          when the data is replicated or when MYROC is the process
*          holding that block, and zero otherwise.
*
*  MYDIST  (local output) INTEGER
*          On exit, zero when SRCPROC is negative. Otherwise the value
*          MYROC - SRCPROC, increased by NPROCS when that difference is
*          negative.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            IOFF, IOWN, IREM, NBLK
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MOD
*     ..
*     .. Executable Statements ..
*
      ILOCOFF = 0
*
*     Position of I in the block partitioning,  independently  of  any
*     process: NBLK is the global coordinate of the block holding I (the
*     first block has coordinate zero) and IOFF is the zero-based offset
*     of I inside that block.
*
      IF( I.GT.INB ) THEN
         IREM = I - INB
         NBLK = ( IREM - 1 ) / NB + 1
         IOFF = IREM - 1 - ( NBLK - 1 ) * NB
      ELSE
         NBLK = 0
         IOFF = I - 1
      END IF
*
      IF( SRCPROC.LT.0 ) THEN
*
*        Replicated data: local and global block coordinates coincide
*
         MYDIST  = 0
         ILOCBLK = NBLK
         ILOCOFF = IOFF
         RETURN
*
      END IF
*
*     Distributed data: distance from the source process to MYROC
*
      MYDIST = MYROC - SRCPROC
      IF( MYDIST.LT.0 )
     $   MYDIST = MYDIST + NPROCS
*
      IF( I.LE.INB ) THEN
*
*        I lies in the very first block, held by the source process
*
         IOWN    = SRCPROC
         ILOCBLK = 0
*
      ELSE
*
*        IOWN is the process holding block NBLK, counting cyclically
*        from SRCPROC.
*
         IOWN    = MOD( SRCPROC + NBLK, NPROCS )
         ILOCBLK = NBLK / NPROCS
*
*        NOTE(review): for inputs in their documented ranges this test
*        can only succeed when ILOCBLK is zero and  MYDIST  is greater
*        than NBLK - confirm that this is the intended criterion.
*
         IF( ( ILOCBLK*NPROCS ).LT.( MYDIST-NBLK ) )
     $      ILOCBLK = ILOCBLK + 1
*
      END IF
*
*     Only the process holding the block of I gets a non-zero offset
*
      IF( MYROC.EQ.IOWN )
     $   ILOCOFF = IOFF
*
      RETURN
*
*     End of PB_LOCINFO
*
      END


      SUBROUTINE PB_INITJMP( COLMAJ, NVIR, IMBVIR, INBVIR, IMBLOC,
     $                       INBLOC, MB, NB, RSRC, CSRC, NPROW, NPCOL,
     $                       STRIDE, JMP )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      LOGICAL            COLMAJ
      INTEGER            CSRC, IMBLOC, IMBVIR, INBLOC, INBVIR, MB, NB,
     $                   NPCOL, NPROW, NVIR, RSRC, STRIDE
*     ..
*     .. Array Arguments ..
      INTEGER            JMP( * )
*     ..
*
*  Purpose
*  =======
*
*  PB_INITJMP  fills the array JMP with the jump values  (numbers  of
*  entries of the random sequence to skip)  that the random matrix ge-
*  nerator uses. On exit the entries of JMP are
*
*     JMP( JMP_1        ) = 1
*     JMP( JMP_ROW      ) = STRIDE        if COLMAJ, else STRIDE * NVIR
*     JMP( JMP_COL      ) = STRIDE * NVIR if COLMAJ, else STRIDE
*     JMP( JMP_MB       ) = MB
*     JMP( JMP_IMBV     ) = IMBVIR
*     JMP( JMP_NPMB     ) = MB if RSRC < 0, else NPROW * MB
*     JMP( JMP_NPIMBLOC ) = IMBLOC + JMP( JMP_NPMB ) - MB
*     JMP( JMP_NB       ) = NB
*     JMP( JMP_INBV     ) = INBVIR
*     JMP( JMP_NQNB     ) = NB if CSRC < 0, else NPCOL * NB
*     JMP( JMP_NQINBLOC ) = INBLOC + JMP( JMP_NQNB ) - NB
*
*  Arguments
*  =========
*
*  COLMAJ  (global input) LOGICAL
*          Ordering of the random sequence. When COLMAJ is .TRUE., the
*          sequence is used for a column-major ordering, and otherwise
*          for a row-major ordering. This decides which of the row and
*          column jumps is multiplied by NVIR.
*
*  NVIR    (global input) INTEGER
*          The size of the underlying virtual matrix. NVIR must be at
*          least zero.
*
*  IMBVIR  (local input) INTEGER
*          The number of virtual rows of the upper left block of the
*          underlying virtual submatrix. IMBVIR must be at least
*          IMBLOC.
*
*  INBVIR  (local input) INTEGER
*          The number of virtual columns of the upper left block of the
*          underlying virtual submatrix. INBVIR must be at least
*          INBLOC.
*
*  IMBLOC  (local input) INTEGER
*          The number of rows (size) of the local uppest blocks. IMBLOC
*          is at least zero.
*
*  INBLOC  (local input) INTEGER
*          The number of columns (size) of the local leftmost blocks.
*          INBLOC is at least zero.
*
*  MB      (global input) INTEGER
*          The size of the blocks used to partition the matrix rows.
*          MB must be at least one.
*
*  NB      (global input) INTEGER
*          The size of the blocks used to partition the matrix columns.
*          NB must be at least one.
*
*  RSRC    (global input) INTEGER
*          The row coordinate of the process that possesses the first
*          row of the matrix. A negative value (RSRC = -1) means that
*          the rows are replicated rather than distributed; otherwise
*          RSRC must be at least zero and strictly less than NPROW.
*
*  CSRC    (global input) INTEGER
*          The column coordinate of the process that possesses the
*          first column of the matrix. A negative value (CSRC = -1)
*          means that the columns are replicated rather than distribu-
*          ted; otherwise CSRC must be at least zero and strictly less
*          than NPCOL.
*
*  NPROW   (global input) INTEGER
*          The total number of process rows over which the matrix is
*          distributed. NPROW must be at least one.
*
*  NPCOL   (global input) INTEGER
*          The total number of process columns over which the matrix
*          is distributed. NPCOL must be at least one.
*
*  STRIDE  (global input) INTEGER
*          The number of random numbers to be generated to compute one
*          matrix entry. In the real case STRIDE is usually 1, whereas
*          in the complex case STRIDE is usually 2 in order to generate
*          the real and imaginary parts.
*
*  JMP     (local output) INTEGER array
*          On entry, JMP is an array of dimension JMP_LEN. On exit, it
*          contains the jump values listed above.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            JMP_1, JMP_COL, JMP_IMBV, JMP_INBV, JMP_LEN,
     $                   JMP_MB, JMP_NB, JMP_NPIMBLOC, JMP_NPMB,
     $                   JMP_NQINBLOC, JMP_NQNB, JMP_ROW
      PARAMETER          ( JMP_1 = 1, JMP_ROW = 2, JMP_COL = 3 )
      PARAMETER          ( JMP_MB = 4, JMP_IMBV = 5, JMP_NPMB = 6,
     $                   JMP_NPIMBLOC = 7 )
      PARAMETER          ( JMP_NB = 8, JMP_INBV = 9, JMP_NQNB = 10,
     $                   JMP_NQINBLOC = 11 )
      PARAMETER          ( JMP_LEN = 11 )
*     ..
*     .. Local Scalars ..
      INTEGER            NPMB, NQNB
*     ..
*     .. Executable Statements ..
*
*     Start from the replicated values and scale them by the number of
*     process rows (resp. columns) when the dimension is distributed.
*
      NPMB = MB
      IF( RSRC.GE.0 )
     $   NPMB = NPROW * MB
*
      NQNB = NB
      IF( CSRC.GE.0 )
     $   NQNB = NPCOL * NB
*
*     Unit jump
*
      JMP( JMP_1 ) = 1
*
*     Elementary row and column jumps: the dimension that does not vary
*     fastest in the chosen ordering has its jump multiplied by NVIR.
*
      JMP( JMP_ROW ) = STRIDE
      JMP( JMP_COL ) = STRIDE
      IF( COLMAJ ) THEN
         JMP( JMP_COL ) = STRIDE * NVIR
      ELSE
         JMP( JMP_ROW ) = STRIDE * NVIR
      END IF
*
*     Row block jumps
*
      JMP( JMP_MB       ) = MB
      JMP( JMP_IMBV     ) = IMBVIR
      JMP( JMP_NPMB     ) = NPMB
      JMP( JMP_NPIMBLOC ) = IMBLOC + NPMB - MB
*
*     Column block jumps
*
      JMP( JMP_NB       ) = NB
      JMP( JMP_INBV     ) = INBVIR
      JMP( JMP_NQNB     ) = NQNB
      JMP( JMP_NQINBLOC ) = INBLOC + NQNB - NB
*
      RETURN
*
*     End of PB_INITJMP
*
      END


      SUBROUTINE PB_INITMULADD( MULADD0, JMP, IMULADD )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Array Arguments ..
      INTEGER            IMULADD( 4, * ), JMP( * ), MULADD0( * )
*     ..
*
*  Purpose
*  =======
*
*  PB_INITMULADD  builds, for every jump value stored in JMP, the en-
*  coded constants a and c that the matrix generator needs to perform
*  that jump in the random sequence. All constants are obtained from
*  PB_JUMP:
*
*  - the unit, row and column jumps are derived from the initial cons-
*    tants MULADD0;
*  - the four row block jumps  (JMP_IMBV, JMP_MB, JMP_NPMB and
*    JMP_NPIMBLOC) are derived from the row jump constants;
*  - the four column block jumps  (JMP_INBV, JMP_NB, JMP_NQNB and
*    JMP_NQINBLOC) are derived from the column jump constants.
*
*  Arguments
*  =========
*
*  MULADD0 (local input) INTEGER array
*          On entry, MULADD0 is an array of dimension 4 containing the
*          encoded initial constants a and c to jump from X( n ) to
*          X( n+1 ) = a*X( n ) + c in the random sequence. MULADD0(1:2)
*          holds the lower and higher parts of the constant a, and
*          MULADD0(3:4) the lower and higher parts of the constant c.
*
*  JMP     (local input) INTEGER array
*          On entry, JMP is an array of dimension JMP_LEN containing
*          the different jump values used by the matrix generator.
*
*  IMULADD (local output) INTEGER array
*          On entry, IMULADD is an array of dimension ( 4, JMP_LEN ).
*          On exit, the jth column of this array contains the encoded
*          constants a_j and c_j to jump from X( n ) to X( n+JMP( j ) )
*          (= a_j*X( n ) + c_j) in the random sequence. IMULADD(1:2,j)
*          holds the lower and higher parts of a_j, and IMULADD(3:4,j)
*          the lower and higher parts of c_j.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            JMP_1, JMP_COL, JMP_IMBV, JMP_INBV, JMP_LEN,
     $                   JMP_MB, JMP_NB, JMP_NPIMBLOC, JMP_NPMB,
     $                   JMP_NQINBLOC, JMP_NQNB, JMP_ROW
      PARAMETER          ( JMP_1 = 1, JMP_ROW = 2, JMP_COL = 3 )
      PARAMETER          ( JMP_MB = 4, JMP_IMBV = 5, JMP_NPMB = 6,
     $                   JMP_NPIMBLOC = 7 )
      PARAMETER          ( JMP_NB = 8, JMP_INBV = 9, JMP_NQNB = 10,
     $                   JMP_NQINBLOC = 11 )
      PARAMETER          ( JMP_LEN = 11 )
*     ..
*     .. Local Scalars ..
      INTEGER            L
*     ..
*     .. Local Arrays ..
      INTEGER            ICOLJ( 4 ), IROWJ( 4 ), IWRK1( 2 ), IWRK2( 2 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           PB_JUMP
*     ..
*     .. Data statements ..
*
*     Jump indexes derived from the row jump and from the column jump,
*     listed in the order in which they are processed.
*
      DATA               IROWJ / JMP_IMBV, JMP_MB, JMP_NPMB,
     $                   JMP_NPIMBLOC /
      DATA               ICOLJ / JMP_INBV, JMP_NB, JMP_NQNB,
     $                   JMP_NQINBLOC /
*     ..
*     .. Executable Statements ..
*
*     PB_JUMP also advances an entry of the sequence. This routine only
*     keeps the constants it returns; the entries go to the scratch ar-
*     rays IWRK1 and IWRK2, the first one being started from (100, 0).
*
      IWRK2( 1 ) = 100
      IWRK2( 2 ) = 0
*
*     Unit, row and column jumps, from the initial constants
*
      CALL PB_JUMP( JMP( JMP_1 ), MULADD0, IWRK2, IWRK1,
     $              IMULADD( 1, JMP_1 ) )
*
      CALL PB_JUMP( JMP( JMP_ROW ), MULADD0, IWRK1, IWRK2,
     $              IMULADD( 1, JMP_ROW ) )
      CALL PB_JUMP( JMP( JMP_COL ), MULADD0, IWRK1, IWRK2,
     $              IMULADD( 1, JMP_COL ) )
*
*     Row block jumps, expressed as repeated row jumps
*
      DO 10 L = 1, 4
         CALL PB_JUMP( JMP( IROWJ( L ) ), IMULADD( 1, JMP_ROW ),
     $                 IWRK1, IWRK2, IMULADD( 1, IROWJ( L ) ) )
   10 CONTINUE
*
*     Column block jumps, expressed as repeated column jumps
*
      DO 20 L = 1, 4
         CALL PB_JUMP( JMP( ICOLJ( L ) ), IMULADD( 1, JMP_COL ),
     $                 IWRK1, IWRK2, IMULADD( 1, ICOLJ( L ) ) )
   20 CONTINUE
*
      RETURN
*
*     End of PB_INITMULADD
*
      END


      SUBROUTINE PB_SETLOCRAN( SEED, ILOCBLK, JLOCBLK, ILOCOFF, JLOCOFF,
     $                         MYRDIST, MYCDIST, NPROW, NPCOL, JMP,
     $                         IMULADD, IRAN )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            ILOCBLK, ILOCOFF, JLOCBLK, JLOCOFF, MYCDIST,
     $                   MYRDIST, NPCOL, NPROW, SEED
*     ..
*     .. Array Arguments ..
      INTEGER            IMULADD( 4, * ), IRAN( * ), JMP( * )
*     ..
*
*  Purpose
*  =======
*
*  PB_SETLOCRAN  locally initializes the random number generator. Star-
*  ting from SEED, it advances the random sequence by a succession of
*  PB_JUMP calls, first along the rows and then along the columns, and
*  passes the entry reached together with the unit jump constants to
*  PB_SETRAN.
*
*  Arguments
*  =========
*
*  SEED    (global input) INTEGER
*          A positive integer used to initialize the first number in
*          the random sequence used by the matrix generator. SEED must
*          be at least zero.
*
*  ILOCBLK (local input) INTEGER
*          The local row block coordinate corresponding to the first
*          row of the submatrix of interest. ILOCBLK must be at least
*          zero.
*
*  JLOCBLK (local input) INTEGER
*          The local column block coordinate corresponding to the first
*          column of the submatrix of interest. JLOCBLK must be at
*          least zero.
*
*  ILOCOFF (local input) INTEGER
*          The local row offset in the block of local coordinate
*          ILOCBLK corresponding to the first row of the submatrix of
*          interest. ILOCOFF must be at least zero.
*
*  JLOCOFF (local input) INTEGER
*          The local column offset in the block of local coordinate
*          JLOCBLK corresponding to the first column of the submatrix
*          of interest. JLOCOFF must be at least zero.
*
*  MYRDIST (local input) INTEGER
*          The relative row process coordinate to the process owning
*          the first row of the submatrix of interest. MYRDIST must be
*          at least zero and strictly less than NPROW (see the subrou-
*          tine PB_LOCINFO).
*
*  MYCDIST (local input) INTEGER
*          The relative column process coordinate to the process owning
*          the first column of the submatrix of interest. MYCDIST must
*          be at least zero and strictly less than NPCOL (see the sub-
*          routine PB_LOCINFO).
*
*  NPROW   (global input) INTEGER
*          The total number of process rows over which the matrix is
*          distributed. NPROW must be at least one.
*
*  NPCOL   (global input) INTEGER
*          The total number of process columns over which the matrix
*          is distributed. NPCOL must be at least one.
*
*  JMP     (local input) INTEGER array
*          On entry, JMP is an array of dimension JMP_LEN containing
*          the different jump values used by the matrix generator.
*
*  IMULADD (local input) INTEGER array
*          On entry, IMULADD is an array of dimension (4, JMP_LEN). The
*          jth column of this array contains the encoded constants a_j
*          and c_j to jump from X( n ) to X( n + JMP( j ) )
*          (= a_j * X( n ) + c_j) in the random sequence. IMULADD(1:2,j)
*          holds the lower and higher parts of a_j, and IMULADD(3:4,j)
*          the lower and higher parts of c_j.
*
*  IRAN    (local output) INTEGER array
*          On entry, IRAN is an array of dimension 2. On exit, IRAN
*          contains the two-integer encoding (lower part first, higher
*          part second) of the entry of the random sequence correspon-
*          ding locally to the first local array entry to generate.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            JMP_1, JMP_COL, JMP_IMBV, JMP_INBV, JMP_LEN,
     $                   JMP_MB, JMP_NB, JMP_NPIMBLOC, JMP_NPMB,
     $                   JMP_NQINBLOC, JMP_NQNB, JMP_ROW
      PARAMETER          ( JMP_1 = 1, JMP_ROW = 2, JMP_COL = 3 )
      PARAMETER          ( JMP_MB = 4, JMP_IMBV = 5, JMP_NPMB = 6,
     $                   JMP_NPIMBLOC = 7 )
      PARAMETER          ( JMP_NB = 8, JMP_INBV = 9, JMP_NQNB = 10,
     $                   JMP_NQINBLOC = 11 )
      PARAMETER          ( JMP_LEN = 11 )
*     ..
*     .. Local Arrays ..
      INTEGER            IMAWRK( 4 ), IWRK( 2 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           PB_JUMP, PB_SETRAN
*     ..
*     .. Executable Statements ..
*
*     The current entry of the sequence is passed back and forth bet-
*     ween IWRK and IRAN: every PB_JUMP call reads it from one of them
*     and writes the entry it reaches into the other. The constants
*     returned in IMAWRK are never used. Each branch below is arranged
*     so that the entry ends up in IRAN.
*
      IWRK( 1 ) = SEED
      IWRK( 2 ) = 0
*
*     Unit jump from the seed
*
      CALL PB_JUMP( JMP( JMP_1 ), IMULADD( 1, JMP_1 ), IWRK, IRAN,
     $              IMAWRK )
*
*     Jump ILOCBLK blocks of rows + ILOCOFF rows
*
      CALL PB_JUMP( ILOCOFF, IMULADD( 1, JMP_ROW ), IRAN, IWRK,
     $              IMAWRK )
*
      IF( MYRDIST.GT.0 ) THEN
*
         CALL PB_JUMP( JMP( JMP_IMBV ), IMULADD( 1, JMP_ROW ), IWRK,
     $                 IRAN, IMAWRK )
         CALL PB_JUMP( MYRDIST - 1, IMULADD( 1, JMP_MB ), IRAN,
     $                 IWRK, IMAWRK )
         CALL PB_JUMP( ILOCBLK, IMULADD( 1, JMP_NPMB ), IWRK,
     $                 IRAN, IMAWRK )
*
      ELSE IF( ILOCBLK.GT.0 ) THEN
*
         CALL PB_JUMP( JMP( JMP_IMBV ), IMULADD( 1, JMP_ROW ), IWRK,
     $                 IRAN, IMAWRK )
         CALL PB_JUMP( NPROW - 1, IMULADD( 1, JMP_MB ), IRAN,
     $                 IWRK, IMAWRK )
         CALL PB_JUMP( ILOCBLK - 1, IMULADD( 1, JMP_NPMB ), IWRK,
     $                 IRAN, IMAWRK )
*
      ELSE
*
*        Nothing more to skip: a jump of size zero copies IWRK to IRAN
*
         CALL PB_JUMP( 0, IMULADD( 1, JMP_1 ), IWRK, IRAN, IMAWRK )
*
      END IF
*
*     Jump JLOCBLK blocks of columns + JLOCOFF columns
*
      CALL PB_JUMP( JLOCOFF, IMULADD( 1, JMP_COL ), IRAN, IWRK,
     $              IMAWRK )
*
      IF( MYCDIST.GT.0 ) THEN
*
         CALL PB_JUMP( JMP( JMP_INBV ), IMULADD( 1, JMP_COL ), IWRK,
     $                 IRAN, IMAWRK )
         CALL PB_JUMP( MYCDIST - 1, IMULADD( 1, JMP_NB ), IRAN,
     $                 IWRK, IMAWRK )
         CALL PB_JUMP( JLOCBLK, IMULADD( 1, JMP_NQNB ), IWRK,
     $                 IRAN, IMAWRK )
*
      ELSE IF( JLOCBLK.GT.0 ) THEN
*
         CALL PB_JUMP( JMP( JMP_INBV ), IMULADD( 1, JMP_COL ), IWRK,
     $                 IRAN, IMAWRK )
         CALL PB_JUMP( NPCOL - 1, IMULADD( 1, JMP_NB ), IRAN,
     $                 IWRK, IMAWRK )
         CALL PB_JUMP( JLOCBLK - 1, IMULADD( 1, JMP_NQNB ), IWRK,
     $                 IRAN, IMAWRK )
*
      ELSE
*
*        Nothing more to skip: a jump of size zero copies IWRK to IRAN
*
         CALL PB_JUMP( 0, IMULADD( 1, JMP_1 ), IWRK, IRAN, IMAWRK )
*
      END IF
*
*     Hand the entry reached and the unit jump constants to PB_SETRAN
*
      CALL PB_SETRAN( IRAN, IMULADD( 1, JMP_1 ) )
*
      RETURN
*
*     End of PB_SETLOCRAN
*
      END


      SUBROUTINE PB_LADD( J, K, I )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Array Arguments ..
      INTEGER            I( 2 ), J( 2 ), K( 2 )
*     ..
*
*  Purpose
*  =======
*
*  PB_LADD  adds the two long positive integers K and J and puts the
*  result into I. The long integers I, J, K are encoded on 31 bits u-
*  sing an array of 2 integers: the 16 lower bits are stored in the
*  first entry of each array, the 15 higher bits in the second entry.
*  The carry out of the lower part is added to the higher part; what-
*  ever exceeds the 15 bits of the higher part is dropped.
*
*  Arguments
*  =========
*
*  J       (local input) INTEGER array
*          On entry, J is an array of dimension 2 containing the enco-
*          ded long integer J.
*
*  K       (local input) INTEGER array
*          On entry, K is an array of dimension 2 containing the enco-
*          ded long integer K.
*
*  I       (local output) INTEGER array
*          On entry, I is an array of dimension 2. On exit, this array
*          contains the encoded long integer I.
*
*  Further Details
*  ===============
*
*            K( 2 )   K( 1 )
*          0XXXXXXX XXXXXXXX  K   I( 1 ) = MOD( K( 1 ) + J( 1 ), 2**16 )
*        +                        carry  = ( K( 1 ) + J( 1 ) ) / 2**16
*            J( 2 )   J( 1 )
*          0XXXXXXX XXXXXXXX  J   I( 2 ) = K( 2 ) + J( 2 ) + carry
*        ----------------------   I( 2 ) = MOD( I( 2 ), 2**15 )
*            I( 2 )   I( 1 )
*          0XXXXXXX XXXXXXXX  I
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            IPOW15, IPOW16
      PARAMETER          ( IPOW15 = 2**15, IPOW16 = 2**16 )
*     ..
*     .. Local Scalars ..
      INTEGER            ICARRY, ISUM
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MOD
*     ..
*     .. Executable Statements ..
*
*     Lower part: keep 16 bits of the sum, remember what overflows them
*
      ISUM   = K( 1 ) + J( 1 )
      ICARRY = ISUM / IPOW16
      I( 1 ) = MOD( ISUM, IPOW16 )
*
*     Higher part: add the carry and keep 15 bits
*
      ISUM   = ICARRY + K( 2 ) + J( 2 )
      I( 2 ) = MOD( ISUM, IPOW15 )
*
      RETURN
*
*     End of PB_LADD
*
      END


      SUBROUTINE pb_lmul( K, J, I )

*

*  -- PBLAS test routine (version 2.0) --

*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,

*     and University of California, Berkeley.

*     April 1, 1998

*

*     .. Array Arguments ..

      INTEGER            I( 2 ), J( 2 ), K( 2 )

*     ..

*

*  Purpose

*  =======

*

*  PB_LMUL  multiplies  the two long positive integers  K and J  and puts

*  the result into I.  The long integers  I, J, K  are encoded on 31 bits

*  using an array of 2 integers.  The 16-lower bits  are  stored  in  the

*  first entry of each array, the 15-higher bits in the second entry.

*  Only the parts of the product that fit this encoding are kept: I( 1 )

*  receives 16 bits of K( 1 )*J( 1 ),  I( 2 )  receives 15 bits  of  the

*  cross terms plus the carry, and the term K( 2 )*J( 2 ) is never formed.

*  For efficiency purposes, the intrinsic modulo function is inlined.

*

*  Arguments

*  =========

*

*  K       (local input) INTEGER array

*          On entry, K is an array of dimension 2 containing the encoded

*          long integer K.

*

*  J       (local input) INTEGER array

*          On entry, J is an array of dimension 2 containing the encoded

*          long integer J.

*

*  I       (local output) INTEGER array

*          On entry, I is an array of dimension 2. On exit,  this  array

*          contains the encoded long integer I.

*

*  Further Details

*  ===============

*

*            K( 2 )   K( 1 )

*          0XXXXXXX XXXXXXXX  K   I( 1 ) = MOD( K( 1 ) * J( 1 ), 2**16 )

*        *                        carry  = ( K( 1 ) * J( 1 ) ) / 2**16

*            J( 2 )   J( 1 )

*          0XXXXXXX XXXXXXXX  J   I( 2 ) = K(1)*J(2) + K(2)*J(1) + carry

*        ----------------------   I( 2 ) = MOD( I( 2 ), 2**15 )

*            I( 2 )   I( 1 )

*          0XXXXXXX XXXXXXXX  I

*

*  Every intermediate value that comes out negative is increased by

*  2**31 before it is used (see the comments in the code below).

*

*  -- Written on April 1, 1998 by

*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.

*

*  =====================================================================

*

*     .. Parameters ..

      INTEGER            IPOW15, IPOW16, IPOW30

      PARAMETER          ( IPOW15 = 2**15, ipow16 = 2**16,

     $                   ipow30 = 2**30 )

*     ..

*     .. Local Scalars ..

      INTEGER            ITMP1, ITMP2

*     ..

*     .. Executable Statements ..

*

*     Product of the lower parts. K and J are documented as positive, so

*     a negative value can only come from exceeding the INTEGER range;

*     2**30 is then added twice, i.e. 2**31 is added without ever wri-

*     ting 2**31 as a constant.

*     NOTE(review): this presumably relies on 32-bit INTEGER arithmetic

*     wrapping around on overflow - confirm for the target compiler.

*

      ITMP1 = k( 1 ) * j( 1 )

      IF( itmp1.LT.0 )

     $   itmp1 = ( itmp1 + ipow30 ) + ipow30

*

*     I( 1 ) = MOD( ITMP1, IPOW16 ), ITMP2 keeps the carry ITMP1/IPOW16

*

      itmp2 = itmp1 / ipow16

      i( 1 ) = itmp1 - itmp2 * ipow16

*

*     Sum of the cross terms, with the same correction when negative

*

      itmp1 = k( 1 ) * j( 2 ) + k( 2 ) * j( 1 )

      IF( itmp1.LT.0 )

     $   itmp1 = ( itmp1 + ipow30 ) + ipow30

*

*     Add the carry of the lower part, and correct once more

*

      itmp1 = itmp2 + itmp1

      IF( itmp1.LT.0 )

     $   itmp1 = ( itmp1 + ipow30 ) + ipow30

*

*     I( 2 ) = MOD( ITMP1, IPOW15 )

*

      i( 2 ) = itmp1 - ( itmp1 / ipow15 ) * ipow15

*

      RETURN

*

*     End of PB_LMUL

*


      END


      SUBROUTINE pb_jump( K, MULADD, IRANN, IRANM, IMA )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Scalar Arguments ..
      INTEGER            K
*     ..
*     .. Array Arguments ..
      INTEGER            IMA( 4 ), IRANM( 2 ), IRANN( 2 ), MULADD( 4 )
*     ..
*
*  Purpose
*  =======
*
*  PB_JUMP  builds the constants A and C that advance the random sequ-
*  ence by K entries in a single step,
*
*     X( n+K ) = A * X( n ) + C,
*
*  and applies them to the entry X( n ) encoded in IRANN.  The constants
*  a and c encoded in MULADD describe the jump from one entry of the se-
*  quence to the next one.
*
*  Arguments
*  =========
*
*  K       (local input) INTEGER
*          On entry, K specifies the number of entries  of  the sequence
*          to jump over.  When  K  is less than or equal to zero,  A and
*          C are not computed, and IRANM is set to IRANN,  which corres-
*          ponds to a jump of size zero.
*
*  MULADD  (local input) INTEGER array
*          On entry,  MULADD  is an  array of dimension 4 containing the
*          encoded constants a and c used to go from X( n ) to  X( n+1 )
*          ( = a*X( n )+c ).  MULADD(1:2) holds the 16-lower and the 16-
*          higher bits of a, MULADD(3:4) holds the 16-lower and the  16-
*          higher bits of c.
*
*  IRANN   (local input) INTEGER array
*          On entry,  IRANN  is an array of dimension 2  containing  the
*          16-lower and 16-higher bits of the encoding of X( n ).
*
*  IRANM   (local output) INTEGER array
*          On entry,  IRANM  is an  array of dimension 2.  On exit, this
*          array contains the 16-lower and 16-higher bits of the  enco-
*          ding of X( n+K ).
*
*  IMA     (local output) INTEGER array
*          On entry, IMA is an array of dimension 4.  On exit,  when  K
*          is greater than zero,  IMA(1:2) contains  the  16-lower  and
*          16-higher bits of A and IMA(3:4) contains the  16-lower  and
*          16-higher bits of C.  When K is less than or equal to  zero,
*          this array is not referenced.
*
*  Notes
*  =====
*
*  The constants are obtained by  K-1  successive compositions with the
*  one-step constants, so the cost of this routine grows linearly  with
*  K.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            IDX, ISTEP
*     ..
*     .. Local Arrays ..
      INTEGER            ITMP( 2 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           PB_LADD, PB_LMUL
*     ..
*     .. Executable Statements ..
*
*     Jump of size zero: X( n+K ) is X( n ) and IMA is left untouched.
*
      IF( K.LE.0 ) THEN
         IRANM( 1 ) = IRANN( 1 )
         IRANM( 2 ) = IRANN( 2 )
         RETURN
      END IF
*
*     Start from the one-step constants: ( A, C ) = ( a, c ).
*
      DO 10 IDX = 1, 4
         IMA( IDX ) = MULADD( IDX )
   10 CONTINUE
*
*     Compose with the one-step constants K-1 more times. Each pass
*     performs  A <- A * a  followed by  C <- c + C * a.
*
      DO 20 ISTEP = 2, K
*
         CALL PB_LMUL( IMA, MULADD, ITMP )
         IMA( 1 ) = ITMP( 1 )
         IMA( 2 ) = ITMP( 2 )
*
         CALL PB_LMUL( IMA( 3 ), MULADD, ITMP )
         CALL PB_LADD( MULADD( 3 ), ITMP, IMA( 3 ) )
*
   20 CONTINUE
*
*     X( n+K ) = A * X( n ) + C
*
      CALL PB_LMUL( IRANN, IMA, ITMP )
      CALL PB_LADD( ITMP, IMA( 3 ), IRANM )
*
      RETURN
*
*     End of PB_JUMP
*
      END


      SUBROUTINE pb_setran( IRAN, IAC )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Array Arguments ..
      INTEGER            IAC( 4 ), IRAN( 2 )
*     ..
*
*  Purpose
*  =======
*
*  PB_SETRAN  records the state of the random generator:  the  encoding
*  of the first number  X( 1 )  of the sequence and the constants a and
*  c used to compute the next element of the sequence:
*
*     X( n+1 ) = a * X( n ) + c.
*
*  These values are copied into the common block  RANCOM  ( X( 1 ) into
*  IRAND, a and c into IACS )  for later use  (see the routines PB_SRAN
*  or PB_DRAN).
*
*  Arguments
*  =========
*
*  IRAN    (local input) INTEGER array
*          On entry,  IRAN  is an array of dimension 2  containing  the
*          16-lower and 16-higher bits of the encoding of X( 1 ).
*
*  IAC     (local input) INTEGER array
*          On entry,  IAC  is an array of dimension 4.  IAC(1:2) contain
*          the 16-lower and 16-higher bits  of the constant a, IAC(3:4)
*          contain the 16-lower and 16-higher bits of the constant c.
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            IDX
*     ..
*     .. Common Blocks ..
      INTEGER            IACS( 4 ), IRAND( 2 )
      COMMON             /RANCOM/ IRAND, IACS
*     ..
*     .. Save Statements ..
      SAVE               /RANCOM/
*     ..
*     .. Executable Statements ..
*
*     Current entry of the sequence
*
      DO 10 IDX = 1, 2
         IRAND( IDX ) = IRAN( IDX )
   10 CONTINUE
*
*     Multiplier a and increment c
*
      DO 20 IDX = 1, 4
         IACS( IDX ) = IAC( IDX )
   20 CONTINUE
*
      RETURN
*
*     End of PB_SETRAN
*
      END


      SUBROUTINE pb_jumpit( MULADD, IRANN, IRANM )
*
*  -- PBLAS test routine (version 2.0) --
*     University of Tennessee, Knoxville, Oak Ridge National Laboratory,
*     and University of California, Berkeley.
*     April 1, 1998
*
*     .. Array Arguments ..
      INTEGER            IRANM( 2 ), IRANN( 2 ), MULADD( 4 )
*     ..
*
*  Purpose
*  =======
*
*  PB_JUMPIT  moves in the random sequence from the number  X( n )  en-
*  coded in IRANN to the number X( m ) encoded in IRANM, using the con-
*  stants A and C encoded in MULADD:
*
*     X( m ) = A * X( n ) + C.
*
*  The constants A and C depend on m and n; see the subroutine  PB_JUMP
*  in order to set them up.
*
*  In addition to returning  X( m )  in  IRANM,  this routine stores its
*  encoding in the array IRAND of the common block RANCOM.
*
*  Arguments
*  =========
*
*  MULADD  (local input) INTEGER array
*          On entry, MULADD is an array of dimension 4. MULADD(1:2) con-
*          tains the 16-lower and 16-higher bits of the constant A, and
*          MULADD(3:4) contains the 16-lower and 16-higher bits of  the
*          constant C.
*
*  IRANN   (local input) INTEGER array
*          On entry,  IRANN  is an array of dimension 2  containing  the
*          16-lower and 16-higher bits of the encoding of X( n ).
*
*  IRANM   (local output) INTEGER array
*          On entry,  IRANM  is an  array of dimension 2.  On exit, this
*          array contains the 16-lower and 16-higher bits of the  enco-
*          ding of X( m ).
*
*  -- Written on April 1, 1998 by
*     Antoine Petitet, University  of  Tennessee, Knoxville 37996, USA.
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            IDX
*     ..
*     .. Local Arrays ..
      INTEGER            IPROD( 2 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           PB_LADD, PB_LMUL
*     ..
*     .. Common Blocks ..
      INTEGER            IACS( 4 ), IRAND( 2 )
      COMMON             /RANCOM/ IRAND, IACS
*     ..
*     .. Save Statements ..
      SAVE               /RANCOM/
*     ..
*     .. Executable Statements ..
*
*     IPROD = A * X( n ), then IRANM = IPROD + C
*
      CALL PB_LMUL( IRANN, MULADD, IPROD )
      CALL PB_LADD( IPROD, MULADD( 3 ), IRANM )
*
*     Keep the new entry as the current state in RANCOM
*
      DO 10 IDX = 1, 2
         IRAND( IDX ) = IRANM( IDX )
   10 CONTINUE
*
      RETURN
*
*     End of PB_JUMPIT
*
      END

pb_combine
subroutine pb_combine(ictxt, scope, op, tmtype, n, ibeg, times)
Definition pblastim.f:3211

pb_boot
subroutine pb_boot()
Definition pblastim.f:2927

pb_enable
subroutine pb_enable()
Definition pblastim.f:3054

pdopbl2
double precision function pdopbl2(subnam, m, n, kkl, kku)
Definition pblastim.f:1084

pb_inquire
double precision function pb_inquire(tmtype, i)
Definition pblastim.f:3129

pdopbl3
double precision function pdopbl3(subnam, m, n, k)
Definition pblastim.f:1313

pb_timer
subroutine pb_timer(i)
Definition pblastim.f:2976

pb_disable
subroutine pb_disable()
Definition pblastim.f:3092

pb_ainfog2l
subroutine pb_ainfog2l(m, n, i, j, desc, nprow, npcol, myrow, mycol, imb1, inb1, mp, nq, ii, jj, prow, pcol, rprow, rpcol)
Definition pblastst.f:2023

pmdimchk
subroutine pmdimchk(ictxt, nout, m, n, matrix, ia, ja, desca, info)
Definition pblastst.f:202

pvdimchk
subroutine pvdimchk(ictxt, nout, n, matrix, ix, jx, descx, incx, info)
Definition pblastst.f:3

icopy
subroutine icopy(n, sx, incx, sy, incy)
Definition pblastst.f:1525

pb_descset2
subroutine pb_descset2(desc, m, n, imb, inb, mb, nb, rsrc, csrc, ctxt, lld)
Definition pblastst.f:3172

pmdescchk
subroutine pmdescchk(ictxt, nout, matrix, desca, dta, ma, na, imba, inba, mba, nba, rsrca, csrca, mpa, nqa, iprea, imida, iposta, igap, gapmul, info)
Definition pblastst.f:746

pb_ladd
subroutine pb_ladd(j, k, i)
Definition pblastst.f:4480

pb_binfo
subroutine pb_binfo(offd, m, n, imb1, inb1, mb, nb, mrrow, mrcol, lcmt00, mblks, nblks, imbloc, inbloc, lmbloc, lnbloc, ilow, low, iupp, upp)
Definition pblastst.f:3577

pb_setran
subroutine pb_setran(iran, iac)
Definition pblastst.f:4759

pb_infog2l
subroutine pb_infog2l(i, j, desc, nprow, npcol, myrow, mycol, ii, jj, prow, pcol)
Definition pblastst.f:1673

pb_locinfo
subroutine pb_locinfo(i, inb, nb, myroc, srcproc, nprocs, ilocblk, ilocoff, mydist)
Definition pblastst.f:3910

pb_descinit2
subroutine pb_descinit2(desc, m, n, imb, inb, mb, nb, rsrc, csrc, ctxt, lld, info)
Definition pblastst.f:3337

pvdescchk
subroutine pvdescchk(ictxt, nout, matrix, descx, dtx, mx, nx, imbx, inbx, mbx, nbx, rsrcx, csrcx, incx, mpx, nqx, iprex, imidx, ipostx, igap, gapmul, info)
Definition pblastst.f:388

pb_chkmat
subroutine pb_chkmat(ictxt, m, mpos0, n, npos0, ia, ja, desca, dpos0, info)
Definition pblastst.f:2742

pb_lmul
subroutine pb_lmul(k, j, i)
Definition pblastst.f:4559

pb_jump
subroutine pb_jump(k, muladd, irann, iranm, ima)
Definition pblastst.f:4648

pb_noabort
integer function pb_noabort(cinfo)
Definition pblastst.f:1622

pb_setlocran
subroutine pb_setlocran(seed, ilocblk, jlocblk, ilocoff, jlocoff, myrdist, mycdist, nprow, npcol, jmp, imuladd, iran)
Definition pblastst.f:4302

pb_initmuladd
subroutine pb_initmuladd(muladd0, jmp, imuladd)
Definition pblastst.f:4196

lsamen
logical function lsamen(n, ca, cb)
Definition pblastst.f:1457

pb_desctrans
subroutine pb_desctrans(descin, descout)
Definition pblastst.f:2964

pb_initjmp
subroutine pb_initjmp(colmaj, nvir, imbvir, inbvir, imbloc, inbloc, mb, nb, rsrc, csrc, nprow, npcol, stride, jmp)
Definition pblastst.f:4045

pb_jumpit
subroutine pb_jumpit(muladd, irann, iranm)
Definition pblastst.f:4822

pb_numroc
integer function pb_numroc(n, i, inb, nb, proc, srcproc, nprocs)
Definition pblastst.f:2548

max
#define max(A, B)
Definition pcgemr.c:180

min
#define min(A, B)
Definition pcgemr.c:181

pilaenv
integer function pilaenv(ictxt, prec)
Definition pilaenv.f:2

pxerbla
subroutine pxerbla(ictxt, srname, info)
Definition pxerbla.f:2

lsame
logical function lsame(ca, cb)
Definition tools.f:1724