*  d8/d5b/dlar1va_8f_source.html

      SUBROUTINE DLAR1VA(N, B1, BN, LAMBDA, D, L, LD, LLD,
     $           PIVMIN, GAPTOL, Z, WANTNC, NEGCNT, ZTZ, MINGMA,
     $           R, ISUPPZ, NRMINV, RESID, RQCORR, WORK )
*
      IMPLICIT NONE
*
*  -- ScaLAPACK computational routine (version 2.0) --
*     Univ. of Tennessee, Univ. of California Berkeley, Univ of Colorado Denver
*     July 4, 2010
*
*     .. Scalar Arguments ..
      LOGICAL            WANTNC
      INTEGER            B1, BN, N, NEGCNT, R
      DOUBLE PRECISION   GAPTOL, LAMBDA, MINGMA, NRMINV, PIVMIN, RESID,
     $                   RQCORR, ZTZ
*     ..
*     .. Array Arguments ..
      INTEGER            ISUPPZ( * )
      DOUBLE PRECISION   D( * ), L( * ), LD( * ), LLD( * ),
     $                   WORK( * )
      DOUBLE PRECISION   Z( * )
*
*  Purpose
*  =======
*
*  DLAR1VA computes the (scaled) r-th column of the inverse of
*  the submatrix in rows B1 through BN of the tridiagonal matrix
*  L D L^T - sigma I. When sigma is close to an eigenvalue, the
*  computed vector is an accurate eigenvector. Usually, r corresponds
*  to the index where the eigenvector is largest in magnitude.
*  The following steps accomplish this computation :
*  (a) Stationary qd transform,  L D L^T - sigma I = L(+) D(+) L(+)^T,
*  (b) Progressive qd transform, L D L^T - sigma I = U(-) D(-) U(-)^T,
*  (c) Computation of the diagonal elements of the inverse of
*      L D L^T - sigma I by combining the above transforms, and choosing
*      r as the index where the diagonal of the inverse is (one of the)
*      largest in magnitude.
*  (d) Computation of the (scaled) r-th column of the inverse using the
*      twisted factorization obtained by combining the top part of
*      the stationary and the bottom part of the progressive transform.
*
*  Both transforms are first run without safeguards. If the result of
*  a transform is a NaN (as reported by DISNAN), that transform is
*  recomputed with every pivot of magnitude below PIVMIN replaced by
*  -PIVMIN, and the matching part of Z is computed with a guarded
*  recurrence.
*
*  Arguments
*  =========
*
*  N        (input) INTEGER
*           The order of the matrix L D L^T.
*
*  B1       (input) INTEGER
*           First index of the submatrix of L D L^T.
*
*  BN       (input) INTEGER
*           Last index of the submatrix of L D L^T.
*
*  LAMBDA   (input) DOUBLE PRECISION
*           The shift. In order to compute an accurate eigenvector,
*           LAMBDA should be a good approximation to an eigenvalue
*           of L D L^T.
*
*  D        (input) DOUBLE PRECISION array, dimension (N)
*           The n diagonal elements of the diagonal matrix D.
*
*  L        (input) DOUBLE PRECISION array, dimension (N-1)
*           The (n-1) subdiagonal elements of the unit bidiagonal matrix
*           L, in elements 1 to N-1.
*
*  LD       (input) DOUBLE PRECISION array, dimension (N-1)
*           The n-1 elements L(i)*D(i).
*
*  LLD      (input) DOUBLE PRECISION array, dimension (N-1)
*           The n-1 elements L(i)*L(i)*D(i).
*
*  PIVMIN   (input) DOUBLE PRECISION
*           The minimum pivot in the Sturm sequence.
*
*  GAPTOL   (input) DOUBLE PRECISION
*           Tolerance that indicates when eigenvector entries are negligible
*           w.r.t. their contribution to the residual.
*           GAPTOL is not referenced by this routine; entries of Z are
*           compared against DLAMCH( 'Precision' ) instead.
*
*  Z        (input/output) DOUBLE PRECISION array, dimension (N)
*           On input, all entries of Z must be set to 0.
*           On output, Z contains the (scaled) r-th column of the
*           inverse. The scaling is such that Z(R) equals 1.
*
*  WANTNC   (input) LOGICAL
*           Specifies whether NEGCNT has to be computed.
*
*  NEGCNT   (output) INTEGER
*           If WANTNC is .TRUE. then NEGCNT is the number of negative
*           pivots counted in the stationary transform for rows B1
*           to R1-1 and in the progressive transform for rows BN-1
*           down to R1, plus one if the twist element at R1 is
*           negative (R1 = B1 if R is 0 on input, R1 = R otherwise).
*           NEGCNT = -1 if WANTNC is .FALSE.
*
*  ZTZ      (output) DOUBLE PRECISION
*           The square of the 2-norm of Z.
*
*  MINGMA   (output) DOUBLE PRECISION
*           The reciprocal of the largest (in magnitude) diagonal
*           element of the inverse of L D L^T - sigma I.
*
*  R        (input/output) INTEGER
*           The twist index for the twisted factorization used to
*           compute Z.
*           On input, 0 <= R <= N. If R is input as 0, R is set to
*           the index where (L D L^T - sigma I)^{-1} is largest
*           in magnitude. If 1 <= R <= N, R is unchanged.
*           On output, R contains the twist index used to compute Z.
*           Ideally, R designates the position of the maximum entry in the
*           eigenvector.
*
*  ISUPPZ   (output) INTEGER array, dimension (2)
*           The support of the vector in Z, i.e., the vector Z is
*           nonzero only in elements ISUPPZ(1) through ISUPPZ( 2 ).
*           B1 <= ISUPPZ(1) <= R <= ISUPPZ(2) <= BN.
*
*  NRMINV   (output) DOUBLE PRECISION
*           NRMINV = 1/SQRT( ZTZ )
*
*  RESID    (output) DOUBLE PRECISION
*           The residual of the FP vector.
*           RESID = ABS( MINGMA )/SQRT( ZTZ )
*
*  RQCORR   (output) DOUBLE PRECISION
*           The Rayleigh Quotient correction to LAMBDA.
*           RQCORR = MINGMA / ZTZ
*
*  WORK     (workspace) DOUBLE PRECISION array, dimension (4*N)
*           WORK(     I ), multipliers of the stationary transform,
*           WORK(   N+I ), multipliers of the progressive transform,
*           WORK( 2*N+I ), the auxiliary quantity S at index I,
*           WORK( 3*N+I ), the auxiliary quantity P at index I.
*
*  Further Details
*  ===============
*
*  Based on contributions by
*     Beresford Parlett, University of California, Berkeley, USA
*     Jim Demmel, University of California, Berkeley, USA
*     Inderjit Dhillon, University of Texas, Austin, USA
*     Osni Marques, LBNL/NERSC, USA
*     Christof Voemel, University of California, Berkeley, USA
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            BLKLEN
      PARAMETER          ( BLKLEN = 16 )
      DOUBLE PRECISION   ZERO, ONE
      PARAMETER          ( ZERO = 0.0D0, ONE = 1.0D0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            SAWNAN1, SAWNAN2
      INTEGER            BI, I, INDLPL, INDP, INDS, INDUMN, NB, NEG1,
     $                   NEG2, NX, R1, R2, TO
      DOUBLE PRECISION   ABSZCUR, ABSZPREV, DMINUS, DPLUS, EPS,
     $                   S, TMP, ZPREV
*     ..
*     .. External Functions ..
      LOGICAL            DISNAN
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           DISNAN, DLAMCH
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          ABS, INT, SQRT
*     ..
*     .. Executable Statements ..
*
      EPS = DLAMCH( 'Precision' )
*
*     A zero R on input means "search all of B1..BN for the twist
*     index"; otherwise the twist index is fixed to R.
*
      IF( R.EQ.0 ) THEN
         R1 = B1
         R2 = BN
      ELSE
         R1 = R
         R2 = R
      END IF
*
*     Storage for LPLUS
      INDLPL = 0
*     Storage for UMINUS
      INDUMN = N
*     Storage for the auxiliary quantities S and P
      INDS = 2*N + 1
      INDP = 3*N + 1
*
      IF( B1.EQ.1 ) THEN
         WORK( INDS ) = ZERO
      ELSE
         WORK( INDS+B1-1 ) = LLD( B1-1 )
      END IF
*
*     Compute the stationary transform (using the differential form)
*     until the index R2.
*
      SAWNAN1 = .FALSE.
      NEG1 = 0
      S = WORK( INDS+B1-1 ) - LAMBDA
      DO 50 I = B1, R1 - 1
         DPLUS = D( I ) + S
         WORK( INDLPL+I ) = LD( I ) / DPLUS
         IF( DPLUS.LT.ZERO ) NEG1 = NEG1 + 1
         WORK( INDS+I ) = S*WORK( INDLPL+I )*L( I )
         S = WORK( INDS+I ) - LAMBDA
 50   CONTINUE
      SAWNAN1 = DISNAN( S )
      IF( SAWNAN1 ) GOTO 60
*     Negative pivots are only counted up to R1, not beyond.
      DO 51 I = R1, R2 - 1
         DPLUS = D( I ) + S
         WORK( INDLPL+I ) = LD( I ) / DPLUS
         WORK( INDS+I ) = S*WORK( INDLPL+I )*L( I )
         S = WORK( INDS+I ) - LAMBDA
 51   CONTINUE
      SAWNAN1 = DISNAN( S )
*
 60   CONTINUE
      IF( SAWNAN1 ) THEN
*        Runs a slower version of the above loop if a NaN is detected
         NEG1 = 0
         S = WORK( INDS+B1-1 ) - LAMBDA
         DO 70 I = B1, R1 - 1
            DPLUS = D( I ) + S
            IF( ABS( DPLUS ).LT.PIVMIN ) DPLUS = -PIVMIN
            WORK( INDLPL+I ) = LD( I ) / DPLUS
            IF( DPLUS.LT.ZERO ) NEG1 = NEG1 + 1
            WORK( INDS+I ) = S*WORK( INDLPL+I )*L( I )
            IF( WORK( INDLPL+I ).EQ.ZERO )
     $         WORK( INDS+I ) = LLD( I )
            S = WORK( INDS+I ) - LAMBDA
 70      CONTINUE
         DO 71 I = R1, R2 - 1
            DPLUS = D( I ) + S
            IF( ABS( DPLUS ).LT.PIVMIN ) DPLUS = -PIVMIN
            WORK( INDLPL+I ) = LD( I ) / DPLUS
            WORK( INDS+I ) = S*WORK( INDLPL+I )*L( I )
            IF( WORK( INDLPL+I ).EQ.ZERO )
     $         WORK( INDS+I ) = LLD( I )
            S = WORK( INDS+I ) - LAMBDA
 71      CONTINUE
      END IF
*
*     Compute the progressive transform (using the differential form)
*     until the index R1
*
      SAWNAN2 = .FALSE.
      NEG2 = 0
      WORK( INDP+BN-1 ) = D( BN ) - LAMBDA
      DO 80 I = BN - 1, R1, -1
         DMINUS = LLD( I ) + WORK( INDP+I )
         TMP = D( I ) / DMINUS
         IF( DMINUS.LT.ZERO ) NEG2 = NEG2 + 1
         WORK( INDUMN+I ) = L( I )*TMP
         WORK( INDP+I-1 ) = WORK( INDP+I )*TMP - LAMBDA
 80   CONTINUE
      TMP = WORK( INDP+R1-1 )
      SAWNAN2 = DISNAN( TMP )
      IF( SAWNAN2 ) THEN
*        Runs a slower version of the above loop if a NaN is detected
         NEG2 = 0
         DO 100 I = BN - 1, R1, -1
            DMINUS = LLD( I ) + WORK( INDP+I )
            IF( ABS( DMINUS ).LT.PIVMIN ) DMINUS = -PIVMIN
            TMP = D( I ) / DMINUS
            IF( DMINUS.LT.ZERO ) NEG2 = NEG2 + 1
            WORK( INDUMN+I ) = L( I )*TMP
            WORK( INDP+I-1 ) = WORK( INDP+I )*TMP - LAMBDA
            IF( TMP.EQ.ZERO )
     $         WORK( INDP+I-1 ) = D( I ) - LAMBDA
 100     CONTINUE
      END IF
*
*     Find the index (from R1 to R2) of the largest (in magnitude)
*     diagonal element of the inverse
*
      MINGMA = WORK( INDS+R1-1 ) + WORK( INDP+R1-1 )
      IF( MINGMA.LT.ZERO ) NEG1 = NEG1 + 1
      IF( WANTNC ) THEN
         NEGCNT = NEG1 + NEG2
      ELSE
         NEGCNT = -1
      END IF
      IF( ABS( MINGMA ).EQ.ZERO )
     $   MINGMA = EPS*WORK( INDS+R1-1 )
      R = R1
      DO 110 I = R1, R2 - 1
         TMP = WORK( INDS+I ) + WORK( INDP+I )
         IF( TMP.EQ.ZERO )
     $      TMP = EPS*WORK( INDS+I )
         IF( ABS( TMP ).LE.ABS( MINGMA ) ) THEN
            MINGMA = TMP
            R = I + 1
         END IF
 110  CONTINUE
*
*     Compute the FP vector: solve N^T v = e_r
*
      ISUPPZ( 1 ) = B1
      ISUPPZ( 2 ) = BN
      Z( R ) = ONE
      ZTZ = ONE
*
*     Compute the FP vector upwards from R. The first NB full blocks
*     of BLKLEN entries are each followed by a test for negligible
*     entries; the remaining entries NX-1 down to B1 are computed
*     without a test.
*
      NB = INT( ( R-B1 ) / BLKLEN )
      NX = R - NB*BLKLEN
      IF( .NOT.SAWNAN1 ) THEN
         DO 210 BI = R - 1, NX, -BLKLEN
            TO = BI - BLKLEN + 1
            DO 205 I = BI, TO, -1
               Z( I ) = -( WORK( INDLPL+I )*Z( I+1 ) )
               ZTZ = ZTZ + Z( I )*Z( I )
 205        CONTINUE
            IF( ABS( Z( TO ) ).LT.EPS .AND.
     $          ABS( Z( TO+1 ) ).LT.EPS ) THEN
               ISUPPZ( 1 ) = TO
               GOTO 220
            END IF
 210     CONTINUE
         DO 215 I = NX - 1, B1, -1
            Z( I ) = -( WORK( INDLPL+I )*Z( I+1 ) )
            ZTZ = ZTZ + Z( I )*Z( I )
 215     CONTINUE
 220     CONTINUE
      ELSE
*        Run slower loop if NaN occurred.
         DO 230 BI = R - 1, NX, -BLKLEN
            TO = BI - BLKLEN + 1
            DO 225 I = BI, TO, -1
               IF( Z( I+1 ).EQ.ZERO ) THEN
                  Z( I ) = -( LD( I+1 ) / LD( I ) )*Z( I+2 )
               ELSE
                  Z( I ) = -( WORK( INDLPL+I )*Z( I+1 ) )
               END IF
               ZTZ = ZTZ + Z( I )*Z( I )
 225        CONTINUE
            IF( ABS( Z( TO ) ).LT.EPS .AND.
     $          ABS( Z( TO+1 ) ).LT.EPS ) THEN
               ISUPPZ( 1 ) = TO
               GOTO 240
            END IF
 230     CONTINUE
         DO 235 I = NX - 1, B1, -1
            IF( Z( I+1 ).EQ.ZERO ) THEN
               Z( I ) = -( LD( I+1 ) / LD( I ) )*Z( I+2 )
            ELSE
               Z( I ) = -( WORK( INDLPL+I )*Z( I+1 ) )
            END IF
            ZTZ = ZTZ + Z( I )*Z( I )
 235     CONTINUE
 240     CONTINUE
      END IF
*     Clear the entries above the support.
      DO 245 I = B1, ( ISUPPZ( 1 )-1 )
         Z( I ) = ZERO
 245  CONTINUE
*
*     Compute the FP vector downwards from R in blocks of size BLKLEN
*
      IF( .NOT.SAWNAN2 ) THEN
         DO 260 BI = R + 1, BN, BLKLEN
            TO = BI + BLKLEN - 1
            IF( TO.LE.BN ) THEN
               DO 250 I = BI, TO
                  Z( I ) = -( WORK( INDUMN+I-1 )*Z( I-1 ) )
                  ZTZ = ZTZ + Z( I )*Z( I )
 250           CONTINUE
               IF( ABS( Z( TO ) ).LE.EPS .AND.
     $             ABS( Z( TO-1 ) ).LE.EPS ) THEN
                  ISUPPZ( 2 ) = TO
                  GOTO 265
               END IF
            ELSE
               DO 255 I = BI, BN
                  Z( I ) = -( WORK( INDUMN+I-1 )*Z( I-1 ) )
                  ZTZ = ZTZ + Z( I )*Z( I )
 255           CONTINUE
            END IF
 260     CONTINUE
 265     CONTINUE
      ELSE
*        Run slower loop if NaN occurred.
         DO 280 BI = R + 1, BN, BLKLEN
            TO = BI + BLKLEN - 1
            IF( TO.LE.BN ) THEN
               DO 270 I = BI, TO
                  ZPREV = Z( I-1 )
                  ABSZPREV = ABS( ZPREV )
                  IF( ZPREV.NE.ZERO ) THEN
                     Z( I ) = -( WORK( INDUMN+I-1 )*ZPREV )
                  ELSE
                     Z( I ) = -( LD( I-2 ) / LD( I-1 ) )*Z( I-2 )
                  END IF
                  ABSZCUR = ABS( Z( I ) )
                  ZTZ = ZTZ + ABSZCUR**2
 270           CONTINUE
*              ABSZCUR and ABSZPREV now hold ABS( Z( TO ) ) and
*              ABS( Z( TO-1 ) ).
               IF( ABSZCUR.LT.EPS .AND.
     $             ABSZPREV.LT.EPS ) THEN
*                 The DO variable I equals TO+1 once loop 270 has
*                 completed, so the last computed entry is Z( TO ).
*                 Using I here would report a support end one past
*                 that entry, and BN+1 when TO = BN.
                  ISUPPZ( 2 ) = TO
                  GOTO 285
               END IF
            ELSE
               DO 275 I = BI, BN
                  ZPREV = Z( I-1 )
                  ABSZPREV = ABS( ZPREV )
                  IF( ZPREV.NE.ZERO ) THEN
                     Z( I ) = -( WORK( INDUMN+I-1 )*ZPREV )
                  ELSE
                     Z( I ) = -( LD( I-2 ) / LD( I-1 ) )*Z( I-2 )
                  END IF
                  ABSZCUR = ABS( Z( I ) )
                  ZTZ = ZTZ + ABSZCUR**2
 275           CONTINUE
            END IF
 280     CONTINUE
 285     CONTINUE
      END IF
*     Clear the entries below the support.
      DO 290 I = ISUPPZ( 2 ) + 1, BN
         Z( I ) = ZERO
 290  CONTINUE
*
*     Compute quantities for convergence test
*
      TMP = ONE / ZTZ
      NRMINV = SQRT( TMP )
      RESID = ABS( MINGMA )*NRMINV
      RQCORR = MINGMA*TMP
*
      RETURN
*
*     End of DLAR1VA
*
      END