*  da/d2f/claed8_8f_source.html

*> \brief \b CLAED8 used by CSTEDC. Merges eigenvalues and deflates secular equation. Used when the original matrix is dense.

*

*  =========== DOCUMENTATION ===========

*

* Online html documentation available at

*            http://www.netlib.org/lapack/explore-html/

*

*> \htmlonly

*> Download CLAED8 + dependencies

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/claed8.f">

*> [TGZ]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/claed8.f">

*> [ZIP]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/claed8.f">

*> [TXT]</a>

*> \endhtmlonly

*

*  Definition:

*  ===========

*

*       SUBROUTINE CLAED8( K, N, QSIZ, Q, LDQ, D, RHO, CUTPNT, Z, DLAMDA,

*                          Q2, LDQ2, W, INDXP, INDX, INDXQ, PERM, GIVPTR,

*                          GIVCOL, GIVNUM, INFO )

*

*       .. Scalar Arguments ..

*       INTEGER            CUTPNT, GIVPTR, INFO, K, LDQ, LDQ2, N, QSIZ

*       REAL               RHO

*       ..

*       .. Array Arguments ..

*       INTEGER            GIVCOL( 2, * ), INDX( * ), INDXP( * ),

*      $                   INDXQ( * ), PERM( * )

*       REAL               D( * ), DLAMDA( * ), GIVNUM( 2, * ), W( * ),

*      $                   Z( * )

*       COMPLEX            Q( LDQ, * ), Q2( LDQ2, * )

*       ..

*

*

*> \par Purpose:

*  =============

*>

*> \verbatim

*>

*> CLAED8 merges the two sets of eigenvalues together into a single

*> sorted set.  Then it tries to deflate the size of the problem.

*> There are two ways in which deflation can occur:  when two or more

*> eigenvalues are close together or if there is a tiny element in the

*> Z vector.  For each such occurrence the order of the related secular

*> equation problem is reduced by one.

*> \endverbatim

*

*  Arguments:

*  ==========

*

*> \param[out] K

*> \verbatim

*>          K is INTEGER

*>         Contains the number of non-deflated eigenvalues.

*>         This is the order of the related secular equation.

*> \endverbatim

*>

*> \param[in] N

*> \verbatim

*>          N is INTEGER

*>         The dimension of the symmetric tridiagonal matrix.  N >= 0.

*> \endverbatim

*>

*> \param[in] QSIZ

*> \verbatim

*>          QSIZ is INTEGER

*>         The dimension of the unitary matrix used to reduce

*>         the dense or band matrix to tridiagonal form.

*>         QSIZ >= N.

*> \endverbatim

*>

*> \param[in,out] Q

*> \verbatim

*>          Q is COMPLEX array, dimension (LDQ,N)

*>         On entry, Q contains the eigenvectors of the partially solved

*>         system which has been previously updated in matrix

*>         multiplies with other partially solved eigensystems.

*>         On exit, Q contains the trailing (N-K) updated eigenvectors

*>         (those which were deflated) in its last N-K columns.

*> \endverbatim

*>

*> \param[in] LDQ

*> \verbatim

*>          LDQ is INTEGER

*>         The leading dimension of the array Q.  LDQ >= max( 1, N ).

*> \endverbatim

*>

*> \param[in,out] D

*> \verbatim

*>          D is REAL array, dimension (N)

*>         On entry, D contains the eigenvalues of the two submatrices to

*>         be combined.  On exit, D contains the trailing (N-K) updated

*>         eigenvalues (those which were deflated) sorted into increasing

*>         order.

*> \endverbatim

*>

*> \param[in,out] RHO

*> \verbatim

*>          RHO is REAL

*>         Contains the off diagonal element associated with the rank-1

*>         cut which originally split the two submatrices which are now

*>         being recombined. RHO is modified during the computation to

*>         the value required by SLAED3.

*> \endverbatim

*>

*> \param[in] CUTPNT

*> \verbatim

*>          CUTPNT is INTEGER

*>         Contains the location of the last eigenvalue in the leading

*>         sub-matrix.  MIN(1,N) <= CUTPNT <= N.

*> \endverbatim

*>

*> \param[in,out] Z

*> \verbatim

*>          Z is REAL array, dimension (N)

*>         On input this vector contains the updating vector (the last

*>         row of the first sub-eigenvector matrix and the first row of

*>         the second sub-eigenvector matrix).  The contents of Z are

*>         destroyed during the updating process.

*> \endverbatim

*>

*> \param[out] DLAMDA

*> \verbatim

*>          DLAMDA is REAL array, dimension (N)

*>         Contains a copy of the first K eigenvalues which will be used

*>         by SLAED3 to form the secular equation.

*> \endverbatim

*>

*> \param[out] Q2

*> \verbatim

*>          Q2 is COMPLEX array, dimension (LDQ2,N)

*>         Q2 is always referenced.  On exit it contains a copy of the

*>         first K eigenvectors which will be used

*>         by SLAED7 in a matrix multiply (SGEMM) to update the new

*>         eigenvectors.

*> \endverbatim

*>

*> \param[in] LDQ2

*> \verbatim

*>          LDQ2 is INTEGER

*>         The leading dimension of the array Q2.  LDQ2 >= max( 1, N ).

*> \endverbatim

*>

*> \param[out] W

*> \verbatim

*>          W is REAL array, dimension (N)

*>         This will hold the first k values of the final

*>         deflation-altered z-vector and will be passed to SLAED3.

*> \endverbatim

*>

*> \param[out] INDXP

*> \verbatim

*>          INDXP is INTEGER array, dimension (N)

*>         This will contain the permutation used to place deflated

*>         values of D at the end of the array. On output INDXP(1:K)

*>         points to the nondeflated D-values and INDXP(K+1:N)

*>         points to the deflated eigenvalues.

*> \endverbatim

*>

*> \param[out] INDX

*> \verbatim

*>          INDX is INTEGER array, dimension (N)

*>         This will contain the permutation used to sort the contents of

*>         D into ascending order.

*> \endverbatim

*>

*> \param[in,out] INDXQ

*> \verbatim

*>          INDXQ is INTEGER array, dimension (N)

*>         This contains the permutation which separately sorts the two

*>         sub-problems in D into ascending order.  Note that elements in

*>         the second half of this permutation must first have CUTPNT

*>         added to their values in order to be accurate.

*> \endverbatim

*>

*> \param[out] PERM

*> \verbatim

*>          PERM is INTEGER array, dimension (N)

*>         Contains the permutations (from deflation and sorting) to be

*>         applied to each eigenblock.

*> \endverbatim

*>

*> \param[out] GIVPTR

*> \verbatim

*>          GIVPTR is INTEGER

*>         Contains the number of Givens rotations which took place in

*>         this subproblem.

*> \endverbatim

*>

*> \param[out] GIVCOL

*> \verbatim

*>          GIVCOL is INTEGER array, dimension (2, N)

*>         Each pair of numbers indicates a pair of columns to take place

*>         in a Givens rotation.

*> \endverbatim

*>

*> \param[out] GIVNUM

*> \verbatim

*>          GIVNUM is REAL array, dimension (2, N)

*>         Each pair of numbers indicates the C and S values to be used

*>         in the corresponding Givens rotation.

*> \endverbatim

*>

*> \param[out] INFO

*> \verbatim

*>          INFO is INTEGER

*>          = 0:  successful exit.

*>          < 0:  if INFO = -i, the i-th argument had an illegal value.

*> \endverbatim

*

*  Authors:

*  ========

*

*> \author Univ. of Tennessee

*> \author Univ. of California Berkeley

*> \author Univ. of Colorado Denver

*> \author NAG Ltd.

*

*> \date September 2012

*

*> \ingroup complexOTHERcomputational

*

*  =====================================================================

      SUBROUTINE claed8( k, n, qsiz, q, ldq, d, rho, cutpnt, z, dlamda,
     $                   q2, ldq2, w, indxp, indx, indxq, perm, givptr,
     $                   givcol, givnum, info )
*
*  -- LAPACK computational routine (version 3.4.2) --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*     September 2012
*
*  Summary of what this routine does
*  =================================
*
*  1. Validates N, QSIZ, LDQ, CUTPNT and LDQ2; on failure INFO is set
*     to minus the argument position, XERBLA is called and the routine
*     returns without touching the other outputs.
*  2. Flips the sign of Z(CUTPNT+1:N) when RHO < 0, scales Z by
*     1/sqrt(2) and replaces RHO by |2*RHO|.
*  3. Adds CUTPNT to INDXQ(CUTPNT+1:N) in place, gathers D and Z
*     through INDXQ, merges the two runs with SLAMRG (result in INDX)
*     and overwrites D and Z with the merged ordering.
*  4. Computes TOL = 8*eps*max|D|.  If RHO*max|Z| <= TOL everything
*     deflates: K = 0, the columns of Q are permuted (via Q2) and the
*     routine returns.
*  5. Otherwise walks through the merged values, deflating entries
*     with a negligible Z component or pairs that a plane rotation
*     can decouple.  Each rotation is applied to Q with CSROT and
*     recorded in GIVCOL / GIVNUM.
*  6. Copies D and the columns of Q, in INDXP order, into DLAMDA and
*     Q2, then copies the trailing N-K entries/columns back into D
*     and Q.
*
*  NOTE(review): columns of Q and Q2 are accessed with QSIZ rows below,
*  while the argument checks only enforce LDQ, LDQ2 >= max(1,N).
*  Confirm that callers always pass leading dimensions >= QSIZ.
*
      IMPLICIT NONE
*
*     .. Scalar Arguments ..
      INTEGER            cutpnt, givptr, info, k, ldq, ldq2, n, qsiz
      REAL               rho
*     ..
*     .. Array Arguments ..
      INTEGER            givcol( 2, * ), indx( * ), indxp( * ),
     $                   indxq( * ), perm( * )
      REAL               d( * ), dlamda( * ), givnum( 2, * ), w( * ),
     $                   z( * )
      COMPLEX            q( ldq, * ), q2( ldq2, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               mone, zero, one, two, eight
      PARAMETER          ( mone = -1.0e0, zero = 0.0e0, one = 1.0e0,
     $                   two = 2.0e0, eight = 8.0e0 )
*     ..
*     .. Local Scalars ..
      INTEGER            i, imax, j, jlam, jmax, jp, k2, n1, n1p1, n2
      REAL               c, eps, s, t, tau, tol
*     ..
*     .. External Functions ..
      INTEGER            isamax
      REAL               slamch, slapy2
      EXTERNAL           isamax, slamch, slapy2
*     ..
*     .. External Subroutines ..
      EXTERNAL           ccopy, clacpy, csrot, scopy, slamrg, sscal,
     $                   xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the input parameters.
*
      info = 0
*
      IF( n.LT.0 ) THEN
         info = -2
      ELSE IF( qsiz.LT.n ) THEN
         info = -3
      ELSE IF( ldq.LT.max( 1, n ) ) THEN
         info = -5
      ELSE IF( cutpnt.LT.min( 1, n ) .OR. cutpnt.GT.n ) THEN
         info = -8
      ELSE IF( ldq2.LT.max( 1, n ) ) THEN
         info = -12
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'CLAED8', -info )
         RETURN
      END IF
*
*     GIVPTR must be set to zero here so that it is defined on every
*     early exit below.  Otherwise the behaviour is unspecified
*     (usually a segfault) when the IWORK array on entry to *stedc is
*     not zeroed (or at least the IWORK entries used in *laed7 for
*     GIVPTR).
*
      givptr = 0
*
*     Quick return if possible.  K is an output argument, so give it
*     a defined value (no non-deflated eigenvalues) on this path too.
*
      IF( n.EQ.0 ) THEN
         k = 0
         RETURN
      END IF
*
      n1 = cutpnt
      n2 = n - n1
      n1p1 = n1 + 1
*
*     A negative RHO is absorbed by negating the second part of Z;
*     RHO itself is made non-negative below.
*
      IF( rho.LT.zero ) THEN
         CALL sscal( n2, mone, z( n1p1 ), 1 )
      END IF
*
*     Normalize z so that norm(z) = 1
*
      t = one / sqrt( two )
      DO 10 j = 1, n
         indx( j ) = j
   10 CONTINUE
      CALL sscal( n, t, z, 1 )
      rho = abs( two*rho )
*
*     Sort the eigenvalues into increasing order.
*
*     First make the second half of INDXQ refer to positions in the
*     full arrays (INDXQ is modified in place).
*
      DO 20 i = cutpnt + 1, n
         indxq( i ) = indxq( i ) + cutpnt
   20 CONTINUE
*
*     Gather D and Z through INDXQ into the scratch arrays DLAMDA, W.
*
      DO 30 i = 1, n
         dlamda( i ) = d( indxq( i ) )
         w( i ) = z( indxq( i ) )
   30 CONTINUE
*
*     Merge the two runs of DLAMDA; INDX receives the merge
*     permutation, which is then used to overwrite D and Z.
*
      CALL slamrg( n1, n2, dlamda, 1, 1, indx )
      DO 40 i = 1, n
         d( i ) = dlamda( indx( i ) )
         z( i ) = w( indx( i ) )
   40 CONTINUE
*
*     Calculate the allowable deflation tolerance
*
      imax = isamax( n, z, 1 )
      jmax = isamax( n, d, 1 )
      eps = slamch( 'Epsilon' )
      tol = eight*eps*abs( d( jmax ) )
*
*     If the rank-1 modifier is small enough, no more needs to be done
*     -- except to reorganize Q so that its columns correspond with the
*     elements in D.
*
      IF( rho*abs( z( imax ) ).LE.tol ) THEN
         k = 0
         DO 50 j = 1, n
            perm( j ) = indxq( indx( j ) )
            CALL ccopy( qsiz, q( 1, perm( j ) ), 1, q2( 1, j ), 1 )
   50    CONTINUE
         CALL clacpy( 'A', qsiz, n, q2( 1, 1 ), ldq2, q( 1, 1 ), ldq )
         RETURN
      END IF
*
*     If there are multiple eigenvalues then the problem deflates.  Here
*     the number of equal eigenvalues are found.  As each equal
*     eigenvalue is found, a plane (Givens) rotation is computed to
*     rotate the corresponding eigensubspace so that the corresponding
*     components of Z are zero in this new basis.
*
*     K counts the non-deflated entries, stored from the front of
*     INDXP; K2 is the first used slot of the deflated entries, which
*     are stored from the back of INDXP.
*
      k = 0
      k2 = n + 1
*
*     Skip leading entries with negligible Z; the first entry that is
*     not negligible becomes the current candidate JLAM.
*
      DO 60 j = 1, n
         IF( rho*abs( z( j ) ).LE.tol ) THEN
*
*           Deflate due to small z component.
*
            k2 = k2 - 1
            indxp( k2 ) = j
            IF( j.EQ.n )
     $         GO TO 100
         ELSE
            jlam = j
            GO TO 70
         END IF
   60 CONTINUE
*
*     Main scan: compare the candidate JLAM with the next entry J.
*
   70 CONTINUE
      j = j + 1
      IF( j.GT.n )
     $   GO TO 90
      IF( rho*abs( z( j ) ).LE.tol ) THEN
*
*        Deflate due to small z component.
*
         k2 = k2 - 1
         indxp( k2 ) = j
      ELSE
*
*        Check if eigenvalues are close enough to allow deflation.
*
         s = z( jlam )
         c = z( j )
*
*        Find sqrt(a**2+b**2) without overflow or
*        destructive underflow.
*
         tau = slapy2( c, s )
         t = d( j ) - d( jlam )
         c = c / tau
         s = -s / tau
         IF( abs( t*c*s ).LE.tol ) THEN
*
*           Deflation is possible.
*
            z( j ) = tau
            z( jlam ) = zero
*
*           Record the appropriate Givens rotation
*
            givptr = givptr + 1
            givcol( 1, givptr ) = indxq( indx( jlam ) )
            givcol( 2, givptr ) = indxq( indx( j ) )
            givnum( 1, givptr ) = c
            givnum( 2, givptr ) = s
            CALL csrot( qsiz, q( 1, indxq( indx( jlam ) ) ), 1,
     $                  q( 1, indxq( indx( j ) ) ), 1, c, s )
*
*           Update the two eigenvalues; T holds the new D(JLAM) until
*           D(J) has been computed from the old values.
*
            t = d( jlam )*c*c + d( j )*s*s
            d( j ) = d( jlam )*s*s + d( j )*c*c
            d( jlam ) = t
*
*           Insert JLAM into the deflated tail INDXP(K2:N): starting
*           at slot K2, move it one slot to the right for as long as
*           the next entry has a larger D value.
*
            k2 = k2 - 1
            i = 1
   80       CONTINUE
            IF( k2+i.LE.n ) THEN
               IF( d( jlam ).LT.d( indxp( k2+i ) ) ) THEN
                  indxp( k2+i-1 ) = indxp( k2+i )
                  indxp( k2+i ) = jlam
                  i = i + 1
                  GO TO 80
               ELSE
                  indxp( k2+i-1 ) = jlam
               END IF
            ELSE
               indxp( k2+i-1 ) = jlam
            END IF
            jlam = j
         ELSE
*
*           No deflation: record JLAM as the next non-deflated entry
*           and make J the new candidate.
*
            k = k + 1
            w( k ) = z( jlam )
            dlamda( k ) = d( jlam )
            indxp( k ) = jlam
            jlam = j
         END IF
      END IF
      GO TO 70
   90 CONTINUE
*
*     Record the last eigenvalue.
*
      k = k + 1
      w( k ) = z( jlam )
      dlamda( k ) = d( jlam )
      indxp( k ) = jlam
*
  100 CONTINUE
*
*     Sort the eigenvalues and corresponding eigenvectors into DLAMDA
*     and Q2 respectively.  The eigenvalues/vectors which were not
*     deflated go into the first K slots of DLAMDA and Q2 respectively,
*     while those which were deflated go into the last N - K slots.
*
      DO 110 j = 1, n
         jp = indxp( j )
         dlamda( j ) = d( jp )
         perm( j ) = indxq( indx( jp ) )
         CALL ccopy( qsiz, q( 1, perm( j ) ), 1, q2( 1, j ), 1 )
  110 CONTINUE
*
*     The deflated eigenvalues and their corresponding vectors go back
*     into the last N - K slots of D and Q respectively.
*
      IF( k.LT.n ) THEN
         CALL scopy( n-k, dlamda( k+1 ), 1, d( k+1 ), 1 )
         CALL clacpy( 'A', qsiz, n-k, q2( 1, k+1 ), ldq2, q( 1, k+1 ),
     $                ldq )
      END IF
*
      RETURN
*
*     End of CLAED8
*
      END