◆ slaqr2()

subroutine slaqr2	(	logical	wantt,
		logical	wantz,
		integer	n,
		integer	ktop,
		integer	kbot,
		integer	nw,
		real, dimension( ldh, * )	h,
		integer	ldh,
		integer	iloz,
		integer	ihiz,
		real, dimension( ldz, * )	z,
		integer	ldz,
		integer	ns,
		integer	nd,
		real, dimension( * )	sr,
		real, dimension( * )	si,
		real, dimension( ldv, * )	v,
		integer	ldv,
		integer	nh,
		real, dimension( ldt, * )	t,
		integer	ldt,
		integer	nv,
		real, dimension( ldwv, * )	wv,
		integer	ldwv,
		real, dimension( * )	work,
		integer	lwork )

SLAQR2 performs the orthogonal similarity transformation of a Hessenberg matrix to detect and deflate fully converged eigenvalues from a trailing principal submatrix (aggressive early deflation).

Download SLAQR2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!>    SLAQR2 is identical to SLAQR3 except that it avoids
!>    recursion by calling SLAHQR instead of SLAQR4.
!>
!>    Aggressive early deflation:
!>
!>    This subroutine accepts as input an upper Hessenberg matrix
!>    H and performs an orthogonal similarity transformation
!>    designed to detect and deflate fully converged eigenvalues from
!>    a trailing principal submatrix.  On output H has been over-
!>    written by a new Hessenberg matrix that is a perturbation of
!>    an orthogonal similarity transformation of H.  It is to be
!>    hoped that the final version of H has many zero subdiagonal
!>    entries.
!>

Parameters

[in]	WANTT	!> WANTT is LOGICAL !> If .TRUE., then the Hessenberg matrix H is fully updated !> so that the quasi-triangular Schur factor may be !> computed (in cooperation with the calling subroutine). !> If .FALSE., then only enough of H is updated to preserve !> the eigenvalues. !>
[in]	WANTZ	!> WANTZ is LOGICAL !> If .TRUE., then the orthogonal matrix Z is updated !> so that the orthogonal Schur factor may be computed !> (in cooperation with the calling subroutine). !> If .FALSE., then Z is not referenced. !>
[in]	N	!> N is INTEGER !> The order of the matrix H and (if WANTZ is .TRUE.) the !> order of the orthogonal matrix Z. !>
[in]	KTOP	!> KTOP is INTEGER !> It is assumed that either KTOP = 1 or H(KTOP,KTOP-1)=0. !> KBOT and KTOP together determine an isolated block !> along the diagonal of the Hessenberg matrix. !>
[in]	KBOT	!> KBOT is INTEGER !> It is assumed without a check that either !> KBOT = N or H(KBOT+1,KBOT)=0. KBOT and KTOP together !> determine an isolated block along the diagonal of the !> Hessenberg matrix. !>
[in]	NW	!> NW is INTEGER !> Deflation window size. 1 <= NW <= (KBOT-KTOP+1). !>
[in,out]	H	!> H is REAL array, dimension (LDH,N) !> On input the initial N-by-N section of H stores the !> Hessenberg matrix undergoing aggressive early deflation. !> On output H has been transformed by an orthogonal !> similarity transformation, perturbed, and then returned !> to Hessenberg form that (it is to be hoped) has some !> zero subdiagonal entries. !>
[in]	LDH	!> LDH is INTEGER !> Leading dimension of H just as declared in the calling !> subroutine. N <= LDH !>
[in]	ILOZ	!> ILOZ is INTEGER !>
[in]	IHIZ	!> IHIZ is INTEGER !> Specify the rows of Z to which transformations must be !> applied if WANTZ is .TRUE.. 1 <= ILOZ <= IHIZ <= N. !>
[in,out]	Z	!> Z is REAL array, dimension (LDZ,N) !> IF WANTZ is .TRUE., then on output, the orthogonal !> similarity transformation mentioned above has been !> accumulated into Z(ILOZ:IHIZ,ILOZ:IHIZ) from the right. !> If WANTZ is .FALSE., then Z is unreferenced. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of Z just as declared in the !> calling subroutine. 1 <= LDZ. !>
[out]	NS	!> NS is INTEGER !> The number of unconverged (i.e., approximate) eigenvalues !> returned in SR and SI that may be used as shifts by the !> calling subroutine. !>
[out]	ND	!> ND is INTEGER !> The number of converged eigenvalues uncovered by this !> subroutine. !>
[out]	SR	!> SR is REAL array, dimension (KBOT) !>
[out]	SI	!> SI is REAL array, dimension (KBOT) !> On output, the real and imaginary parts of approximate !> eigenvalues that may be used for shifts are stored in !> SR(KBOT-ND-NS+1) through SR(KBOT-ND) and !> SI(KBOT-ND-NS+1) through SI(KBOT-ND), respectively. !> The real and imaginary parts of converged eigenvalues !> are stored in SR(KBOT-ND+1) through SR(KBOT) and !> SI(KBOT-ND+1) through SI(KBOT), respectively. !>
[out]	V	!> V is REAL array, dimension (LDV,NW) !> An NW-by-NW work array. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of V just as declared in the !> calling subroutine. NW <= LDV !>
[in]	NH	!> NH is INTEGER !> The number of columns of T. NH >= NW. !>
[out]	T	!> T is REAL array, dimension (LDT,NW) !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of T just as declared in the !> calling subroutine. NW <= LDT !>
[in]	NV	!> NV is INTEGER !> The number of rows of work array WV available for !> workspace. NV >= NW. !>
[out]	WV	!> WV is REAL array, dimension (LDWV,NW) !>
[in]	LDWV	!> LDWV is INTEGER !> The leading dimension of WV just as declared in the !> calling subroutine. NV <= LDWV !>
[out]	WORK	!> WORK is REAL array, dimension (LWORK) !> On exit, WORK(1) is set to an estimate of the optimal value !> of LWORK for the given values of N, NW, KTOP and KBOT. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the work array WORK. LWORK = 2*NW !> suffices, but greater efficiency may result from larger !> values of LWORK. !> !> If LWORK = -1, then a workspace query is assumed; SLAQR2 !> only estimates the optimal workspace size for the given !> values of N, NW, KTOP and KBOT. The estimate is returned !> in WORK(1). No error message related to LWORK is issued !> by XERBLA. Neither H nor Z are accessed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Karen Braman and Ralph Byers, Department of Mathematics, University of Kansas, USA

Definition at line 273 of file slaqr2.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of SLAQR2 (aggressive early deflation).  Outline:
*    1. Estimate workspace; return early on a workspace query.
*    2. Copy the trailing JW-by-JW window of H into T and run
*       SLAHQR on it, accumulating the transformation in V.
*    3. Walk the diagonal blocks of T from the bottom up; a block
*       is deflated when the matching entries of the spike
*       S*V(1,:) are negligible, otherwise STREXC moves it up.
*    4. Store the window eigenvalues in SR/SI, return the
*       undeflated part to Hessenberg form and apply V to the
*       affected slabs of H and, if WANTZ, of Z.
*  On exit ND is the number of deflated eigenvalues and NS the
*  number of eigenvalues left over for use as shifts.
*
*     .. Scalar Arguments ..
      INTEGER            IHIZ, ILOZ, KBOT, KTOP, LDH, LDT, LDV, LDWV,
     $                   LDZ, LWORK, N, ND, NH, NS, NV, NW
      LOGICAL            WANTT, WANTZ
*     ..
*     .. Array Arguments ..
      REAL               H( LDH, * ), SI( * ), SR( * ), T( LDT, * ),
     $                   V( LDV, * ), WORK( * ), WV( LDWV, * ),
     $                   Z( LDZ, * )
*     ..
*
*  ================================================================
*     .. Parameters ..
      REAL               ZERO, ONE
      parameter( zero = 0.0e0, one = 1.0e0 )
*     ..
*     .. Local Scalars ..
*     (SAFMAX was assigned but never read, so it has been dropped.)
      REAL               AA, BB, CC, CS, DD, EVI, EVK, FOO, S,
     $                   SAFMIN, SMLNUM, SN, TAU, ULP
      INTEGER            I, IFST, ILST, INFO, INFQR, J, JW, K, KCOL,
     $                   KEND, KLN, KROW, KWTOP, LTOP, LWK1, LWK2,
     $                   LWKOPT
      LOGICAL            BULGE, SORTED
*     ..
*     .. External Functions ..
      REAL               SLAMCH, SROUNDUP_LWORK
      EXTERNAL           slamch, sroundup_lwork
*     ..
*     .. External Subroutines ..
*     (The reflector routine called below is SLARF1F, so that is
*     the name that must appear in this list.)
      EXTERNAL           scopy, sgehrd, sgemm, slacpy,
     $                   slahqr,
     $                   slanv2, slarf1f, slarfg, slaset, sormhr,
     $                   strexc
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, int, max, min, real, sqrt
*     ..
*     .. Executable Statements ..
*
*     ==== Estimate optimal workspace. ====
*
*     JW is the window size clamped to the active block size.
      jw = min( nw, kbot-ktop+1 )
      IF( jw.LE.2 ) THEN
         lwkopt = 1
      ELSE
*
*        ==== Workspace query call to SGEHRD ====
*        (LWORK = -1: only WORK(1) is set, to the optimal size.)
*
         CALL sgehrd( jw, 1, jw-1, t, ldt, work, work, -1, info )
         lwk1 = int( work( 1 ) )
*
*        ==== Workspace query call to SORMHR ====
*
         CALL sormhr( 'R', 'N', jw, jw, 1, jw-1, t, ldt, work, v,
     $                ldv,
     $                work, -1, info )
         lwk2 = int( work( 1 ) )
*
*        ==== Optimal workspace ====
*        The leading JW entries of WORK are passed as the TAU
*        array to SGEHRD/SORMHR below; the rest is their scratch.
*
         lwkopt = jw + max( lwk1, lwk2 )
      END IF
*
*     ==== Quick return in case of workspace query. ====
*
      IF( lwork.EQ.-1 ) THEN
         work( 1 ) = sroundup_lwork( lwkopt )
         RETURN
      END IF
*
*     ==== Nothing to do ...
*     ... for an empty active block ... ====
      ns = 0
      nd = 0
      work( 1 ) = one
      IF( ktop.GT.kbot )
     $   RETURN
*     ... nor for an empty deflation window. ====
      IF( nw.LT.1 )
     $   RETURN
*
*     ==== Machine constants ====
*
      safmin = slamch( 'SAFE MINIMUM' )
      ulp = slamch( 'PRECISION' )
      smlnum = safmin*( real( n ) / ulp )
*
*     ==== Setup deflation window ====
*     KWTOP is the first row/column of the window in H.  S is the
*     subdiagonal entry just left of the window; it is taken as
*     zero when the window starts at KTOP.
*
      jw = min( nw, kbot-ktop+1 )
      kwtop = kbot - jw + 1
      IF( kwtop.EQ.ktop ) THEN
         s = zero
      ELSE
         s = h( kwtop, kwtop-1 )
      END IF
*
      IF( kbot.EQ.kwtop ) THEN
*
*        ==== 1-by-1 deflation window: not much to do ====
*        The single diagonal entry is reported as a shift unless
*        S is negligible, in which case it is deflated and the
*        subdiagonal entry is set to zero.
*
         sr( kwtop ) = h( kwtop, kwtop )
         si( kwtop ) = zero
         ns = 1
         nd = 0
         IF( abs( s ).LE.max( smlnum, ulp*abs( h( kwtop, kwtop ) ) ) )
     $        THEN
            ns = 0
            nd = 1
            IF( kwtop.GT.ktop )
     $         h( kwtop, kwtop-1 ) = zero
         END IF
         work( 1 ) = one
         RETURN
      END IF
*
*     ==== Convert to spike-triangular form.  (In case of a
*     .    rare QR failure, this routine continues to do
*     .    aggressive early deflation using that part of
*     .    the deflation window that converged using INFQR
*     .    here and there to keep track.) ====
*
*     Copy the upper triangle and the first subdiagonal of the
*     window into T (stride LDH+1 / LDT+1 walks a diagonal).
      CALL slacpy( 'U', jw, jw, h( kwtop, kwtop ), ldh, t, ldt )
      CALL scopy( jw-1, h( kwtop+1, kwtop ), ldh+1, t( 2, 1 ),
     $            ldt+1 )
*
*     V starts as the identity and accumulates the transformation.
      CALL slaset( 'A', jw, jw, zero, one, v, ldv )
      CALL slahqr( .true., .true., jw, 1, jw, t, ldt, sr( kwtop ),
     $             si( kwtop ), 1, jw, v, ldv, infqr )
*
*     ==== STREXC needs a clean margin near the diagonal ====
*     Zero the second and third subdiagonals of T.
*
      DO 10 j = 1, jw - 3
         t( j+2, j ) = zero
         t( j+3, j ) = zero
   10 CONTINUE
      IF( jw.GT.2 )
     $   t( jw, jw-2 ) = zero
*
*     ==== Deflation detection loop ====
*     NS is the row of the bottom block still to be tested; ILST
*     is the row where the next undeflatable block is moved to.
*
      ns = jw
      ilst = infqr + 1
   20 CONTINUE
      IF( ilst.LE.ns ) THEN
*
*        A nonzero subdiagonal entry marks a 2-by-2 block.
         IF( ns.EQ.1 ) THEN
            bulge = .false.
         ELSE
            bulge = t( ns, ns-1 ).NE.zero
         END IF
*
*        ==== Small spike tip test for deflation ====
*
         IF( .NOT.bulge ) THEN
*
*           ==== Real eigenvalue ====
*
            foo = abs( t( ns, ns ) )
            IF( foo.EQ.zero )
     $         foo = abs( s )
            IF( abs( s*v( 1, ns ) ).LE.max( smlnum, ulp*foo ) ) THEN
*
*              ==== Deflatable ====
*
               ns = ns - 1
            ELSE
*
*              ==== Undeflatable.   Move it up out of the way.
*              .    (STREXC can not fail in this case.) ====
*
               ifst = ns
               CALL strexc( 'V', jw, t, ldt, v, ldv, ifst, ilst,
     $                      work,
     $                      info )
               ilst = ilst + 1
            END IF
         ELSE
*
*           ==== Complex conjugate pair ====
*
            foo = abs( t( ns, ns ) ) + sqrt( abs( t( ns, ns-1 ) ) )*
     $            sqrt( abs( t( ns-1, ns ) ) )
            IF( foo.EQ.zero )
     $         foo = abs( s )
            IF( max( abs( s*v( 1, ns ) ), abs( s*v( 1, ns-1 ) ) ).LE.
     $          max( smlnum, ulp*foo ) ) THEN
*
*              ==== Deflatable ====
*
               ns = ns - 2
            ELSE
*
*              ==== Undeflatable. Move them up out of the way.
*              .    Fortunately, STREXC does the right thing with
*              .    ILST in case of a rare exchange failure. ====
*
               ifst = ns
               CALL strexc( 'V', jw, t, ldt, v, ldv, ifst, ilst,
     $                      work,
     $                      info )
               ilst = ilst + 2
            END IF
         END IF
*
*        ==== End deflation detection loop ====
*
         GO TO 20
      END IF
*
*        ==== Return to Hessenberg form ====
*
*     With nothing left undeflated the spike is dropped entirely.
      IF( ns.EQ.0 )
     $   s = zero
*
      IF( ns.LT.jw ) THEN
*
*        ==== sorting diagonal blocks of T improves accuracy for
*        .    graded matrices.  Bubble sort deals well with
*        .    exchange failures. ====
*
*        Each pass scans the diagonal blocks from row INFQR+1 up
*        to KEND, comparing the magnitude estimates EVI and EVK
*        of neighbouring blocks and swapping them with STREXC
*        when EVI < EVK.  Passes repeat until one makes no swap.
*
         sorted = .false.
         i = ns + 1
   30    CONTINUE
         IF( sorted )
     $      GO TO 50
         sorted = .true.
*
         kend = i - 1
         i = infqr + 1
*        K is the first row of the block following block I.
         IF( i.EQ.ns ) THEN
            k = i + 1
         ELSE IF( t( i+1, i ).EQ.zero ) THEN
            k = i + 1
         ELSE
            k = i + 2
         END IF
   40    CONTINUE
         IF( k.LE.kend ) THEN
            IF( k.EQ.i+1 ) THEN
               evi = abs( t( i, i ) )
            ELSE
               evi = abs( t( i, i ) ) + sqrt( abs( t( i+1, i ) ) )*
     $               sqrt( abs( t( i, i+1 ) ) )
            END IF
*
            IF( k.EQ.kend ) THEN
               evk = abs( t( k, k ) )
            ELSE IF( t( k+1, k ).EQ.zero ) THEN
               evk = abs( t( k, k ) )
            ELSE
               evk = abs( t( k, k ) ) + sqrt( abs( t( k+1, k ) ) )*
     $               sqrt( abs( t( k, k+1 ) ) )
            END IF
*
            IF( evi.GE.evk ) THEN
               i = k
            ELSE
               sorted = .false.
               ifst = i
               ilst = k
               CALL strexc( 'V', jw, t, ldt, v, ldv, ifst, ilst,
     $                      work,
     $                      info )
*              After a successful swap continue from the row
*              STREXC reports in ILST; otherwise step past K.
               IF( info.EQ.0 ) THEN
                  i = ilst
               ELSE
                  i = k
               END IF
            END IF
            IF( i.EQ.kend ) THEN
               k = i + 1
            ELSE IF( t( i+1, i ).EQ.zero ) THEN
               k = i + 1
            ELSE
               k = i + 2
            END IF
            GO TO 40
         END IF
         GO TO 30
   50    CONTINUE
      END IF
*
*     ==== Restore shift/eigenvalue array from T ====
*     Walk the diagonal of T upwards from row JW to row INFQR+1.
*     1-by-1 blocks give real eigenvalues; 2-by-2 blocks are
*     passed to SLANV2, which returns both eigenvalues.
*
      i = jw
   60 CONTINUE
      IF( i.GE.infqr+1 ) THEN
         IF( i.EQ.infqr+1 ) THEN
            sr( kwtop+i-1 ) = t( i, i )
            si( kwtop+i-1 ) = zero
            i = i - 1
         ELSE IF( t( i, i-1 ).EQ.zero ) THEN
            sr( kwtop+i-1 ) = t( i, i )
            si( kwtop+i-1 ) = zero
            i = i - 1
         ELSE
*           Work on copies so that T itself is left unchanged.
            aa = t( i-1, i-1 )
            cc = t( i, i-1 )
            bb = t( i-1, i )
            dd = t( i, i )
            CALL slanv2( aa, bb, cc, dd, sr( kwtop+i-2 ),
     $                   si( kwtop+i-2 ), sr( kwtop+i-1 ),
     $                   si( kwtop+i-1 ), cs, sn )
            i = i - 2
         END IF
         GO TO 60
      END IF
*
*     H and Z are only touched if something was deflated or the
*     spike is zero.
      IF( ns.LT.jw .OR. s.EQ.zero ) THEN
         IF( ns.GT.1 .AND. s.NE.zero ) THEN
*
*           ==== Reflect spike back into lower triangle ====
*           WORK(1:NS) receives the first row of V and becomes
*           the reflector vector; WORK(JW+1:) is scratch.
*
            CALL scopy( ns, v, ldv, work, 1 )
            CALL slarfg( ns, work( 1 ), work( 2 ), 1, tau )
*
            CALL slaset( 'L', jw-2, jw-2, zero, zero, t( 3, 1 ),
     $                   ldt )
*
            CALL slarf1f( 'L', ns, jw, work, 1, tau, t, ldt,
     $                    work( jw+1 ) )
            CALL slarf1f( 'R', ns, ns, work, 1, tau, t, ldt,
     $                    work( jw+1 ) )
            CALL slarf1f( 'R', jw, ns, work, 1, tau, v, ldv,
     $                    work( jw+1 ) )
*
            CALL sgehrd( jw, 1, ns, t, ldt, work, work( jw+1 ),
     $                   lwork-jw, info )
         END IF
*
*        ==== Copy updated reduced window into place ====
*
         IF( kwtop.GT.1 )
     $      h( kwtop, kwtop-1 ) = s*v( 1, 1 )
         CALL slacpy( 'U', jw, jw, t, ldt, h( kwtop, kwtop ), ldh )
         CALL scopy( jw-1, t( 2, 1 ), ldt+1, h( kwtop+1, kwtop ),
     $               ldh+1 )
*
*        ==== Accumulate orthogonal matrix in order update
*        .    H and Z, if requested.  ====
*
         IF( ns.GT.1 .AND. s.NE.zero )
     $      CALL sormhr( 'R', 'N', jw, ns, 1, ns, t, ldt, work, v,
     $                   ldv,
     $                   work( jw+1 ), lwork-jw, info )
*
*        ==== Update vertical slab in H ====
*        Rows LTOP:KWTOP-1 of the window columns are multiplied
*        by V from the right, at most NV rows at a time, with WV
*        as scratch.
*
         IF( wantt ) THEN
            ltop = 1
         ELSE
            ltop = ktop
         END IF
         DO 70 krow = ltop, kwtop - 1, nv
            kln = min( nv, kwtop-krow )
            CALL sgemm( 'N', 'N', kln, jw, jw, one, h( krow, kwtop ),
     $                  ldh, v, ldv, zero, wv, ldwv )
            CALL slacpy( 'A', kln, jw, wv, ldwv, h( krow, kwtop ),
     $                   ldh )
   70    CONTINUE
*
*        ==== Update horizontal slab in H ====
*        Columns KBOT+1:N of the window rows are multiplied by
*        V**T from the left, at most NH columns at a time.  T is
*        reused as scratch here.
*
         IF( wantt ) THEN
            DO 80 kcol = kbot + 1, n, nh
               kln = min( nh, n-kcol+1 )
               CALL sgemm( 'C', 'N', jw, kln, jw, one, v, ldv,
     $                     h( kwtop, kcol ), ldh, zero, t, ldt )
               CALL slacpy( 'A', jw, kln, t, ldt, h( kwtop, kcol ),
     $                      ldh )
   80       CONTINUE
         END IF
*
*        ==== Update vertical slab in Z ====
*        Rows ILOZ:IHIZ of the window columns of Z are multiplied
*        by V from the right, at most NV rows at a time.
*
         IF( wantz ) THEN
            DO 90 krow = iloz, ihiz, nv
               kln = min( nv, ihiz-krow+1 )
               CALL sgemm( 'N', 'N', kln, jw, jw, one, z( krow,
     $                     kwtop ),
     $                     ldz, v, ldv, zero, wv, ldwv )
               CALL slacpy( 'A', kln, jw, wv, ldwv, z( krow, kwtop ),
     $                      ldz )
   90       CONTINUE
         END IF
      END IF
*
*     ==== Return the number of deflations ... ====
*
      nd = jw - ns
*
*     ==== ... and the number of shifts. (Subtracting
*     .    INFQR from the spike length takes care
*     .    of the case of a rare QR failure while
*     .    calculating eigenvalues of the deflation
*     .    window.)  ====
*
      ns = ns - infqr
*
*      ==== Return optimal workspace. ====
*
      work( 1 ) = sroundup_lwork( lwkopt )
*
*     ==== End of SLAQR2 ====
*

Here is the call graph for this function:

Here is the caller graph for this function: