subroutine cla_porfsx_extended	(	integer	PREC_TYPE,
		character	UPLO,
		integer	N,
		integer	NRHS,
		complex, dimension( lda, * )	A,
		integer	LDA,
		complex, dimension( ldaf, * )	AF,
		integer	LDAF,
		logical	COLEQU,
		real, dimension( * )	C,
		complex, dimension( ldb, * )	B,
		integer	LDB,
		complex, dimension( ldy, * )	Y,
		integer	LDY,
		real, dimension( * )	BERR_OUT,
		integer	N_NORMS,
		real, dimension( nrhs, * )	ERR_BNDS_NORM,
		real, dimension( nrhs, * )	ERR_BNDS_COMP,
		complex, dimension( * )	RES,
		real, dimension( * )	AYB,
		complex, dimension( * )	DY,
		complex, dimension( * )	Y_TAIL,
		real	RCOND,
		integer	ITHRESH,
		real	RTHRESH,
		real	DZ_UB,
		logical	IGNORE_CWISE,
		integer	INFO
	)

CLA_PORFSX_EXTENDED improves the computed solution to a system of linear equations for symmetric or Hermitian positive-definite matrices by performing extra-precise iterative refinement and provides error bounds and backward error estimates for the solution.

Download CLA_PORFSX_EXTENDED + dependencies [TGZ] [ZIP] [TXT]

Purpose:

 CLA_PORFSX_EXTENDED improves the computed solution to a system of
 linear equations by performing extra-precise iterative refinement
 and provides error bounds and backward error estimates for the solution.
 This subroutine is called by CPORFSX to perform iterative refinement.
 In addition to normwise error bound, the code provides maximum
 componentwise error bound if possible. See comments for ERR_BNDS_NORM
 and ERR_BNDS_COMP for details of the error bounds. Note that this
 subroutine is only responsible for setting the second fields of
 ERR_BNDS_NORM and ERR_BNDS_COMP.

Parameters

[in]	PREC_TYPE	PREC_TYPE is INTEGER Specifies the intermediate precision to be used in refinement. The value is defined by ILAPREC(P), where P is a CHARACTER and P = 'S': Single; P = 'D': Double; P = 'I': Indigenous; P = 'X' or 'E': Extra.
[in]	UPLO	UPLO is CHARACTER*1 = 'U': Upper triangle of A is stored; = 'L': Lower triangle of A is stored.
[in]	N	N is INTEGER The number of linear equations, i.e., the order of the matrix A. N >= 0.
[in]	NRHS	NRHS is INTEGER The number of right-hand-sides, i.e., the number of columns of the matrix B.
[in]	A	A is COMPLEX array, dimension (LDA,N) On entry, the N-by-N matrix A.
[in]	LDA	LDA is INTEGER The leading dimension of the array A. LDA >= max(1,N).
[in]	AF	AF is COMPLEX array, dimension (LDAF,N) The triangular factor U or L from the Cholesky factorization A = U**H*U or A = L*L**H, as computed by CPOTRF.
[in]	LDAF	LDAF is INTEGER The leading dimension of the array AF. LDAF >= max(1,N).
[in]	COLEQU	COLEQU is LOGICAL If .TRUE. then column equilibration was done to A before calling this routine. This is needed to compute the solution and error bounds correctly.
[in]	C	C is REAL array, dimension (N) The column scale factors for A. If COLEQU = .FALSE., C is not accessed. If C is input, each element of C should be a power of the radix to ensure a reliable solution and error estimates. Scaling by powers of the radix does not cause rounding errors unless the result underflows or overflows. Rounding errors during scaling lead to refining with a matrix that is not equivalent to the input matrix, producing error estimates that may not be reliable.
[in]	B	B is COMPLEX array, dimension (LDB,NRHS) The right-hand-side matrix B.
[in]	LDB	LDB is INTEGER The leading dimension of the array B. LDB >= max(1,N).
[in,out]	Y	Y is COMPLEX array, dimension (LDY,NRHS) On entry, the solution matrix X, as computed by CPOTRS. On exit, the improved solution matrix Y.
[in]	LDY	LDY is INTEGER The leading dimension of the array Y. LDY >= max(1,N).
[out]	BERR_OUT	BERR_OUT is REAL array, dimension (NRHS) On exit, BERR_OUT(j) contains the componentwise relative backward error for right-hand-side j from the formula max(i) ( abs(RES(i)) / ( abs(op(A_s))*abs(Y) + abs(B_s) )(i) ) where abs(Z) is the componentwise absolute value of the matrix or vector Z. This is computed by CLA_LIN_BERR.
[in]	N_NORMS	N_NORMS is INTEGER Determines which error bounds to return (see ERR_BNDS_NORM and ERR_BNDS_COMP). If N_NORMS >= 1 return normwise error bounds. If N_NORMS >= 2 return componentwise error bounds.
[in,out]	ERR_BNDS_NORM	ERR_BNDS_NORM is REAL array, dimension (NRHS, N_ERR_BNDS) For each right-hand side, this array contains information about various error bounds and condition numbers corresponding to the normwise relative error, which is defined as follows: Normwise relative error in the ith solution vector: $\frac{\max_j |\mathrm{XTRUE}(j,i) - X(j,i)|}{\max_j |X(j,i)|}$. The array is indexed by the type of error information as described below. There currently are up to three pieces of information returned. The first index in ERR_BNDS_NORM(i,:) corresponds to the ith right-hand side. The second index in ERR_BNDS_NORM(:,err) contains the following three fields: err = 1 "Trust/don't trust" boolean. Trust the answer if the reciprocal condition number is greater than the threshold sqrt(n) * slamch('Epsilon'). err = 2 "Guaranteed" error bound: The estimated forward error, almost certainly within a factor of 10 of the true error so long as the next entry is greater than the threshold sqrt(n) * slamch('Epsilon'). This error bound should only be trusted if the previous boolean is true. err = 3 Reciprocal condition number: Estimated normwise reciprocal condition number. Compared with the threshold sqrt(n) * slamch('Epsilon') to determine if the error estimate is "guaranteed". These reciprocal condition numbers are 1 / (norm(Z^{-1},inf) * norm(Z,inf)) for some appropriately scaled matrix Z. Let Z = S*A, where S scales each row by a power of the radix so all absolute row sums of Z are approximately 1. This subroutine is only responsible for setting the second field above. See Lapack Working Note 165 for further details and extra cautions.
[in,out]	ERR_BNDS_COMP	ERR_BNDS_COMP is REAL array, dimension (NRHS, N_ERR_BNDS) For each right-hand side, this array contains information about various error bounds and condition numbers corresponding to the componentwise relative error, which is defined as follows: Componentwise relative error in the ith solution vector: $\max_j \frac{|\mathrm{XTRUE}(j,i) - X(j,i)|}{|X(j,i)|}$. The array is indexed by the right-hand side i (on which the componentwise relative error depends), and the type of error information as described below. There currently are up to three pieces of information returned for each right-hand side. If componentwise accuracy is not requested (PARAMS(3) = 0.0), then ERR_BNDS_COMP is not accessed. If N_ERR_BNDS .LT. 3, then at most the first (:,N_ERR_BNDS) entries are returned. The first index in ERR_BNDS_COMP(i,:) corresponds to the ith right-hand side. The second index in ERR_BNDS_COMP(:,err) contains the following three fields: err = 1 "Trust/don't trust" boolean. Trust the answer if the reciprocal condition number is greater than the threshold sqrt(n) * slamch('Epsilon'). err = 2 "Guaranteed" error bound: The estimated forward error, almost certainly within a factor of 10 of the true error so long as the next entry is greater than the threshold sqrt(n) * slamch('Epsilon'). This error bound should only be trusted if the previous boolean is true. err = 3 Reciprocal condition number: Estimated componentwise reciprocal condition number. Compared with the threshold sqrt(n) * slamch('Epsilon') to determine if the error estimate is "guaranteed". These reciprocal condition numbers are 1 / (norm(Z^{-1},inf) * norm(Z,inf)) for some appropriately scaled matrix Z. Let Z = S*(A*diag(x)), where x is the solution for the current right-hand side and S scales each row of A*diag(x) by a power of the radix so all absolute row sums of Z are approximately 1. This subroutine is only responsible for setting the second field above. 
See Lapack Working Note 165 for further details and extra cautions.
[in]	RES	RES is COMPLEX array, dimension (N) Workspace to hold the intermediate residual.
[in]	AYB	AYB is REAL array, dimension (N) Workspace.
[in]	DY	DY is COMPLEX array, dimension (N) Workspace to hold the intermediate solution.
[in]	Y_TAIL	Y_TAIL is COMPLEX array, dimension (N) Workspace to hold the trailing bits of the intermediate solution.
[in]	RCOND	RCOND is REAL Reciprocal scaled condition number. This is an estimate of the reciprocal Skeel condition number of the matrix A after equilibration (if done). If this is less than the machine precision (in particular, if it is zero), the matrix is singular to working precision. Note that the error may still be small even if this number is very small and the matrix appears ill-conditioned.
[in]	ITHRESH	ITHRESH is INTEGER The maximum number of residual computations allowed for refinement. The default is 10. For 'aggressive' set to 100 to permit convergence using approximate factorizations or factorizations other than LU. If the factorization uses a technique other than Gaussian elimination, the guarantees in ERR_BNDS_NORM and ERR_BNDS_COMP may no longer be trustworthy.
[in]	RTHRESH	RTHRESH is REAL Determines when to stop refinement if the error estimate stops decreasing. Refinement will stop when the next solution no longer satisfies norm(dx_{i+1}) < RTHRESH * norm(dx_i) where norm(Z) is the infinity norm of Z. RTHRESH satisfies 0 < RTHRESH <= 1. The default value is 0.5. For 'aggressive' set to 0.9 to permit convergence on extremely ill-conditioned matrices. See LAWN 165 for more details.
[in]	DZ_UB	DZ_UB is REAL Determines when to start considering componentwise convergence. Componentwise convergence is only considered after each component of the solution Y is stable, which we define as the relative change in each component being less than DZ_UB. The default value is 0.25, requiring the first bit to be stable. See LAWN 165 for more details.
[in]	IGNORE_CWISE	IGNORE_CWISE is LOGICAL If .TRUE. then ignore componentwise convergence. Default value is .FALSE..
[out]	INFO	INFO is INTEGER = 0: Successful exit. < 0: if INFO = -i, the ith argument to CPOTRS had an illegal value

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Date: September 2012

Definition at line 392 of file cla_porfsx_extended.f.

 *
 *  -- LAPACK computational routine (version 3.4.2) --
 *  -- LAPACK is a software package provided by Univ. of Tennessee,    --
 *  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
 *     September 2012
 *
 !     Body of CLA_PORFSX_EXTENDED (the SUBROUTINE statement and the
 !     closing END are not part of this listing).
 !
 !     For each right-hand side j the code runs at most ITHRESH
 !     refinement passes on column Y(:,j):
 !       1. form a residual in RES from B(:,j), A and Y(:,j);
 !       2. solve for a correction DY with CPOTRS using the factor AF;
 !       3. measure the normwise (dx_x) and componentwise (dz_z)
 !          relative size of DY and advance two small state machines
 !          (x_state, z_state);
 !       4. leave the loop once the normwise tracker -- and, unless
 !          IGNORE_CWISE is set, the componentwise tracker -- is no
 !          longer in the working state; otherwise add DY to Y.
 !     Afterwards it stores column la_linrx_err_i (= 2) of
 !     ERR_BNDS_NORM / ERR_BNDS_COMP and calls CLA_LIN_BERR with
 !     BERR_OUT(j).
 *     .. Scalar Arguments ..
       INTEGER            info, lda, ldaf, ldb, ldy, n, nrhs, prec_type,
      $                   n_norms, ithresh
       CHARACTER          uplo
       LOGICAL            colequ, ignore_cwise
       REAL               rthresh, dz_ub
 *     ..
 *     .. Array Arguments ..
       COMPLEX            a( lda, * ), af( ldaf, * ), b( ldb, * ),
      $                   y( ldy, * ), res( * ), dy( * ), y_tail( * )
       REAL               c( * ), ayb( * ), rcond, berr_out( * ),
      $                   err_bnds_norm( nrhs, * ),
      $                   err_bnds_comp( nrhs, * )
 *     ..
 *
 *  =====================================================================
 *
 !     x_state and z_state each hold one of the *_state parameters
 !     declared below (normwise and componentwise tracker respectively).
 !     y_prec_state holds one of base_residual / extra_residual /
 !     extra_y and selects which residual kernel and which update of Y
 !     is used inside the refinement loop.
 *     .. Local Scalars ..
       INTEGER            uplo2, cnt, i, j, x_state, z_state,
      $                   y_prec_state
       REAL               yk, dyk, ymin, normy, normx, normdx, dxrat,
      $                   dzrat, prevnormdx, prev_dz_z, dxratmax,
      $                   dzratmax, dx_x, dz_z, final_dx_x, final_dz_z,
      $                   eps, hugeval, incr_thresh
       LOGICAL            incr_prec
       COMPLEX            zdum
 *     ..
 !     NOTE(review): of the index parameters declared below, only
 !     la_linrx_err_i is referenced by the executable statements in
 !     this listing; final_nrm_err_i ... piv_growth_i and the other
 !     la_linrx_* names are declared but not used here.
 *     .. Parameters ..
       INTEGER            unstable_state, working_state, conv_state,
      $                   noprog_state, base_residual, extra_residual,
      $                   extra_y
       parameter                ( unstable_state = 0, working_state = 1,
      $                   conv_state = 2, noprog_state = 3 )
       parameter                ( base_residual = 0, extra_residual = 1,
      $                   extra_y = 2 )
       INTEGER            final_nrm_err_i, final_cmp_err_i, berr_i
       INTEGER            rcond_i, nrm_rcond_i, nrm_err_i, cmp_rcond_i
       INTEGER            cmp_err_i, piv_growth_i
       parameter                ( final_nrm_err_i = 1, final_cmp_err_i = 2,
      $                   berr_i = 3 )
       parameter                ( rcond_i = 4, nrm_rcond_i = 5, nrm_err_i = 6 )
       parameter                ( cmp_rcond_i = 7, cmp_err_i = 8,
      $                   piv_growth_i = 9 )
       INTEGER            la_linrx_itref_i, la_linrx_ithresh_i,
      $                   la_linrx_cwise_i
       parameter                ( la_linrx_itref_i = 1,
      $                   la_linrx_ithresh_i = 2 )
       parameter                ( la_linrx_cwise_i = 3 )
       INTEGER            la_linrx_trust_i, la_linrx_err_i,
      $                   la_linrx_rcond_i
       parameter                ( la_linrx_trust_i = 1, la_linrx_err_i = 2 )
       parameter                ( la_linrx_rcond_i = 3 )
 *     ..
 *     .. External Functions ..
       LOGICAL            lsame
       EXTERNAL           ilauplo
       INTEGER            ilauplo
 *     ..
 !     slamch appears in the EXTERNAL list below but is typed REAL and
 !     is used as a function in the executable part.
 *     .. External Subroutines ..
       EXTERNAL           caxpy, ccopy, cpotrs, chemv, blas_chemv_x,
      $                   blas_chemv2_x, cla_heamv, cla_wwaddw,
      $                   cla_lin_berr, slamch
       REAL               slamch
 *     ..
 *     .. Intrinsic Functions ..
       INTRINSIC          abs, REAL, aimag, max, min
 *     ..
 *     .. Statement Functions ..
       REAL               cabs1
 *     ..
 !     cabs1(z) = |Re z| + |Im z|; used below as the magnitude of a
 !     complex entry.
 *     .. Statement Function Definitions ..
       cabs1( zdum ) = abs( REAL( ZDUM ) ) + abs( aimag( zdum ) )
 *     ..
 *     .. Executable Statements ..
 *
 !     INFO is read on entry: a nonzero value makes the routine return
 !     immediately without touching any output.
       IF (info.NE.0) RETURN
       eps = slamch( 'Epsilon' )
       hugeval = slamch( 'Overflow' )
 *     Force HUGEVAL to Inf
       hugeval = hugeval * hugeval
 *     Using HUGEVAL may lead to spurious underflows.
 !     incr_thresh = N * eps is the factor used in the
 !     "ymin*rcond < incr_thresh*normy" test that requests a higher
 !     precision state.
       incr_thresh = REAL(N) * eps
 
 !     uplo2 is the integer code returned by ILAUPLO; it is what the
 !     blas_chemv_x, blas_chemv2_x and cla_heamv calls receive, while
 !     chemv and cpotrs are passed the character UPLO. Any UPLO that
 !     does not match 'L' is treated as 'U' here.
       IF (lsame(uplo, 'L')) THEN
          uplo2 = ilauplo( 'L' )
       ELSE
          uplo2 = ilauplo( 'U' )
       ENDIF
 
       DO j = 1, nrhs
 !        Every right-hand side starts in the extra_residual state.
 !        NOTE(review): because y_prec_state was just set to
 !        extra_residual, the extra_y test below is always false at
 !        this point; y_tail is zeroed instead when the state is
 !        incremented inside the refinement loop.
          y_prec_state = extra_residual
          IF (y_prec_state .EQ. extra_y) THEN
             DO i = 1, n
                y_tail( i ) = 0.0
             END DO
          END IF
 
 !        Reset the per-column trackers. The "previous" and "final"
 !        quantities start at hugeval, the ratio maxima at zero.
          dxrat = 0.0
          dxratmax = 0.0
          dzrat = 0.0
          dzratmax = 0.0
          final_dx_x = hugeval
          final_dz_z = hugeval
          prevnormdx = hugeval
          prev_dz_z = hugeval
          dz_z = hugeval
          dx_x = hugeval
 
          x_state = working_state
          z_state = unstable_state
          incr_prec = .false.
 
          DO cnt = 1, ithresh
 *
 *         Compute residual RES = B_s - op(A_s) * Y,
 *             op(A) = A, A**T, or A**H depending on TRANS (and type).
 *
 !           NOTE(review): no TRANS argument exists in this routine;
 !           the wording above looks inherited from a general-matrix
 !           variant. RES is loaded with B(:,j) and then one of three
 !           chemv-style kernels is called with alpha = -1, beta = 1,
 !           chosen by y_prec_state. Only the extra_y branch also
 !           passes y_tail.
             CALL ccopy( n, b( 1, j ), 1, res, 1 )
             IF (y_prec_state .EQ. base_residual) THEN
                CALL chemv(uplo, n, cmplx(-1.0), a, lda, y(1,j), 1,
      $              cmplx(1.0), res, 1)
             ELSE IF (y_prec_state .EQ. extra_residual) THEN
                CALL blas_chemv_x(uplo2, n, cmplx(-1.0), a, lda,
      $              y( 1, j ), 1, cmplx(1.0), res, 1, prec_type)
             ELSE
                CALL blas_chemv2_x(uplo2, n, cmplx(-1.0), a, lda,
      $              y(1, j), y_tail, 1, cmplx(1.0), res, 1, prec_type)
             END IF
 
 !         XXX: RES is no longer needed.
 !           DY receives a copy of the residual and is then passed to
 !           CPOTRS as a single right-hand side with leading dimension
 !           n. CPOTRS overwrites INFO on every pass; the value is not
 !           tested inside this loop.
             CALL ccopy( n, res, 1, dy, 1 )
             CALL cpotrs( uplo, n, 1, af, ldaf, dy, n, info)
 *
 *         Calculate relative changes DX_X, DZ_Z and ratios DXRAT, DZRAT.
 *
             normx = 0.0
             normy = 0.0
             normdx = 0.0
             dz_z = 0.0
             ymin = hugeval
 
 !           One sweep over the entries of Y(:,j) and DY:
 !             dz_z   = max_i dyk/yk, forced to hugeval when an entry
 !                      of Y is zero but its correction is not;
 !             ymin   = smallest cabs1 entry of Y(:,j);
 !             normy  = largest cabs1 entry of Y(:,j);
 !             normx, normdx = the same maxima with each entry
 !                      multiplied by c(i) when COLEQU is true; when it
 !                      is false normx tracks normy and normdx is the
 !                      plain maximum of dyk.
             DO i = 1, n
                yk = cabs1(y(i, j))
                dyk = cabs1(dy(i))
 
                IF (yk .NE. 0.0) THEN
                   dz_z = max( dz_z, dyk / yk )
                ELSE IF (dyk .NE. 0.0) THEN
                   dz_z = hugeval
                END IF
 
                ymin = min( ymin, yk )
 
                normy = max( normy, yk )
 
                IF ( colequ ) THEN
                   normx = max(normx, yk * c(i))
                   normdx = max(normdx, dyk * c(i))
                ELSE
                   normx = normy
                   normdx = max(normdx, dyk)
                END IF
             END DO
 
 !           dx_x = normdx / normx, with 0/0 taken as 0 and a nonzero
 !           correction over a zero solution taken as hugeval.
             IF (normx .NE. 0.0) THEN
                dx_x = normdx / normx
             ELSE IF (normdx .EQ. 0.0) THEN
                dx_x = 0.0
             ELSE
                dx_x = hugeval
             END IF
 
 !           Ratios of this pass to the previous one. On the first
 !           pass prevnormdx and prev_dz_z still hold hugeval.
             dxrat = normdx / prevnormdx
             dzrat = dz_z / prev_dz_z
 *
 *         Check termination criteria.
 *
 !           Request a higher precision state when the smallest entry
 !           of Y, scaled by RCOND, falls below incr_thresh times the
 !           largest entry -- unless extra_y has already been reached.
             IF (ymin*rcond .LT. incr_thresh*normy
      $           .AND. y_prec_state .LT. extra_y)
      $           incr_prec = .true.
 
 !           Normwise tracker (x_state).
 !             noprog -> working  when dxrat <= rthresh again;
 !             working -> conv    when dx_x <= eps;
 !             working with dxrat > rthresh: request more precision if
 !                                 extra_y is not yet reached, else
 !                                 move to noprog;
 !             otherwise          record the largest ratio seen in
 !                                 dxratmax.
 !           final_dx_x is stored as soon as the state is past working
 !           (conv or noprog).
             IF (x_state .EQ. noprog_state .AND. dxrat .LE. rthresh)
      $           x_state = working_state
             IF (x_state .EQ. working_state) THEN
                IF (dx_x .LE. eps) THEN
                   x_state = conv_state
                ELSE IF (dxrat .GT. rthresh) THEN
                   IF (y_prec_state .NE. extra_y) THEN
                      incr_prec = .true.
                   ELSE
                      x_state = noprog_state
                   END IF
                ELSE
                   IF (dxrat .GT. dxratmax) dxratmax = dxrat
                END IF
                IF (x_state .GT. working_state) final_dx_x = dx_x
             END IF
 
 !           Componentwise tracker (z_state). Same scheme as above
 !           with two additions: it starts in unstable and only enters
 !           working once dz_z <= dz_ub, and it drops back to unstable
 !           (resetting dzratmax and final_dz_z) whenever dz_z exceeds
 !           dz_ub while working.
             IF (z_state .EQ. unstable_state .AND. dz_z .LE. dz_ub)
      $           z_state = working_state
             IF (z_state .EQ. noprog_state .AND. dzrat .LE. rthresh)
      $           z_state = working_state
             IF (z_state .EQ. working_state) THEN
                IF (dz_z .LE. eps) THEN
                   z_state = conv_state
                ELSE IF (dz_z .GT. dz_ub) THEN
                   z_state = unstable_state
                   dzratmax = 0.0
                   final_dz_z = hugeval
                ELSE IF (dzrat .GT. rthresh) THEN
                   IF (y_prec_state .NE. extra_y) THEN
                      incr_prec = .true.
                   ELSE
                      z_state = noprog_state
                   END IF
                ELSE
                   IF (dzrat .GT. dzratmax) dzratmax = dzrat
                END IF
                IF (z_state .GT. working_state) final_dz_z = dz_z
             END IF
 
 !           Leave the refinement loop (without applying DY) when the
 !           normwise tracker is not working and either componentwise
 !           convergence is ignored or the componentwise tracker is not
 !           working either.
             IF ( x_state.NE.working_state.AND.
      $           (ignore_cwise.OR.z_state.NE.working_state) )
      $           GOTO 666
 
 !           Apply a pending precision increase: advance y_prec_state
 !           by one and clear y_tail. This happens before the update
 !           below, so the update already sees the new state.
             IF (incr_prec) THEN
                incr_prec = .false.
                y_prec_state = y_prec_state + 1
                DO i = 1, n
                   y_tail( i ) = 0.0
                END DO
             END IF
 
             prevnormdx = normdx
             prev_dz_z = dz_z
 *
 *           Update soluton.
 *
 !           Below extra_y the correction is added with
 !           caxpy (Y(:,j) = Y(:,j) + DY). In the extra_y state
 !           cla_wwaddw is called with Y(:,j), y_tail and DY --
 !           presumably accumulating DY into the (Y, Y_TAIL) pair;
 !           confirm against CLA_WWADDW.
             IF (y_prec_state .LT. extra_y) THEN
                CALL caxpy( n, cmplx(1.0), dy, 1, y(1,j), 1 )
             ELSE
                CALL cla_wwaddw(n, y(1,j), y_tail, dy)
             END IF
 
          END DO
 *        Target of "IF (Z_STOP .AND. X_STOP)".  Sun's f77 won't EXIT.
  666     CONTINUE
 *
 *     Set final_* when cnt hits ithresh.
 *
 !        A tracker still in the working state here never recorded a
 !        final value, so the last measured dx_x / dz_z is used.
          IF (x_state .EQ. working_state) final_dx_x = dx_x
          IF (z_state .EQ. working_state) final_dz_z = dz_z
 *
 *     Compute error bounds.
 *
 !        Each bound is final / (1 - largest accepted ratio) and is
 !        written to column la_linrx_err_i (= 2) of row j. N_NORMS
 !        gates which of the two arrays is written.
          IF (n_norms .GE. 1) THEN
             err_bnds_norm( j, la_linrx_err_i ) =
      $           final_dx_x / (1 - dxratmax)
          END IF
          IF (n_norms .GE. 2) THEN
             err_bnds_comp( j, la_linrx_err_i ) =
      $           final_dz_z / (1 - dzratmax)
          END IF
 *
 *     Compute componentwise relative backward error from formula
 *         max(i) ( abs(R(i)) / ( abs(op(A_s))*abs(Y) + abs(B_s) )(i) )
 *     where abs(Z) is the componentwise absolute value of the matrix
 *     or vector Z.
 *
 *        Compute residual RES = B_s - op(A_s) * Y,
 *            op(A) = A, A**T, or A**H depending on TRANS (and type).
 *
 !        The residual for the backward error is always recomputed
 !        with chemv, whatever y_prec_state the loop ended in
 !        (see the TRANS note in the refinement loop).
          CALL ccopy( n, b( 1, j ), 1, res, 1 )
          CALL chemv(uplo, n, cmplx(-1.0), a, lda, y(1,j), 1, cmplx(1.0),
      $        res, 1)
 
 !        Seed AYB with the cabs1 magnitudes of B(:,j); cla_heamv is
 !        then called with alpha = beta = 1.0 on top of it.
          DO i = 1, n
             ayb( i ) = cabs1( b( i, j ) )
          END DO
 *
 *     Compute abs(op(A_s))*abs(Y) + abs(B_s).
 *
          CALL cla_heamv (uplo2, n, 1.0,
      $        a, lda, y(1, j), 1, 1.0, ayb, 1)
 
 !        cla_lin_berr is handed RES, AYB and the single slot
 !        berr_out(j) for this right-hand side.
          CALL cla_lin_berr (n, n, 1, res, ayb, berr_out(j))
 *
 *     End of loop for each RHS.
 *
       END DO
 *
       RETURN

Here is the call graph for this function:

Here is the caller graph for this function: