d5/d4a/zcgesv_8f_source.html

 *> \brief <b> ZCGESV computes the solution to a system of linear equations A * X = B for GE matrices</b> (mixed precision with iterative refinement)

 *

 *  =========== DOCUMENTATION ===========

 *

 * Online html documentation available at

 *            http://www.netlib.org/lapack/explore-html/

 *

 *> \htmlonly

 *> Download ZCGESV + dependencies

 *> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/zcgesv.f">

 *> [TGZ]</a>

 *> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/zcgesv.f">

 *> [ZIP]</a>

 *> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/zcgesv.f">

 *> [TXT]</a>

 *> \endhtmlonly

 *

 *  Definition:

 *  ===========

 *

 *       SUBROUTINE ZCGESV( N, NRHS, A, LDA, IPIV, B, LDB, X, LDX, WORK,

 *                          SWORK, RWORK, ITER, INFO )

 *

 *       .. Scalar Arguments ..

 *       INTEGER            INFO, ITER, LDA, LDB, LDX, N, NRHS

 *       ..

 *       .. Array Arguments ..

 *       INTEGER            IPIV( * )

 *       DOUBLE PRECISION   RWORK( * )

 *       COMPLEX            SWORK( * )

 *       COMPLEX*16         A( LDA, * ), B( LDB, * ), WORK( N, * ),

 *      $                   X( LDX, * )

 *       ..

 *

 *

 *> \par Purpose:

 *  =============

 *>

 *> \verbatim

 *>

 *> ZCGESV computes the solution to a complex system of linear equations

 *>    A * X = B,

 *> where A is an N-by-N matrix and X and B are N-by-NRHS matrices.

 *>

 *> ZCGESV first attempts to factorize the matrix in COMPLEX and use this

 *> factorization within an iterative refinement procedure to produce a

 *> solution with COMPLEX*16 normwise backward error quality (see below).

 *> If the approach fails the method switches to a COMPLEX*16

 *> factorization and solve.

 *>

 *> The iterative refinement is not going to be a winning strategy if

 *> the ratio COMPLEX performance over COMPLEX*16 performance is too

 *> small. A reasonable strategy should take the number of right-hand

 *> sides and the size of the matrix into account. This might be done

 *> with a call to ILAENV in the future. Up to now, we always try

 *> iterative refinement.

 *>

 *> The iterative refinement process is stopped if

 *>     ITER > ITERMAX

 *> or for all the RHS we have:

 *>     RNRM < SQRT(N)*XNRM*ANRM*EPS*BWDMAX

 *> where

 *>     o ITER is the number of the current iteration in the iterative

 *>       refinement process

 *>     o RNRM is the infinity-norm of the residual

 *>     o XNRM is the infinity-norm of the solution

 *>     o ANRM is the infinity-operator-norm of the matrix A

 *>     o EPS is the machine epsilon returned by DLAMCH('Epsilon')

 *> The values of ITERMAX and BWDMAX are fixed to 30 and 1.0D+00,

 *> respectively.

 *> \endverbatim

 *

 *  Arguments:

 *  ==========

 *

 *> \param[in] N

 *> \verbatim

 *>          N is INTEGER

 *>          The number of linear equations, i.e., the order of the

 *>          matrix A.  N >= 0.

 *> \endverbatim

 *>

 *> \param[in] NRHS

 *> \verbatim

 *>          NRHS is INTEGER

 *>          The number of right hand sides, i.e., the number of columns

 *>          of the matrix B.  NRHS >= 0.

 *> \endverbatim

 *>

 *> \param[in,out] A

 *> \verbatim

 *>          A is COMPLEX*16 array,

 *>          dimension (LDA,N)

 *>          On entry, the N-by-N coefficient matrix A.

 *>          On exit, if iterative refinement has been successfully used

 *>          (INFO.EQ.0 and ITER.GE.0, see description below), then A is

 *>          unchanged, if double precision factorization has been used

 *>          (INFO.EQ.0 and ITER.LT.0, see description below), then the

 *>          array A contains the factors L and U from the factorization

 *>          A = P*L*U; the unit diagonal elements of L are not stored.

 *> \endverbatim

 *>

 *> \param[in] LDA

 *> \verbatim

 *>          LDA is INTEGER

 *>          The leading dimension of the array A.  LDA >= max(1,N).

 *> \endverbatim

 *>

 *> \param[out] IPIV

 *> \verbatim

 *>          IPIV is INTEGER array, dimension (N)

 *>          The pivot indices that define the permutation matrix P;

 *>          row i of the matrix was interchanged with row IPIV(i).

 *>          Corresponds either to the single precision factorization

 *>          (if INFO.EQ.0 and ITER.GE.0) or the double precision

 *>          factorization (if INFO.EQ.0 and ITER.LT.0).

 *> \endverbatim

 *>

 *> \param[in] B

 *> \verbatim

 *>          B is COMPLEX*16 array, dimension (LDB,NRHS)

 *>          The N-by-NRHS right hand side matrix B.

 *> \endverbatim

 *>

 *> \param[in] LDB

 *> \verbatim

 *>          LDB is INTEGER

 *>          The leading dimension of the array B.  LDB >= max(1,N).

 *> \endverbatim

 *>

 *> \param[out] X

 *> \verbatim

 *>          X is COMPLEX*16 array, dimension (LDX,NRHS)

 *>          If INFO = 0, the N-by-NRHS solution matrix X.

 *> \endverbatim

 *>

 *> \param[in] LDX

 *> \verbatim

 *>          LDX is INTEGER

 *>          The leading dimension of the array X.  LDX >= max(1,N).

 *> \endverbatim

 *>

 *> \param[out] WORK

 *> \verbatim

 *>          WORK is COMPLEX*16 array, dimension (N,NRHS)

 *>          This array is used to hold the residual vectors.

 *> \endverbatim

 *>

 *> \param[out] SWORK

 *> \verbatim

 *>          SWORK is COMPLEX array, dimension (N*(N+NRHS))

 *>          This array is used to store the single precision matrix and the

 *>          right-hand sides or solutions in single precision.

 *> \endverbatim

 *>

 *> \param[out] RWORK

 *> \verbatim

 *>          RWORK is DOUBLE PRECISION array, dimension (N)

 *> \endverbatim

 *>

 *> \param[out] ITER

 *> \verbatim

 *>          ITER is INTEGER

 *>          < 0: iterative refinement has failed, COMPLEX*16

 *>               factorization has been performed

 *>               -1 : the routine fell back to full precision for

 *>                    implementation- or machine-specific reasons

 *>               -2 : narrowing the precision induced an overflow,

 *>                    the routine fell back to full precision

 *>               -3 : failure of CGETRF

 *>               -31: stop the iterative refinement after the 30th

 *>                    iteration

 *>          >= 0: iterative refinement has been successfully used.

 *>               Returns the number of iterations

 *> \endverbatim

 *>

 *> \param[out] INFO

 *> \verbatim

 *>          INFO is INTEGER

 *>          = 0:  successful exit

 *>          < 0:  if INFO = -i, the i-th argument had an illegal value

 *>          > 0:  if INFO = i, U(i,i) computed in COMPLEX*16 is exactly

 *>                zero.  The factorization has been completed, but the

 *>                factor U is exactly singular, so the solution

 *>                could not be computed.

 *> \endverbatim

 *

 *  Authors:

 *  ========

 *

 *> \author Univ. of Tennessee

 *> \author Univ. of California Berkeley

 *> \author Univ. of Colorado Denver

 *> \author NAG Ltd.

 *

 *> \date June 2016

 *

 *> \ingroup complex16GEsolve

 *

 *  =====================================================================

       SUBROUTINE ZCGESV( N, NRHS, A, LDA, IPIV, B, LDB, X, LDX,             &
     &                   WORK, SWORK, RWORK, ITER, INFO )
!
!  -- LAPACK driver routine (version 3.6.1) --
!  -- LAPACK is a software package provided by Univ. of Tennessee,    --
!  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
!     June 2016
!
!  Purpose
!  =======
!  Solves the complex system A * X = B, where A is N-by-N and X and B
!  are N-by-NRHS.  A COMPLEX copy of A is factorized, the system is
!  solved in single precision, and the solution is then improved by
!  iterative refinement with residuals computed in COMPLEX*16.  If the
!  single precision path cannot be used, or the stopping criterion is
!  not met within ITERMAX refinement steps, the routine falls back to
!  a COMPLEX*16 factorization and solve of A itself.
!
!  Arguments
!  =========
!  N      (in)     order of A.  N >= 0.
!  NRHS   (in)     number of right-hand sides.  NRHS >= 0.
!  A      (in/out) COMPLEX*16 (LDA,*).  Only overwritten (by ZGETRF)
!                  when the double precision fallback is taken.
!  LDA    (in)     leading dimension of A.  LDA >= max(1,N).
!  IPIV   (out)    pivot indices written by CGETRF, or by ZGETRF when
!                  the fallback is taken.
!  B      (in)     COMPLEX*16 (LDB,*), the right-hand sides.
!  LDB    (in)     leading dimension of B.  LDB >= max(1,N).
!  X      (out)    COMPLEX*16 (LDX,*), the computed solution.
!  LDX    (in)     leading dimension of X.  LDX >= max(1,N).
!  WORK   (work)   COMPLEX*16 (N,*), holds the residual B - A*X.
!  SWORK  (work)   COMPLEX, N*(N+NRHS) entries: the single precision
!                  copy of A, followed by the single precision
!                  right-hand sides / solutions.
!  RWORK  (work)   DOUBLE PRECISION, passed to ZLANGE as workspace.
!  ITER   (out)    >= 0 : number of refinement steps that were needed
!                  -1   : refinement disabled (DOITREF is .FALSE.)
!                  -2   : ZLAG2C returned a nonzero INFO while
!                         narrowing to single precision
!                  -3   : CGETRF returned a nonzero INFO
!                  -(ITERMAX+1) : stopping criterion never satisfied
!                  For every negative value the COMPLEX*16 fallback
!                  has been executed.
!  INFO   (out)    = 0 : successful exit
!                  < 0 : argument -INFO had an illegal value
!                  > 0 : value returned by ZGETRF in the fallback path
!
!  Source-form note: comments start with '!' and each continued
!  statement carries '&' both beyond column 72 and in column 6 of the
!  following line, so this unit is accepted as fixed-form and as
!  free-form source.
!
!  =====================================================================
!
       IMPLICIT NONE
!
!     .. Scalar Arguments ..
       INTEGER            INFO, ITER, LDA, LDB, LDX, N, NRHS
!     ..
!     .. Array Arguments ..
       INTEGER            IPIV( * )
       DOUBLE PRECISION   RWORK( * )
       COMPLEX            SWORK( * )
       COMPLEX*16         A( LDA, * ), B( LDB, * )
       COMPLEX*16         WORK( N, * ), X( LDX, * )
!     ..
!     .. Parameters ..
!     DOITREF : compile-time switch, .FALSE. skips the mixed precision
!               attempt entirely.
       LOGICAL            DOITREF
       PARAMETER          ( DOITREF = .TRUE. )
!     ITERMAX : maximum number of refinement steps.
       INTEGER            ITERMAX
       PARAMETER          ( ITERMAX = 30 )
!     BWDMAX  : factor applied to the backward error threshold.
       DOUBLE PRECISION   BWDMAX
       PARAMETER          ( BWDMAX = 1.0D+00 )
       COMPLEX*16         NEGONE, ONE
       PARAMETER          ( NEGONE = ( -1.0D+00, 0.0D+00 ) )
       PARAMETER          ( ONE = ( 1.0D+00, 0.0D+00 ) )
!     ..
!     .. Local Scalars ..
       INTEGER            I, IITER, PTSA, PTSX
       DOUBLE PRECISION   ANRM, CTE, EPS, RNRM, XNRM
       COMPLEX*16         ZDUM
!     ..
!     .. External Subroutines ..
       EXTERNAL           CGETRF, CGETRS, CLAG2Z, XERBLA, ZAXPY
       EXTERNAL           ZGEMM, ZGETRF, ZGETRS, ZLACPY, ZLAG2C
!     ..
!     .. External Functions ..
       INTEGER            IZAMAX
       DOUBLE PRECISION   DLAMCH, ZLANGE
       EXTERNAL           IZAMAX, DLAMCH, ZLANGE
!     ..
!     .. Intrinsic Functions ..
       INTRINSIC          ABS, DBLE, DIMAG, MAX, SQRT
!     ..
!     .. Statement Functions ..
       DOUBLE PRECISION   CABS1
!     ..
!     .. Statement Function definitions ..
!     CABS1 is |Re(z)| + |Im(z)|, the magnitude measure used for the
!     entry selected by IZAMAX below.
       CABS1( ZDUM ) = ABS( DBLE( ZDUM ) ) + ABS( DIMAG( ZDUM ) )
!     ..
!     .. Executable Statements ..
!
       INFO = 0
       ITER = 0
!
!     Test the input parameters.
!
       IF( N.LT.0 ) THEN
          INFO = -1
       ELSE IF( NRHS.LT.0 ) THEN
          INFO = -2
       ELSE IF( LDA.LT.MAX( 1, N ) ) THEN
          INFO = -4
       ELSE IF( LDB.LT.MAX( 1, N ) ) THEN
          INFO = -7
       ELSE IF( LDX.LT.MAX( 1, N ) ) THEN
          INFO = -9
       END IF
       IF( INFO.NE.0 ) THEN
          CALL XERBLA( 'ZCGESV', -INFO )
          RETURN
       END IF
!
!     Quick return if (N.EQ.0).
!
       IF( N.EQ.0 ) RETURN
!
!     Skip single precision iterative refinement if a priori slower
!     than double precision factorization.
!
       IF( .NOT.DOITREF ) THEN
          ITER = -1
          GO TO 40
       END IF
!
!     Compute some constants.  CTE is the per-column threshold factor:
!     a column is accepted when RNRM <= XNRM*CTE.
!
       ANRM = ZLANGE( 'I', N, N, A, LDA, RWORK )
       EPS = DLAMCH( 'Epsilon' )
       CTE = ANRM*EPS*SQRT( DBLE( N ) )*BWDMAX
!
!     Set the indices PTSA, PTSX for referencing SA and SX in SWORK.
!     SA occupies the first N*N entries, SX the entries after it.
!
       PTSA = 1
       PTSX = PTSA + N*N
!
!     Convert B from double precision to single precision and store
!     the result in SX.
!
       CALL ZLAG2C( N, NRHS, B, LDB, SWORK( PTSX ), N, INFO )
!
       IF( INFO.NE.0 ) THEN
          ITER = -2
          GO TO 40
       END IF
!
!     Convert A from double precision to single precision and store
!     the result in SA.
!
       CALL ZLAG2C( N, N, A, LDA, SWORK( PTSA ), N, INFO )
!
       IF( INFO.NE.0 ) THEN
          ITER = -2
          GO TO 40
       END IF
!
!     Compute the LU factorization of SA.
!
       CALL CGETRF( N, N, SWORK( PTSA ), N, IPIV, INFO )
!
       IF( INFO.NE.0 ) THEN
          ITER = -3
          GO TO 40
       END IF
!
!     Solve the system SA*SX = SB.
!
       CALL CGETRS( 'No transpose', N, NRHS, SWORK( PTSA ), N,               &
     &             IPIV, SWORK( PTSX ), N, INFO )
!
!     Convert SX back to double precision.
!
       CALL CLAG2Z( N, NRHS, SWORK( PTSX ), N, X, LDX, INFO )
!
!     Compute R = B - AX (R is WORK).
!
       CALL ZLACPY( 'All', N, NRHS, B, LDB, WORK, N )
!
       CALL ZGEMM( 'No Transpose', 'No Transpose', N, NRHS, N,               &
     &            NEGONE, A, LDA, X, LDX, ONE, WORK, N )
!
!     Check whether the NRHS normwise backward errors satisfy the
!     stopping criterion. If yes, set ITER=0 and return.  The first
!     column that fails sends control to the refinement loop.
!
       DO I = 1, NRHS
          XNRM = CABS1( X( IZAMAX( N, X( 1, I ), 1 ), I ) )
          RNRM = CABS1( WORK( IZAMAX( N, WORK( 1, I ), 1 ), I ) )
          IF( RNRM.GT.XNRM*CTE ) GO TO 10
       END DO
!
!     If we are here, the NRHS normwise backward errors satisfy the
!     stopping criterion. We are good to exit.
!
       ITER = 0
       RETURN
!
   10  CONTINUE
!
       DO 30 IITER = 1, ITERMAX
!
!        Convert R (in WORK) from double precision to single precision
!        and store the result in SX.
!
          CALL ZLAG2C( N, NRHS, WORK, N, SWORK( PTSX ), N, INFO )
!
          IF( INFO.NE.0 ) THEN
             ITER = -2
             GO TO 40
          END IF
!
!        Solve the system SA*SX = SR.
!
          CALL CGETRS( 'No transpose', N, NRHS, SWORK( PTSA ), N,            &
     &                IPIV, SWORK( PTSX ), N, INFO )
!
!        Convert SX back to double precision and update the current
!        iterate: the correction lands in WORK and is added to X.
!
          CALL CLAG2Z( N, NRHS, SWORK( PTSX ), N, WORK, N, INFO )
!
          DO I = 1, NRHS
             CALL ZAXPY( N, ONE, WORK( 1, I ), 1, X( 1, I ), 1 )
          END DO
!
!        Compute R = B - AX (R is WORK).
!
          CALL ZLACPY( 'All', N, NRHS, B, LDB, WORK, N )
!
          CALL ZGEMM( 'No Transpose', 'No Transpose', N, NRHS, N,            &
     &               NEGONE, A, LDA, X, LDX, ONE, WORK, N )
!
!        Check whether the NRHS normwise backward errors satisfy the
!        stopping criterion. If yes, set ITER=IITER>0 and return.
!
          DO I = 1, NRHS
             XNRM = CABS1( X( IZAMAX( N, X( 1, I ), 1 ), I ) )
             RNRM = CABS1( WORK( IZAMAX( N, WORK( 1, I ), 1 ), I ) )
             IF( RNRM.GT.XNRM*CTE ) GO TO 20
          END DO
!
!        If we are here, the NRHS normwise backward errors satisfy the
!        stopping criterion, we are good to exit.
!
          ITER = IITER
!
          RETURN
!
   20     CONTINUE
!
   30  CONTINUE
!
!     If we are at this place of the code, this is because we have
!     performed ITER=ITERMAX iterations and never satisfied the
!     stopping criterion, set up the ITER flag accordingly and follow
!     up on double precision routine.
!
       ITER = -ITERMAX - 1
!
   40  CONTINUE
!
!     Double precision fallback.  Reached when the single precision
!     path was disabled (ITER = -1), could not be used (ITER = -2 or
!     -3), or did not meet the stopping criterion
!     (ITER = -ITERMAX-1).  A is overwritten by its LU factors and
!     INFO is whatever ZGETRF / ZGETRS report.
!
       CALL ZGETRF( N, N, A, LDA, IPIV, INFO )
!
       IF( INFO.NE.0 ) RETURN
!
       CALL ZLACPY( 'All', N, NRHS, B, LDB, X, LDX )
       CALL ZGETRS( 'No transpose', N, NRHS, A, LDA, IPIV,                   &
     &             X, LDX, INFO )
!
       RETURN
!
!     End of ZCGESV.
!
       END SUBROUTINE ZCGESV

zgetrs
subroutine zgetrs(TRANS, N, NRHS, A, LDA, IPIV, B, LDB, INFO)
ZGETRS
Definition: zgetrs.f:123

zlacpy
subroutine zlacpy(UPLO, M, N, A, LDA, B, LDB)
ZLACPY copies all or part of one two-dimensional array to another.
Definition: zlacpy.f:105

zlag2c
subroutine zlag2c(M, N, A, LDA, SA, LDSA, INFO)
ZLAG2C converts a complex double precision matrix to a complex single precision matrix.
Definition: zlag2c.f:109

cgetrs
subroutine cgetrs(TRANS, N, NRHS, A, LDA, IPIV, B, LDB, INFO)
CGETRS
Definition: cgetrs.f:123

zgetrf
subroutine zgetrf(M, N, A, LDA, IPIV, INFO)
ZGETRF VARIANT: Crout Level 3 BLAS version of the algorithm.
Definition: zgetrf.f:102

zgemm
subroutine zgemm(TRANSA, TRANSB, M, N, K, ALPHA, A, LDA, B, LDB, BETA, C, LDC)
ZGEMM
Definition: zgemm.f:189

xerbla
subroutine xerbla(SRNAME, INFO)
XERBLA
Definition: xerbla.f:62

cgetrf
subroutine cgetrf(M, N, A, LDA, IPIV, INFO)
CGETRF
Definition: cgetrf.f:110

clag2z
subroutine clag2z(M, N, SA, LDSA, A, LDA, INFO)
CLAG2Z converts a complex single precision matrix to a complex double precision matrix.
Definition: clag2z.f:105

zcgesv
subroutine zcgesv(N, NRHS, A, LDA, IPIV, B, LDB, X, LDX, WORK,                                                                                           SWORK, RWORK, ITER, INFO)
 ZCGESV computes the solution to system of linear equations A * X = B for GE matrices (mixed precisio...
Definition: zcgesv.f:203

zaxpy
subroutine zaxpy(N, ZA, ZX, INCX, ZY, INCY)
ZAXPY
Definition: zaxpy.f:53