d3/d6f/cgetsqrhrt_8f_source.html

*> \brief \b CGETSQRHRT

*

*  =========== DOCUMENTATION ===========

*

* Online html documentation available at

*            http://www.netlib.org/lapack/explore-html/

*

*> Download CGETSQRHRT + dependencies

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/cgetsqrhrt.f">

*> [TGZ]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/cgetsqrhrt.f">

*> [ZIP]</a>

*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/cgetsqrhrt.f">

*> [TXT]</a>

*

*  Definition:

*  ===========

*

*       SUBROUTINE CGETSQRHRT( M, N, MB1, NB1, NB2, A, LDA, T, LDT, WORK,

*      $                       LWORK, INFO )

*       IMPLICIT NONE

*

*       .. Scalar Arguments ..

*       INTEGER           INFO, LDA, LDT, LWORK, M, N, NB1, NB2, MB1

*       ..

*       .. Array Arguments ..

*       COMPLEX           A( LDA, * ), T( LDT, * ), WORK( * )

*       ..

*

*

*> \par Purpose:

*  =============

*>

*> \verbatim

*>

*> CGETSQRHRT computes a NB2-sized column blocked QR-factorization

*> of a complex M-by-N matrix A with M >= N,

*>

*>    A = Q * R.

*>

*> The routine uses internally a NB1-sized column blocked and MB1-sized

*> row blocked TSQR-factorization and performs the reconstruction

*> of the Householder vectors from the TSQR output. The routine also

*> converts the R_tsqr factor from the TSQR-factorization output into

*> the R factor that corresponds to the Householder QR-factorization,

*>

*>    A = Q_tsqr * R_tsqr = Q * R.

*>

*> The output Q and R factors are stored in the same format as in CGEQRT

*> (Q is in blocked compact WY-representation). See the documentation

*> of CGEQRT for more details on the format.

*> \endverbatim

*

*  Arguments:

*  ==========

*

*> \param[in] M

*> \verbatim

*>          M is INTEGER

*>          The number of rows of the matrix A.  M >= 0.

*> \endverbatim

*>

*> \param[in] N

*> \verbatim

*>          N is INTEGER

*>          The number of columns of the matrix A. M >= N >= 0.

*> \endverbatim

*>

*> \param[in] MB1

*> \verbatim

*>          MB1 is INTEGER

*>          The row block size to be used in the blocked TSQR.

*>          MB1 > N.

*> \endverbatim

*>

*> \param[in] NB1

*> \verbatim

*>          NB1 is INTEGER

*>          The column block size to be used in the blocked TSQR.

*>          N >= NB1 >= 1.

*> \endverbatim

*>

*> \param[in] NB2

*> \verbatim

*>          NB2 is INTEGER

*>          The block size to be used in the blocked QR that is

*>          output. NB2 >= 1.

*> \endverbatim

*>

*> \param[in,out] A

*> \verbatim

*>          A is COMPLEX array, dimension (LDA,N)

*>

*>          On entry: an M-by-N matrix A.

*>

*>          On exit:

*>           a) the elements on and above the diagonal

*>              of the array contain the N-by-N upper-triangular

*>              matrix R corresponding to the Householder QR;

*>           b) the elements below the diagonal represent Q by

*>              the columns of blocked V (compact WY-representation).

*> \endverbatim

*>

*> \param[in] LDA

*> \verbatim

*>          LDA is INTEGER

*>          The leading dimension of the array A.  LDA >= max(1,M).

*> \endverbatim

*>

*> \param[out] T

*> \verbatim

*>          T is COMPLEX array, dimension (LDT,N)

*>          The upper triangular block reflectors stored in compact form

*>          as a sequence of upper triangular blocks.

*> \endverbatim

*>

*> \param[in] LDT

*> \verbatim

*>          LDT is INTEGER

*>          The leading dimension of the array T.
*>          LDT >= max(1,min(NB2,N)).

*> \endverbatim

*>

*> \param[out] WORK

*> \verbatim

*>          (workspace) COMPLEX array, dimension (MAX(1,LWORK))

*>          On exit, if INFO = 0, WORK(1) returns the optimal LWORK.

*> \endverbatim

*>

*> \param[in] LWORK

*> \verbatim

*>          LWORK is INTEGER

*>          The dimension of the array WORK.

*>          If MIN(M,N) = 0, LWORK >= 1, else

*>          LWORK >= MAX( 1, LWT + LW1, MAX( LWT+N*N+LW2, LWT+N*N+N ) ),

*>          where

*>             NUM_ALL_ROW_BLOCKS = MAX( 1, CEIL((M-N)/(MB1-N)) ),

*>             NB1LOCAL = MIN(NB1,N).

*>             LWT = NUM_ALL_ROW_BLOCKS * N * NB1LOCAL,

*>             LW1 = NB1LOCAL * N,

*>             LW2 = NB1LOCAL * MAX( NB1LOCAL, ( N - NB1LOCAL ) ).

*>

*>          If LWORK = -1, then a workspace query is assumed.

*>          The routine only calculates the optimal size of the WORK

*>          array, returns this value as the first entry of the WORK

*>          array, and no error message related to LWORK is issued

*>          by XERBLA.

*> \endverbatim

*>

*> \param[out] INFO

*> \verbatim

*>          INFO is INTEGER

*>          = 0:  successful exit

*>          < 0:  if INFO = -i, the i-th argument had an illegal value

*> \endverbatim

*

*  Authors:

*  ========

*

*> \author Univ. of Tennessee

*> \author Univ. of California Berkeley

*> \author Univ. of Colorado Denver

*> \author NAG Ltd.

*

*> \ingroup getsqrhrt

*

*> \par Contributors:

*  ==================

*>

*> \verbatim

*>

*> November 2020, Igor Kozachenko,

*>                Computer Science Division,

*>                University of California, Berkeley

*>

*> \endverbatim

*>

*  =====================================================================


      SUBROUTINE CGETSQRHRT( M, N, MB1, NB1, NB2, A, LDA, T, LDT,
     $                       WORK, LWORK, INFO )
      IMPLICIT NONE
*
*  -- LAPACK computational routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Outline of the routine:
*       1) validate the arguments and compute the workspace size;
*       2) TSQR-factorize A with CLATSQR (T factors go to WORK(1:LWT));
*       3) save the upper-triangular R_tsqr into WORK(LWT+1:LWT+N*N);
*       4) form Q explicitly in A with CUNGTSQR_ROW;
*       5) reconstruct the Householder vectors and T with CUNHR_COL,
*          which also returns the sign vector in WORK(LWT+N*N+1:);
*       6) write R_tsqr back into the upper triangle of A, negating
*          every row whose sign entry equals -1.
*
*     On an invalid argument INFO is set to minus the position of
*     the argument, XERBLA is called and the routine returns.
*     On a workspace query (LWORK = -1) only WORK(1) is set.
*
*     .. Scalar Arguments ..
      INTEGER           INFO, LDA, LDT, LWORK, M, N, NB1, NB2, MB1
*     ..
*     .. Array Arguments ..
      COMPLEX           A( LDA, * ), T( LDT, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      COMPLEX            CONE
      PARAMETER          ( CONE = ( 1.0E+0, 0.0E+0 ) )
*     ..
*     .. Local Scalars ..
      LOGICAL            LQUERY
      INTEGER            I, IINFO, J, LW1, LW2, LWT, LDWT, LWORKOPT,
     $                   NB1LOCAL, NB2LOCAL, NUM_ALL_ROW_BLOCKS
*     ..
*     .. External Functions ..
      REAL               SROUNDUP_LWORK
      EXTERNAL           SROUNDUP_LWORK
*     ..
*     .. External Subroutines ..
      EXTERNAL           CCOPY, CLATSQR, CUNGTSQR_ROW,
     $                   CUNHR_COL, XERBLA
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          MAX, MIN, MOD
*     ..
*     .. Executable Statements ..
*
*     Test the input arguments
*
      INFO = 0
      LQUERY = ( LWORK.EQ.-1 )
      IF( M.LT.0 ) THEN
         INFO = -1
      ELSE IF( N.LT.0 .OR. M.LT.N ) THEN
         INFO = -2
      ELSE IF( MB1.LE.N ) THEN
         INFO = -3
      ELSE IF( NB1.LT.1 ) THEN
         INFO = -4
      ELSE IF( NB2.LT.1 ) THEN
         INFO = -5
      ELSE IF( LDA.LT.MAX( 1, M ) ) THEN
         INFO = -7
      ELSE IF( LDT.LT.MAX( 1, MIN( NB2, N ) ) ) THEN
         INFO = -9
      ELSE
*
*        Test the input LWORK for the dimension of the array WORK.
*        This workspace is used to store array:
*        a) Matrix T and WORK for CLATSQR;
*        b) N-by-N upper-triangular factor R_tsqr;
*        c) Matrix T and array WORK for CUNGTSQR_ROW;
*        d) Diagonal D for CUNHR_COL.
*
         IF( LWORK.LT.N*N+1 .AND. .NOT.LQUERY ) THEN
            INFO = -11
         ELSE
*
*           Set block size for column blocks
*
            NB1LOCAL = MIN( NB1, N )
*
*           Number of row blocks: ceiling( (M-N) / (MB1-N) ), but at
*           least 1.  The ceiling is taken in exact integer
*           arithmetic; a default-REAL quotient cannot represent
*           every integer above 2**24 and could under-count the
*           blocks for very tall matrices, which would undersize LWT.
*           MB1 > N and M >= N were verified above, so the divisor
*           is positive and the dividend is non-negative.
*
            NUM_ALL_ROW_BLOCKS = ( M - N ) / ( MB1 - N )
            IF( MOD( M - N, MB1 - N ).NE.0 ) THEN
               NUM_ALL_ROW_BLOCKS = NUM_ALL_ROW_BLOCKS + 1
            END IF
            NUM_ALL_ROW_BLOCKS = MAX( 1, NUM_ALL_ROW_BLOCKS )
*
*           Length and leading dimension of WORK array to place
*           T array in TSQR.
*
            LWT = NUM_ALL_ROW_BLOCKS * N * NB1LOCAL
            LDWT = NB1LOCAL
*
*           Length of TSQR work array
*
            LW1 = NB1LOCAL * N
*
*           Length of CUNGTSQR_ROW work array.
*
            LW2 = NB1LOCAL * MAX( NB1LOCAL, ( N - NB1LOCAL ) )
*
            LWORKOPT = MAX( LWT + LW1, MAX( LWT+N*N+LW2, LWT+N*N+N ) )
            LWORKOPT = MAX( 1, LWORKOPT )
*
            IF( LWORK.LT.LWORKOPT .AND. .NOT.LQUERY ) THEN
               INFO = -11
            END IF
*
         END IF
      END IF
*
*     Handle error in the input parameters and return workspace query.
*
      IF( INFO.NE.0 ) THEN
         CALL XERBLA( 'CGETSQRHRT', -INFO )
         RETURN
      ELSE IF ( LQUERY ) THEN
         WORK( 1 ) = SROUNDUP_LWORK( LWORKOPT )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( MIN( M, N ).EQ.0 ) THEN
         WORK( 1 ) = SROUNDUP_LWORK( LWORKOPT )
         RETURN
      END IF
*
      NB2LOCAL = MIN( NB2, N )
*
*     (1) Perform TSQR-factorization of the M-by-N matrix A.
*         The T factors occupy WORK(1:LWT); the scratch space for
*         CLATSQR starts right after them.
*
      CALL CLATSQR( M, N, MB1, NB1LOCAL, A, LDA, WORK, LDWT,
     $              WORK( LWT+1 ), LW1, IINFO )
*
*     (2) Copy the factor R_tsqr stored in the upper-triangular part
*         of A into the square matrix in the work array
*         WORK(LWT+1:LWT+N*N) column-by-column.
*
      DO J = 1, N
         CALL CCOPY( J, A( 1, J ), 1, WORK( LWT + N*(J-1)+1 ), 1 )
      END DO
*
*     (3) Generate a M-by-N matrix Q with orthonormal columns from
*     the result stored below the diagonal in the array A in place.
*
      CALL CUNGTSQR_ROW( M, N, MB1, NB1LOCAL, A, LDA, WORK, LDWT,
     $                   WORK( LWT+N*N+1 ), LW2, IINFO )
*
*     (4) Perform the reconstruction of Householder vectors from
*     the matrix Q (stored in A) in place.
*
      CALL CUNHR_COL( M, N, NB2LOCAL, A, LDA, T, LDT,
     $                WORK( LWT+N*N+1 ), IINFO )
*
*     (5) Copy the factor R_tsqr stored in the square matrix in the
*     work array WORK(LWT+1:LWT+N*N) into the upper-triangular
*     part of A.
*
*     (6) Compute from R_tsqr the factor R_hr corresponding to
*     the reconstructed Householder vectors, i.e. R_hr = S * R_tsqr.
*     This multiplication by the sign matrix S on the left means
*     changing the sign of I-th row of the matrix R_tsqr according
*     to sign of the I-th diagonal element DIAG(I) of the matrix S.
*     DIAG is stored in WORK( LWT+N*N+1 ) from the CUNHR_COL output.
*
*     (5) and (6) can be combined in a single loop, so the rows in A
*     are accessed only once.
*
      DO I = 1, N
         IF( WORK( LWT+N*N+I ).EQ.-CONE ) THEN
*
*           Sign entry is -1: store the negated I-th row of R_tsqr.
*
            DO J = I, N
               A( I, J ) = -CONE * WORK( LWT+N*(J-1)+I )
            END DO
         ELSE
*
*           Otherwise copy the I-th row unchanged; the row is read
*           from the saved N-by-N copy with stride N and written
*           into A with stride LDA.
*
            CALL CCOPY( N-I+1, WORK(LWT+N*(I-1)+I), N, A( I, I ),
     $                  LDA )
         END IF
      END DO
*
      WORK( 1 ) = SROUNDUP_LWORK( LWORKOPT )
      RETURN
*
*     End of CGETSQRHRT
*
      END

xerbla
subroutine xerbla(srname, info)
Definition cblat2.f:3285

ccopy
subroutine ccopy(n, cx, incx, cy, incy)
CCOPY
Definition ccopy.f:81

cgetsqrhrt
subroutine cgetsqrhrt(m, n, mb1, nb1, nb2, a, lda, t, ldt, work, lwork, info)
CGETSQRHRT
Definition cgetsqrhrt.f:181

clatsqr
subroutine clatsqr(m, n, mb, nb, a, lda, t, ldt, work, lwork, info)
CLATSQR
Definition clatsqr.f:172

cungtsqr_row
subroutine cungtsqr_row(m, n, mb, nb, a, lda, t, ldt, work, lwork, info)
CUNGTSQR_ROW
Definition cungtsqr_row.f:187

cunhr_col
subroutine cunhr_col(m, n, nb, a, lda, t, ldt, d, info)
CUNHR_COL
Definition cunhr_col.f:257