#:include "common.fypp"
submodule(stdlib_lapack_solve) stdlib_lapack_solve_ldl_comp3
  implicit none


  contains
#:for ik,it,ii in LINALG_INT_KINDS_TYPES

     pure module subroutine stdlib${ii}$_checon( uplo, n, a, lda, ipiv, anorm, rcond, work,info )
     !! CHECON estimates the reciprocal condition number of a complex
     !! Hermitian matrix A from the factorization A = U*D*U**H or
     !! A = L*D*L**H produced by CHETRF.
     !! A 1-norm estimate of inv(A) is formed and the result is returned as
     !! RCOND = 1 / (ANORM * norm(inv(A))).
     !! INFO = -i flags an illegal i-th argument. RCOND is left at zero when
     !! ANORM is zero or when a 1-by-1 pivot (IPIV(i) > 0) has a zero diagonal.
        ! -- lapack computational routine --
        ! -- lapack is a software package provided by univ. of tennessee,    --
        ! -- univ. of california berkeley, univ. of colorado denver and nag ltd..--
           use stdlib_blas_constants_sp, only: zero, one
           ! Scalar Arguments
           character, intent(in) :: uplo
           integer(${ik}$), intent(out) :: info
           integer(${ik}$), intent(in) :: lda, n
           real(sp), intent(in) :: anorm
           real(sp), intent(out) :: rcond
           ! Array Arguments
           integer(${ik}$), intent(in) :: ipiv(*)
           complex(sp), intent(in) :: a(lda,*)
           complex(sp), intent(out) :: work(*)
        ! =====================================================================
           ! Local Scalars
           logical(lk) :: use_upper
           integer(${ik}$) :: row, first, last, step, stage
           real(sp) :: inv_norm
           ! Local Arrays
           integer(${ik}$) :: state(3_${ik}$)
           ! Executable Statements
           ! validate the arguments; the first offending one determines info.
           info = 0_${ik}$
           use_upper = stdlib_lsame( uplo, 'U' )
           if( .not.( use_upper .or. stdlib_lsame( uplo, 'L' ) ) ) then
              info = -1_${ik}$
           else if( n<0_${ik}$ ) then
              info = -2_${ik}$
           else if( lda<max( 1_${ik}$, n ) ) then
              info = -4_${ik}$
           else if( anorm<zero ) then
              info = -6_${ik}$
           end if
           if( info/=0_${ik}$ ) then
              call stdlib${ii}$_xerbla( 'CHECON', -info )
              return
           end if
           ! trivial cases: empty matrix, or a zero norm of a.
           rcond = zero
           if( n==0_${ik}$ ) then
              rcond = one
              return
           end if
           if( anorm<=zero ) return
           ! scan the 1-by-1 blocks of d for an exact zero: bottom to top for
           ! upper storage, top to bottom for lower storage.
           if( use_upper ) then
              first = n
              last = 1_${ik}$
              step = -1_${ik}$
           else
              first = 1_${ik}$
              last = n
              step = 1_${ik}$
           end if
           do row = first, last, step
              if( ipiv( row )>0 ) then
                 if( a( row, row )==zero ) return
              end if
           end do
           ! reverse-communication estimate of the 1-norm of inv(a): every
           ! request from the estimator is answered by one solve with the
           ! factored matrix, inv(l*d*l**h) or inv(u*d*u**h).
           stage = 0_${ik}$
           estimate: do
              call stdlib${ii}$_clacn2( n, work( n+1 ), work, inv_norm, stage, state )
              if( stage==0_${ik}$ ) exit estimate
              call stdlib${ii}$_chetrs( uplo, n, 1_${ik}$, a, lda, ipiv, work, n, info )
           end do estimate
           ! turn the norm estimate into the reciprocal condition number.
           if( inv_norm/=zero ) rcond = ( one / inv_norm ) / anorm
     end subroutine stdlib${ii}$_checon

     pure module subroutine stdlib${ii}$_zhecon( uplo, n, a, lda, ipiv, anorm, rcond, work,info )
     !! ZHECON estimates the reciprocal condition number of a complex
     !! Hermitian matrix A from the factorization A = U*D*U**H or
     !! A = L*D*L**H produced by ZHETRF.
     !! A 1-norm estimate of inv(A) is formed and the result is returned as
     !! RCOND = 1 / (ANORM * norm(inv(A))).
     !! INFO = -i flags an illegal i-th argument. RCOND is left at zero when
     !! ANORM is zero or when a 1-by-1 pivot (IPIV(i) > 0) has a zero diagonal.
        ! -- lapack computational routine --
        ! -- lapack is a software package provided by univ. of tennessee,    --
        ! -- univ. of california berkeley, univ. of colorado denver and nag ltd..--
           use stdlib_blas_constants_dp, only: zero, one
           ! Scalar Arguments
           character, intent(in) :: uplo
           integer(${ik}$), intent(out) :: info
           integer(${ik}$), intent(in) :: lda, n
           real(dp), intent(in) :: anorm
           real(dp), intent(out) :: rcond
           ! Array Arguments
           integer(${ik}$), intent(in) :: ipiv(*)
           complex(dp), intent(in) :: a(lda,*)
           complex(dp), intent(out) :: work(*)
        ! =====================================================================
           ! Local Scalars
           logical(lk) :: use_upper
           integer(${ik}$) :: row, first, last, step, stage
           real(dp) :: inv_norm
           ! Local Arrays
           integer(${ik}$) :: state(3_${ik}$)
           ! Executable Statements
           ! validate the arguments; the first offending one determines info.
           info = 0_${ik}$
           use_upper = stdlib_lsame( uplo, 'U' )
           if( .not.( use_upper .or. stdlib_lsame( uplo, 'L' ) ) ) then
              info = -1_${ik}$
           else if( n<0_${ik}$ ) then
              info = -2_${ik}$
           else if( lda<max( 1_${ik}$, n ) ) then
              info = -4_${ik}$
           else if( anorm<zero ) then
              info = -6_${ik}$
           end if
           if( info/=0_${ik}$ ) then
              call stdlib${ii}$_xerbla( 'ZHECON', -info )
              return
           end if
           ! trivial cases: empty matrix, or a zero norm of a.
           rcond = zero
           if( n==0_${ik}$ ) then
              rcond = one
              return
           end if
           if( anorm<=zero ) return
           ! scan the 1-by-1 blocks of d for an exact zero: bottom to top for
           ! upper storage, top to bottom for lower storage.
           if( use_upper ) then
              first = n
              last = 1_${ik}$
              step = -1_${ik}$
           else
              first = 1_${ik}$
              last = n
              step = 1_${ik}$
           end if
           do row = first, last, step
              if( ipiv( row )>0 ) then
                 if( a( row, row )==zero ) return
              end if
           end do
           ! reverse-communication estimate of the 1-norm of inv(a): every
           ! request from the estimator is answered by one solve with the
           ! factored matrix, inv(l*d*l**h) or inv(u*d*u**h).
           stage = 0_${ik}$
           estimate: do
              call stdlib${ii}$_zlacn2( n, work( n+1 ), work, inv_norm, stage, state )
              if( stage==0_${ik}$ ) exit estimate
              call stdlib${ii}$_zhetrs( uplo, n, 1_${ik}$, a, lda, ipiv, work, n, info )
           end do estimate
           ! turn the norm estimate into the reciprocal condition number.
           if( inv_norm/=zero ) rcond = ( one / inv_norm ) / anorm
     end subroutine stdlib${ii}$_zhecon

#:for ck,ct,ci in CMPLX_KINDS_TYPES
#:if not ck in ["sp","dp"]
     pure module subroutine stdlib${ii}$_${ci}$hecon( uplo, n, a, lda, ipiv, anorm, rcond, work,info )
     !! ZHECON: estimates the reciprocal condition number of a complex
     !! Hermitian matrix A from the factorization A = U*D*U**H or
     !! A = L*D*L**H produced by ZHETRF.
     !! A 1-norm estimate of inv(A) is formed and the result is returned as
     !! RCOND = 1 / (ANORM * norm(inv(A))).
     !! INFO = -i flags an illegal i-th argument. RCOND is left at zero when
     !! ANORM is zero or when a 1-by-1 pivot (IPIV(i) > 0) has a zero diagonal.
        ! -- lapack computational routine --
        ! -- lapack is a software package provided by univ. of tennessee,    --
        ! -- univ. of california berkeley, univ. of colorado denver and nag ltd..--
           use stdlib_blas_constants_${ck}$, only: zero, one
           ! Scalar Arguments
           character, intent(in) :: uplo
           integer(${ik}$), intent(out) :: info
           integer(${ik}$), intent(in) :: lda, n
           real(${ck}$), intent(in) :: anorm
           real(${ck}$), intent(out) :: rcond
           ! Array Arguments
           integer(${ik}$), intent(in) :: ipiv(*)
           complex(${ck}$), intent(in) :: a(lda,*)
           complex(${ck}$), intent(out) :: work(*)
        ! =====================================================================
           ! Local Scalars
           logical(lk) :: use_upper
           integer(${ik}$) :: row, first, last, step, stage
           real(${ck}$) :: inv_norm
           ! Local Arrays
           integer(${ik}$) :: state(3_${ik}$)
           ! Executable Statements
           ! validate the arguments; the first offending one determines info.
           info = 0_${ik}$
           use_upper = stdlib_lsame( uplo, 'U' )
           if( .not.( use_upper .or. stdlib_lsame( uplo, 'L' ) ) ) then
              info = -1_${ik}$
           else if( n<0_${ik}$ ) then
              info = -2_${ik}$
           else if( lda<max( 1_${ik}$, n ) ) then
              info = -4_${ik}$
           else if( anorm<zero ) then
              info = -6_${ik}$
           end if
           if( info/=0_${ik}$ ) then
              call stdlib${ii}$_xerbla( 'ZHECON', -info )
              return
           end if
           ! trivial cases: empty matrix, or a zero norm of a.
           rcond = zero
           if( n==0_${ik}$ ) then
              rcond = one
              return
           end if
           if( anorm<=zero ) return
           ! scan the 1-by-1 blocks of d for an exact zero: bottom to top for
           ! upper storage, top to bottom for lower storage.
           if( use_upper ) then
              first = n
              last = 1_${ik}$
              step = -1_${ik}$
           else
              first = 1_${ik}$
              last = n
              step = 1_${ik}$
           end if
           do row = first, last, step
              if( ipiv( row )>0 ) then
                 if( a( row, row )==zero ) return
              end if
           end do
           ! reverse-communication estimate of the 1-norm of inv(a): every
           ! request from the estimator is answered by one solve with the
           ! factored matrix, inv(l*d*l**h) or inv(u*d*u**h).
           stage = 0_${ik}$
           estimate: do
              call stdlib${ii}$_${ci}$lacn2( n, work( n+1 ), work, inv_norm, stage, state )
              if( stage==0_${ik}$ ) exit estimate
              call stdlib${ii}$_${ci}$hetrs( uplo, n, 1_${ik}$, a, lda, ipiv, work, n, info )
           end do estimate
           ! turn the norm estimate into the reciprocal condition number.
           if( inv_norm/=zero ) rcond = ( one / inv_norm ) / anorm
     end subroutine stdlib${ii}$_${ci}$hecon

#:endif
#:endfor

     pure module subroutine stdlib${ii}$_chetrf( uplo, n, a, lda, ipiv, work, lwork, info )
     !! CHETRF factorizes a complex Hermitian matrix A with the
     !! Bunch-Kaufman diagonal pivoting method, as
     !!    A = U*D*U**H  or  A = L*D*L**H
     !! where U (or L) is a product of permutation and unit upper (lower)
     !! triangular matrices, and D is Hermitian and block diagonal with
     !! 1-by-1 and 2-by-2 diagonal blocks.
     !! This is the blocked driver: panels are handed to CLAHEF and the
     !! remaining columns to the unblocked CHETF2.
     !! With LWORK = -1 only the workspace size N*NB is stored in WORK(1).
        ! -- lapack computational routine --
        ! -- lapack is a software package provided by univ. of tennessee,    --
        ! -- univ. of california berkeley, univ. of colorado denver and nag ltd..--
           use stdlib_blas_constants_sp, only: negone, zero, half, one, two, three, four, eight, ten, &
                     czero, chalf, cone, cnegone
           ! Scalar Arguments
           character, intent(in) :: uplo
           integer(${ik}$), intent(out) :: info
           integer(${ik}$), intent(in) :: lda, lwork, n
           ! Array Arguments
           integer(${ik}$), intent(out) :: ipiv(*)
           complex(sp), intent(inout) :: a(lda,*)
           complex(sp), intent(out) :: work(*)
        ! =====================================================================
           ! Local Scalars
           logical(lk) :: query_only, use_upper
           integer(${ik}$) :: panel_info, iws, col, k, ncols, ldwork, lwkopt, nb, nbmin, shift
           ! Executable Statements
           ! validate the arguments; the first offending one determines info.
           info = 0_${ik}$
           use_upper = stdlib_lsame( uplo, 'U' )
           query_only = ( lwork==-1_${ik}$ )
           if( .not.( use_upper .or. stdlib_lsame( uplo, 'L' ) ) ) then
              info = -1_${ik}$
           else if( n<0_${ik}$ ) then
              info = -2_${ik}$
           else if( lda<max( 1_${ik}$, n ) ) then
              info = -4_${ik}$
           else if( lwork<1_${ik}$ .and. .not.query_only ) then
              info = -7_${ik}$
           end if
           if( info/=0_${ik}$ ) then
              call stdlib${ii}$_xerbla( 'CHETRF', -info )
              return
           end if
           ! arguments are valid: pick the block size and report the
           ! corresponding workspace size.
           nb = stdlib${ii}$_ilaenv( 1_${ik}$, 'CHETRF', uplo, n, -1_${ik}$, -1_${ik}$, -1_${ik}$ )
           lwkopt = n*nb
           work( 1_${ik}$ ) = lwkopt
           if( query_only ) return
           ! shrink the block size when the supplied workspace is too small.
           nbmin = 2_${ik}$
           ldwork = n
           if( nb>1_${ik}$ .and. nb<n ) then
              iws = ldwork*nb
              if( lwork<iws ) then
                 nb = max( lwork / ldwork, 1_${ik}$ )
                 nbmin = max( 2_${ik}$, stdlib${ii}$_ilaenv( 2_${ik}$, 'CHETRF', uplo, n, -1_${ik}$, -1_${ik}$, &
                           -1_${ik}$ ) )
              end if
           else
              iws = 1_${ik}$
           end if
           ! a block size below the crossover means: use unblocked code only.
           if( nb<nbmin ) nb = n
           if( use_upper ) then
              ! factorize a as u*d*u**h using the upper triangle of a.
              ! k walks from n down to 1 in steps of ncols, the number of
              ! columns handled per pass (nb or nb-1, or k for the last block).
              k = n
              do while( k>=1 )
                 if( k>nb ) then
                    ! blocked: factorize columns k-ncols+1:k, update columns 1:k-ncols
                    call stdlib${ii}$_clahef( uplo, k, nb, ncols, a, lda, ipiv, work, n, panel_info )
                 else
                    ! unblocked: factorize the remaining columns 1:k
                    call stdlib${ii}$_chetf2( uplo, k, a, lda, ipiv, panel_info )
                    ncols = k
                 end if
                 ! record only the first zero pivot encountered
                 if( info==0_${ik}$ .and. panel_info>0_${ik}$ ) info = panel_info
                 k = k - ncols
              end do
           else
              ! factorize a as l*d*l**h using the lower triangle of a.
              ! k walks from 1 up to n in steps of ncols, the number of
              ! columns handled per pass (nb or nb-1, or n-k+1 for the last block).
              k = 1_${ik}$
              do while( k<=n )
                 if( k<=n-nb ) then
                    ! blocked: factorize columns k:k+ncols-1, update columns k+ncols:n
                    call stdlib${ii}$_clahef( uplo, n-k+1, nb, ncols, a( k, k ), lda, ipiv( k ), &
                              work, n, panel_info )
                 else
                    ! unblocked: factorize the remaining columns k:n
                    call stdlib${ii}$_chetf2( uplo, n-k+1, a( k, k ), lda, ipiv( k ), panel_info )
                    ncols = n - k + 1_${ik}$
                 end if
                 ! record only the first zero pivot, in global numbering
                 if( info==0_${ik}$ .and. panel_info>0_${ik}$ ) info = panel_info + k - 1_${ik}$
                 ! pivots were computed relative to the submatrix starting at
                 ! (k,k): shift them by k-1 away from zero, keeping the sign.
                 shift = k - 1_${ik}$
                 do col = k, k + ncols - 1
                    ipiv( col ) = ipiv( col ) + merge( shift, -shift, ipiv( col )>0_${ik}$ )
                 end do
                 k = k + ncols
              end do
           end if
           work( 1_${ik}$ ) = lwkopt
     end subroutine stdlib${ii}$_chetrf

     pure module subroutine stdlib${ii}$_zhetrf( uplo, n, a, lda, ipiv, work, lwork, info )
     !! ZHETRF factorizes a complex Hermitian matrix A with the
     !! Bunch-Kaufman diagonal pivoting method, as
     !!    A = U*D*U**H  or  A = L*D*L**H
     !! where U (or L) is a product of permutation and unit upper (lower)
     !! triangular matrices, and D is Hermitian and block diagonal with
     !! 1-by-1 and 2-by-2 diagonal blocks.
     !! This is the blocked driver: panels are handed to ZLAHEF and the
     !! remaining columns to the unblocked ZHETF2.
     !! With LWORK = -1 only the workspace size N*NB is stored in WORK(1).
        ! -- lapack computational routine --
        ! -- lapack is a software package provided by univ. of tennessee,    --
        ! -- univ. of california berkeley, univ. of colorado denver and nag ltd..--
           use stdlib_blas_constants_dp, only: negone, zero, half, one, two, three, four, eight, ten, &
                     czero, chalf, cone, cnegone
           ! Scalar Arguments
           character, intent(in) :: uplo
           integer(${ik}$), intent(out) :: info
           integer(${ik}$), intent(in) :: lda, lwork, n
           ! Array Arguments
           integer(${ik}$), intent(out) :: ipiv(*)
           complex(dp), intent(inout) :: a(lda,*)
           complex(dp), intent(out) :: work(*)
        ! =====================================================================
           ! Local Scalars
           logical(lk) :: query_only, use_upper
           integer(${ik}$) :: panel_info, iws, col, k, ncols, ldwork, lwkopt, nb, nbmin, shift
           ! Executable Statements
           ! validate the arguments; the first offending one determines info.
           info = 0_${ik}$
           use_upper = stdlib_lsame( uplo, 'U' )
           query_only = ( lwork==-1_${ik}$ )
           if( .not.( use_upper .or. stdlib_lsame( uplo, 'L' ) ) ) then
              info = -1_${ik}$
           else if( n<0_${ik}$ ) then
              info = -2_${ik}$
           else if( lda<max( 1_${ik}$, n ) ) then
              info = -4_${ik}$
           else if( lwork<1_${ik}$ .and. .not.query_only ) then
              info = -7_${ik}$
           end if
           if( info/=0_${ik}$ ) then
              call stdlib${ii}$_xerbla( 'ZHETRF', -info )
              return
           end if
           ! arguments are valid: pick the block size and report the
           ! corresponding workspace size.
           nb = stdlib${ii}$_ilaenv( 1_${ik}$, 'ZHETRF', uplo, n, -1_${ik}$, -1_${ik}$, -1_${ik}$ )
           lwkopt = n*nb
           work( 1_${ik}$ ) = lwkopt
           if( query_only ) return
           ! shrink the block size when the supplied workspace is too small.
           nbmin = 2_${ik}$
           ldwork = n
           if( nb>1_${ik}$ .and. nb<n ) then
              iws = ldwork*nb
              if( lwork<iws ) then
                 nb = max( lwork / ldwork, 1_${ik}$ )
                 nbmin = max( 2_${ik}$, stdlib${ii}$_ilaenv( 2_${ik}$, 'ZHETRF', uplo, n, -1_${ik}$, -1_${ik}$, &
                           -1_${ik}$ ) )
              end if
           else
              iws = 1_${ik}$
           end if
           ! a block size below the crossover means: use unblocked code only.
           if( nb<nbmin ) nb = n
           if( use_upper ) then
              ! factorize a as u*d*u**h using the upper triangle of a.
              ! k walks from n down to 1 in steps of ncols, the number of
              ! columns handled per pass (nb or nb-1, or k for the last block).
              k = n
              do while( k>=1 )
                 if( k>nb ) then
                    ! blocked: factorize columns k-ncols+1:k, update columns 1:k-ncols
                    call stdlib${ii}$_zlahef( uplo, k, nb, ncols, a, lda, ipiv, work, n, panel_info )
                 else
                    ! unblocked: factorize the remaining columns 1:k
                    call stdlib${ii}$_zhetf2( uplo, k, a, lda, ipiv, panel_info )
                    ncols = k
                 end if
                 ! record only the first zero pivot encountered
                 if( info==0_${ik}$ .and. panel_info>0_${ik}$ ) info = panel_info
                 k = k - ncols
              end do
           else
              ! factorize a as l*d*l**h using the lower triangle of a.
              ! k walks from 1 up to n in steps of ncols, the number of
              ! columns handled per pass (nb or nb-1, or n-k+1 for the last block).
              k = 1_${ik}$
              do while( k<=n )
                 if( k<=n-nb ) then
                    ! blocked: factorize columns k:k+ncols-1, update columns k+ncols:n
                    call stdlib${ii}$_zlahef( uplo, n-k+1, nb, ncols, a( k, k ), lda, ipiv( k ), &
                              work, n, panel_info )
                 else
                    ! unblocked: factorize the remaining columns k:n
                    call stdlib${ii}$_zhetf2( uplo, n-k+1, a( k, k ), lda, ipiv( k ), panel_info )
                    ncols = n - k + 1_${ik}$
                 end if
                 ! record only the first zero pivot, in global numbering
                 if( info==0_${ik}$ .and. panel_info>0_${ik}$ ) info = panel_info + k - 1_${ik}$
                 ! pivots were computed relative to the submatrix starting at
                 ! (k,k): shift them by k-1 away from zero, keeping the sign.
                 shift = k - 1_${ik}$
                 do col = k, k + ncols - 1
                    ipiv( col ) = ipiv( col ) + merge( shift, -shift, ipiv( col )>0_${ik}$ )
                 end do
                 k = k + ncols
              end do
           end if
           work( 1_${ik}$ ) = lwkopt
     end subroutine stdlib${ii}$_zhetrf

#:for ck,ct,ci in CMPLX_KINDS_TYPES
#:if not ck in ["sp","dp"]
     pure module subroutine stdlib${ii}$_${ci}$hetrf( uplo, n, a, lda, ipiv, work, lwork, info )
     !! ZHETRF: factorizes a complex Hermitian matrix A with the
     !! Bunch-Kaufman diagonal pivoting method, as
     !!    A = U*D*U**H  or  A = L*D*L**H
     !! where U (or L) is a product of permutation and unit upper (lower)
     !! triangular matrices, and D is Hermitian and block diagonal with
     !! 1-by-1 and 2-by-2 diagonal blocks.
     !! This is the blocked driver: panels are handed to the matching LAHEF
     !! routine and the remaining columns to the unblocked HETF2 routine.
     !! With LWORK = -1 only the workspace size N*NB is stored in WORK(1).
        ! -- lapack computational routine --
        ! -- lapack is a software package provided by univ. of tennessee,    --
        ! -- univ. of california berkeley, univ. of colorado denver and nag ltd..--
           use stdlib_blas_constants_${ck}$, only: negone, zero, half, one, two, three, four, eight, ten, &
                     czero, chalf, cone, cnegone
           ! Scalar Arguments
           character, intent(in) :: uplo
           integer(${ik}$), intent(out) :: info
           integer(${ik}$), intent(in) :: lda, lwork, n
           ! Array Arguments
           integer(${ik}$), intent(out) :: ipiv(*)
           complex(${ck}$), intent(inout) :: a(lda,*)
           complex(${ck}$), intent(out) :: work(*)
        ! =====================================================================
           ! Local Scalars
           logical(lk) :: query_only, use_upper
           integer(${ik}$) :: panel_info, iws, col, k, ncols, ldwork, lwkopt, nb, nbmin, shift
           ! Executable Statements
           ! validate the arguments; the first offending one determines info.
           info = 0_${ik}$
           use_upper = stdlib_lsame( uplo, 'U' )
           query_only = ( lwork==-1_${ik}$ )
           if( .not.( use_upper .or. stdlib_lsame( uplo, 'L' ) ) ) then
              info = -1_${ik}$
           else if( n<0_${ik}$ ) then
              info = -2_${ik}$
           else if( lda<max( 1_${ik}$, n ) ) then
              info = -4_${ik}$
           else if( lwork<1_${ik}$ .and. .not.query_only ) then
              info = -7_${ik}$
           end if
           if( info/=0_${ik}$ ) then
              call stdlib${ii}$_xerbla( 'ZHETRF', -info )
              return
           end if
           ! arguments are valid: pick the block size and report the
           ! corresponding workspace size.
           nb = stdlib${ii}$_ilaenv( 1_${ik}$, 'ZHETRF', uplo, n, -1_${ik}$, -1_${ik}$, -1_${ik}$ )
           lwkopt = n*nb
           work( 1_${ik}$ ) = lwkopt
           if( query_only ) return
           ! shrink the block size when the supplied workspace is too small.
           nbmin = 2_${ik}$
           ldwork = n
           if( nb>1_${ik}$ .and. nb<n ) then
              iws = ldwork*nb
              if( lwork<iws ) then
                 nb = max( lwork / ldwork, 1_${ik}$ )
                 nbmin = max( 2_${ik}$, stdlib${ii}$_ilaenv( 2_${ik}$, 'ZHETRF', uplo, n, -1_${ik}$, -1_${ik}$, &
                           -1_${ik}$ ) )
              end if
           else
              iws = 1_${ik}$
           end if
           ! a block size below the crossover means: use unblocked code only.
           if( nb<nbmin ) nb = n
           if( use_upper ) then
              ! factorize a as u*d*u**h using the upper triangle of a.
              ! k walks from n down to 1 in steps of ncols, the number of
              ! columns handled per pass (nb or nb-1, or k for the last block).
              k = n
              do while( k>=1 )
                 if( k>nb ) then
                    ! blocked: factorize columns k-ncols+1:k, update columns 1:k-ncols
                    call stdlib${ii}$_${ci}$lahef( uplo, k, nb, ncols, a, lda, ipiv, work, n, panel_info )
                 else
                    ! unblocked: factorize the remaining columns 1:k
                    call stdlib${ii}$_${ci}$hetf2( uplo, k, a, lda, ipiv, panel_info )
                    ncols = k
                 end if
                 ! record only the first zero pivot encountered
                 if( info==0_${ik}$ .and. panel_info>0_${ik}$ ) info = panel_info
                 k = k - ncols
              end do
           else
              ! factorize a as l*d*l**h using the lower triangle of a.
              ! k walks from 1 up to n in steps of ncols, the number of
              ! columns handled per pass (nb or nb-1, or n-k+1 for the last block).
              k = 1_${ik}$
              do while( k<=n )
                 if( k<=n-nb ) then
                    ! blocked: factorize columns k:k+ncols-1, update columns k+ncols:n
                    call stdlib${ii}$_${ci}$lahef( uplo, n-k+1, nb, ncols, a( k, k ), lda, ipiv( k ), &
                              work, n, panel_info )
                 else
                    ! unblocked: factorize the remaining columns k:n
                    call stdlib${ii}$_${ci}$hetf2( uplo, n-k+1, a( k, k ), lda, ipiv( k ), panel_info )
                    ncols = n - k + 1_${ik}$
                 end if
                 ! record only the first zero pivot, in global numbering
                 if( info==0_${ik}$ .and. panel_info>0_${ik}$ ) info = panel_info + k - 1_${ik}$
                 ! pivots were computed relative to the submatrix starting at
                 ! (k,k): shift them by k-1 away from zero, keeping the sign.
                 shift = k - 1_${ik}$
                 do col = k, k + ncols - 1
                    ipiv( col ) = ipiv( col ) + merge( shift, -shift, ipiv( col )>0_${ik}$ )
                 end do
                 k = k + ncols
              end do
           end if
           work( 1_${ik}$ ) = lwkopt
     end subroutine stdlib${ii}$_${ci}$hetrf

#:endif
#:endfor

     pure module subroutine stdlib${ii}$_clahef( uplo, n, nb, kb, a, lda, ipiv, w, ldw, info )
     !! CLAHEF computes a partial factorization of a complex Hermitian
     !! matrix A using the Bunch-Kaufman diagonal pivoting method. The
     !! partial factorization has the form:
     !! A  =  ( I  U12 ) ( A11  0  ) (  I      0     )  if UPLO = 'U', or:
     !! ( 0  U22 ) (  0   D  ) ( U12**H U22**H )
     !! A  =  ( L11  0 ) (  D   0  ) ( L11**H L21**H )  if UPLO = 'L'
     !! ( L21  I ) (  0  A22 ) (  0      I     )
     !! where the order of D is at most NB. The actual order is returned in
     !! the argument KB, and is either NB or NB-1, or N if N <= NB.
     !! Note that U**H denotes the conjugate transpose of U.
     !! 
CLAHEF is an auxiliary routine called by CHETRF. It uses blocked code !! (calling Level 3 BLAS) to update the submatrix A11 (if UPLO = 'U') or !! A22 (if UPLO = 'L'). ! -- lapack computational routine -- ! -- lapack is a software package provided by univ. of tennessee, -- ! -- univ. of california berkeley, univ. of colorado denver and nag ltd..-- use stdlib_blas_constants_sp, only: negone, zero, half, one, two, three, four, eight, ten, czero, chalf, cone, cnegone ! Scalar Arguments character, intent(in) :: uplo integer(${ik}$), intent(out) :: info, kb integer(${ik}$), intent(in) :: lda, ldw, n, nb ! Array Arguments integer(${ik}$), intent(out) :: ipiv(*) complex(sp), intent(inout) :: a(lda,*) complex(sp), intent(out) :: w(ldw,*) ! ===================================================================== ! Parameters real(sp), parameter :: sevten = 17.0e+0_sp ! Local Scalars integer(${ik}$) :: imax, j, jb, jj, jmax, jp, k, kk, kkw, kp, kstep, kw real(sp) :: absakk, alpha, colmax, r1, rowmax, t complex(sp) :: d11, d21, d22, z ! Intrinsic Functions ! Statement Functions real(sp) :: cabs1 ! Statement Function Definitions cabs1( z ) = abs( real( z,KIND=sp) ) + abs( aimag( z ) ) ! Executable Statements info = 0_${ik}$ ! initialize alpha for use in choosing pivot block size. alpha = ( one+sqrt( sevten ) ) / eight if( stdlib_lsame( uplo, 'U' ) ) then ! factorize the trailing columns of a using the upper triangle ! of a and working backwards, and compute the matrix w = u12*d ! for use in updating a11 (note that conjg(w) is actually stored) ! k is the main loop index, decreasing from n in steps of 1 or 2 k = n 10 continue ! kw is the column of w which corresponds to column k of a kw = nb + k - n ! exit from loop if( ( k<=n-nb+1 .and. nb<n ) .or. k<1 )go to 30 kstep = 1_${ik}$ ! 
copy column k of a to column kw of w and update it call stdlib${ii}$_ccopy( k-1, a( 1_${ik}$, k ), 1_${ik}$, w( 1_${ik}$, kw ), 1_${ik}$ ) w( k, kw ) = real( a( k, k ),KIND=sp) if( k<n ) then call stdlib${ii}$_cgemv( 'NO TRANSPOSE', k, n-k, -cone, a( 1_${ik}$, k+1 ), lda,w( k, kw+1 ), & ldw, cone, w( 1_${ik}$, kw ), 1_${ik}$ ) w( k, kw ) = real( w( k, kw ),KIND=sp) end if ! determine rows and columns to be interchanged and whether ! a 1-by-1 or 2-by-2 pivot block will be used absakk = abs( real( w( k, kw ),KIND=sp) ) ! imax is the row-index of the largest off-diagonal element in ! column k, and colmax is its absolute value. ! determine both colmax and imax. if( k>1_${ik}$ ) then imax = stdlib${ii}$_icamax( k-1, w( 1_${ik}$, kw ), 1_${ik}$ ) colmax = cabs1( w( imax, kw ) ) else colmax = zero end if if( max( absakk, colmax )==zero ) then ! column k is zero or underflow: set info and continue if( info==0_${ik}$ )info = k kp = k a( k, k ) = real( a( k, k ),KIND=sp) else ! ============================================================ ! begin pivot search ! case(1) if( absakk>=alpha*colmax ) then ! no interchange, use 1-by-1 pivot block kp = k else ! begin pivot search along imax row ! copy column imax to column kw-1 of w and update it call stdlib${ii}$_ccopy( imax-1, a( 1_${ik}$, imax ), 1_${ik}$, w( 1_${ik}$, kw-1 ), 1_${ik}$ ) w( imax, kw-1 ) = real( a( imax, imax ),KIND=sp) call stdlib${ii}$_ccopy( k-imax, a( imax, imax+1 ), lda,w( imax+1, kw-1 ), 1_${ik}$ ) call stdlib${ii}$_clacgv( k-imax, w( imax+1, kw-1 ), 1_${ik}$ ) if( k<n ) then call stdlib${ii}$_cgemv( 'NO TRANSPOSE', k, n-k, -cone,a( 1_${ik}$, k+1 ), lda, w( imax,& kw+1 ), ldw,cone, w( 1_${ik}$, kw-1 ), 1_${ik}$ ) w( imax, kw-1 ) = real( w( imax, kw-1 ),KIND=sp) end if ! jmax is the column-index of the largest off-diagonal ! element in row imax, and rowmax is its absolute value. ! determine only rowmax. 
jmax = imax + stdlib${ii}$_icamax( k-imax, w( imax+1, kw-1 ), 1_${ik}$ ) rowmax = cabs1( w( jmax, kw-1 ) ) if( imax>1_${ik}$ ) then jmax = stdlib${ii}$_icamax( imax-1, w( 1_${ik}$, kw-1 ), 1_${ik}$ ) rowmax = max( rowmax, cabs1( w( jmax, kw-1 ) ) ) end if ! case(2) if( absakk>=alpha*colmax*( colmax / rowmax ) ) then ! no interchange, use 1-by-1 pivot block kp = k ! case(3) else if( abs( real( w( imax, kw-1 ),KIND=sp) )>=alpha*rowmax )then ! interchange rows and columns k and imax, use 1-by-1 ! pivot block kp = imax ! copy column kw-1 of w to column kw of w call stdlib${ii}$_ccopy( k, w( 1_${ik}$, kw-1 ), 1_${ik}$, w( 1_${ik}$, kw ), 1_${ik}$ ) ! case(4) else ! interchange rows and columns k-1 and imax, use 2-by-2 ! pivot block kp = imax kstep = 2_${ik}$ end if ! end pivot search along imax row end if ! end pivot search ! ============================================================ ! kk is the column of a where pivoting step stopped kk = k - kstep + 1_${ik}$ ! kkw is the column of w which corresponds to column kk of a kkw = nb + kk - n ! interchange rows and columns kp and kk. ! updated column kp is already stored in column kkw of w. if( kp/=kk ) then ! copy non-updated column kk to column kp of submatrix a ! at step k. no need to copy element into column k ! (or k and k-1 for 2-by-2 pivot) of a, since these columns ! will be later overwritten. a( kp, kp ) = real( a( kk, kk ),KIND=sp) call stdlib${ii}$_ccopy( kk-1-kp, a( kp+1, kk ), 1_${ik}$, a( kp, kp+1 ),lda ) call stdlib${ii}$_clacgv( kk-1-kp, a( kp, kp+1 ), lda ) if( kp>1_${ik}$ )call stdlib${ii}$_ccopy( kp-1, a( 1_${ik}$, kk ), 1_${ik}$, a( 1_${ik}$, kp ), 1_${ik}$ ) ! interchange rows kk and kp in last k+1 to n columns of a ! (columns k (or k and k-1 for 2-by-2 pivot) of a will be ! later overwritten). interchange rows kk and kp ! in last kkw to nb columns of w. 
if( k<n )call stdlib${ii}$_cswap( n-k, a( kk, k+1 ), lda, a( kp, k+1 ),lda ) call stdlib${ii}$_cswap( n-kk+1, w( kk, kkw ), ldw, w( kp, kkw ),ldw ) end if if( kstep==1_${ik}$ ) then ! 1-by-1 pivot block d(k): column kw of w now holds ! w(kw) = u(k)*d(k), ! where u(k) is the k-th column of u ! (1) store subdiag. elements of column u(k) ! and 1-by-1 block d(k) in column k of a. ! (note: diagonal element u(k,k) is a unit element ! and not stored) ! a(k,k) := d(k,k) = w(k,kw) ! a(1:k-1,k) := u(1:k-1,k) = w(1:k-1,kw)/d(k,k) ! (note: no need to use for hermitian matrix ! a( k, k ) = real( w( k, k),KIND=sp) to separately copy diagonal ! element d(k,k) from w (potentially saves only one load)) call stdlib${ii}$_ccopy( k, w( 1_${ik}$, kw ), 1_${ik}$, a( 1_${ik}$, k ), 1_${ik}$ ) if( k>1_${ik}$ ) then ! (note: no need to check if a(k,k) is not zero, ! since that was ensured earlier in pivot search: ! case a(k,k) = 0 falls into 2x2 pivot case(4)) r1 = one / real( a( k, k ),KIND=sp) call stdlib${ii}$_csscal( k-1, r1, a( 1_${ik}$, k ), 1_${ik}$ ) ! (2) conjugate column w(kw) call stdlib${ii}$_clacgv( k-1, w( 1_${ik}$, kw ), 1_${ik}$ ) end if else ! 2-by-2 pivot block d(k): columns kw and kw-1 of w now hold ! ( w(kw-1) w(kw) ) = ( u(k-1) u(k) )*d(k) ! where u(k) and u(k-1) are the k-th and (k-1)-th columns ! of u ! (1) store u(1:k-2,k-1) and u(1:k-2,k) and 2-by-2 ! block d(k-1:k,k-1:k) in columns k-1 and k of a. ! (note: 2-by-2 diagonal block u(k-1:k,k-1:k) is a unit ! block and not stored) ! a(k-1:k,k-1:k) := d(k-1:k,k-1:k) = w(k-1:k,kw-1:kw) ! a(1:k-2,k-1:k) := u(1:k-2,k:k-1:k) = ! = w(1:k-2,kw-1:kw) * ( d(k-1:k,k-1:k)**(-1) ) if( k>2_${ik}$ ) then ! factor out the columns of the inverse of 2-by-2 pivot ! block d, so that each column contains 1, to reduce the ! number of flops when we multiply panel ! ( w(kw-1) w(kw) ) by this inverse, i.e. by d**(-1). ! d**(-1) = ( d11 cj(d21) )**(-1) = ! ( d21 d22 ) ! = 1/(d11*d22-|d21|**2) * ( ( d22) (-cj(d21) ) ) = ! ( (-d21) ( d11 ) ) ! 
= 1/(|d21|**2) * 1/((d11/cj(d21))*(d22/d21)-1) * ! * ( d21*( d22/d21 ) conj(d21)*( - 1 ) ) = ! ( ( -1 ) ( d11/conj(d21) ) ) ! = 1/(|d21|**2) * 1/(d22*d11-1) * ! * ( d21*( d11 ) conj(d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = (1/|d21|**2) * t * ( d21*( d11 ) conj(d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = ( (t/conj(d21))*( d11 ) (t/d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = ( conj(d21)*( d11 ) d21*( -1 ) ) ! ( ( -1 ) ( d22 ) ), ! where d11 = d22/d21, ! d22 = d11/conj(d21), ! d21 = t/d21, ! t = 1/(d22*d11-1). ! (note: no need to check for division by zero, ! since that was ensured earlier in pivot search: ! (a) d21 != 0, since in 2x2 pivot case(4) ! |d21| should be larger than |d11| and |d22|; ! (b) (d22*d11 - 1) != 0, since from (a), ! both |d11| < 1, |d22| < 1, hence |d22*d11| << 1.) d21 = w( k-1, kw ) d11 = w( k, kw ) / conjg( d21 ) d22 = w( k-1, kw-1 ) / d21 t = one / ( real( d11*d22,KIND=sp)-one ) d21 = t / d21 ! update elements in columns a(k-1) and a(k) as ! dot products of rows of ( w(kw-1) w(kw) ) and columns ! of d**(-1) do j = 1, k - 2 a( j, k-1 ) = d21*( d11*w( j, kw-1 )-w( j, kw ) ) a( j, k ) = conjg( d21 )*( d22*w( j, kw )-w( j, kw-1 ) ) end do end if ! copy d(k) to a a( k-1, k-1 ) = w( k-1, kw-1 ) a( k-1, k ) = w( k-1, kw ) a( k, k ) = w( k, kw ) ! (2) conjugate columns w(kw) and w(kw-1) call stdlib${ii}$_clacgv( k-1, w( 1_${ik}$, kw ), 1_${ik}$ ) call stdlib${ii}$_clacgv( k-2, w( 1_${ik}$, kw-1 ), 1_${ik}$ ) end if end if ! store details of the interchanges in ipiv if( kstep==1_${ik}$ ) then ipiv( k ) = kp else ipiv( k ) = -kp ipiv( k-1 ) = -kp end if ! decrease k and return to the start of the main loop k = k - kstep go to 10 30 continue ! update the upper triangle of a11 (= a(1:k,1:k)) as ! a11 := a11 - u12*d*u12**h = a11 - u12*w**h ! computing blocks of nb columns at a time (note that conjg(w) is ! actually stored) do j = ( ( k-1 ) / nb )*nb + 1, 1, -nb jb = min( nb, k-j+1 ) ! 
update the upper triangle of the diagonal block do jj = j, j + jb - 1 a( jj, jj ) = real( a( jj, jj ),KIND=sp) call stdlib${ii}$_cgemv( 'NO TRANSPOSE', jj-j+1, n-k, -cone,a( j, k+1 ), lda, w( jj,& kw+1 ), ldw, cone,a( j, jj ), 1_${ik}$ ) a( jj, jj ) = real( a( jj, jj ),KIND=sp) end do ! update the rectangular superdiagonal block call stdlib${ii}$_cgemm( 'NO TRANSPOSE', 'TRANSPOSE', j-1, jb, n-k,-cone, a( 1_${ik}$, k+1 ), & lda, w( j, kw+1 ), ldw,cone, a( 1_${ik}$, j ), lda ) end do ! put u12 in standard form by partially undoing the interchanges ! in of rows in columns k+1:n looping backwards from k+1 to n j = k + 1_${ik}$ 60 continue ! undo the interchanges (if any) of rows j and jp ! at each step j ! (here, j is a diagonal index) jj = j jp = ipiv( j ) if( jp<0_${ik}$ ) then jp = -jp ! (here, j is a diagonal index) j = j + 1_${ik}$ end if ! (note: here, j is used to determine row length. length n-j+1 ! of the rows to swap back doesn't include diagonal element) j = j + 1_${ik}$ if( jp/=jj .and. j<=n )call stdlib${ii}$_cswap( n-j+1, a( jp, j ), lda, a( jj, j ), & lda ) if( j<=n )go to 60 ! set kb to the number of columns factorized kb = n - k else ! factorize the leading columns of a using the lower triangle ! of a and working forwards, and compute the matrix w = l21*d ! for use in updating a22 (note that conjg(w) is actually stored) ! k is the main loop index, increasing from 1 in steps of 1 or 2 k = 1_${ik}$ 70 continue ! exit from loop if( ( k>=nb .and. nb<n ) .or. k>n )go to 90 kstep = 1_${ik}$ ! copy column k of a to column k of w and update it w( k, k ) = real( a( k, k ),KIND=sp) if( k<n )call stdlib${ii}$_ccopy( n-k, a( k+1, k ), 1_${ik}$, w( k+1, k ), 1_${ik}$ ) call stdlib${ii}$_cgemv( 'NO TRANSPOSE', n-k+1, k-1, -cone, a( k, 1_${ik}$ ), lda,w( k, 1_${ik}$ ), ldw,& cone, w( k, k ), 1_${ik}$ ) w( k, k ) = real( w( k, k ),KIND=sp) ! determine rows and columns to be interchanged and whether ! 
a 1-by-1 or 2-by-2 pivot block will be used absakk = abs( real( w( k, k ),KIND=sp) ) ! imax is the row-index of the largest off-diagonal element in ! column k, and colmax is its absolute value. ! determine both colmax and imax. if( k<n ) then imax = k + stdlib${ii}$_icamax( n-k, w( k+1, k ), 1_${ik}$ ) colmax = cabs1( w( imax, k ) ) else colmax = zero end if if( max( absakk, colmax )==zero ) then ! column k is zero or underflow: set info and continue if( info==0_${ik}$ )info = k kp = k a( k, k ) = real( a( k, k ),KIND=sp) else ! ============================================================ ! begin pivot search ! case(1) if( absakk>=alpha*colmax ) then ! no interchange, use 1-by-1 pivot block kp = k else ! begin pivot search along imax row ! copy column imax to column k+1 of w and update it call stdlib${ii}$_ccopy( imax-k, a( imax, k ), lda, w( k, k+1 ), 1_${ik}$ ) call stdlib${ii}$_clacgv( imax-k, w( k, k+1 ), 1_${ik}$ ) w( imax, k+1 ) = real( a( imax, imax ),KIND=sp) if( imax<n )call stdlib${ii}$_ccopy( n-imax, a( imax+1, imax ), 1_${ik}$,w( imax+1, k+1 ), & 1_${ik}$ ) call stdlib${ii}$_cgemv( 'NO TRANSPOSE', n-k+1, k-1, -cone, a( k, 1_${ik}$ ),lda, w( imax, & 1_${ik}$ ), ldw, cone, w( k, k+1 ),1_${ik}$ ) w( imax, k+1 ) = real( w( imax, k+1 ),KIND=sp) ! jmax is the column-index of the largest off-diagonal ! element in row imax, and rowmax is its absolute value. ! determine only rowmax. jmax = k - 1_${ik}$ + stdlib${ii}$_icamax( imax-k, w( k, k+1 ), 1_${ik}$ ) rowmax = cabs1( w( jmax, k+1 ) ) if( imax<n ) then jmax = imax + stdlib${ii}$_icamax( n-imax, w( imax+1, k+1 ), 1_${ik}$ ) rowmax = max( rowmax, cabs1( w( jmax, k+1 ) ) ) end if ! case(2) if( absakk>=alpha*colmax*( colmax / rowmax ) ) then ! no interchange, use 1-by-1 pivot block kp = k ! case(3) else if( abs( real( w( imax, k+1 ),KIND=sp) )>=alpha*rowmax )then ! interchange rows and columns k and imax, use 1-by-1 ! pivot block kp = imax ! 
copy column k+1 of w to column k of w call stdlib${ii}$_ccopy( n-k+1, w( k, k+1 ), 1_${ik}$, w( k, k ), 1_${ik}$ ) ! case(4) else ! interchange rows and columns k+1 and imax, use 2-by-2 ! pivot block kp = imax kstep = 2_${ik}$ end if ! end pivot search along imax row end if ! end pivot search ! ============================================================ ! kk is the column of a where pivoting step stopped kk = k + kstep - 1_${ik}$ ! interchange rows and columns kp and kk. ! updated column kp is already stored in column kk of w. if( kp/=kk ) then ! copy non-updated column kk to column kp of submatrix a ! at step k. no need to copy element into column k ! (or k and k+1 for 2-by-2 pivot) of a, since these columns ! will be later overwritten. a( kp, kp ) = real( a( kk, kk ),KIND=sp) call stdlib${ii}$_ccopy( kp-kk-1, a( kk+1, kk ), 1_${ik}$, a( kp, kk+1 ),lda ) call stdlib${ii}$_clacgv( kp-kk-1, a( kp, kk+1 ), lda ) if( kp<n )call stdlib${ii}$_ccopy( n-kp, a( kp+1, kk ), 1_${ik}$, a( kp+1, kp ), 1_${ik}$ ) ! interchange rows kk and kp in first k-1 columns of a ! (columns k (or k and k+1 for 2-by-2 pivot) of a will be ! later overwritten). interchange rows kk and kp ! in first kk columns of w. if( k>1_${ik}$ )call stdlib${ii}$_cswap( k-1, a( kk, 1_${ik}$ ), lda, a( kp, 1_${ik}$ ), lda ) call stdlib${ii}$_cswap( kk, w( kk, 1_${ik}$ ), ldw, w( kp, 1_${ik}$ ), ldw ) end if if( kstep==1_${ik}$ ) then ! 1-by-1 pivot block d(k): column k of w now holds ! w(k) = l(k)*d(k), ! where l(k) is the k-th column of l ! (1) store subdiag. elements of column l(k) ! and 1-by-1 block d(k) in column k of a. ! (note: diagonal element l(k,k) is a unit element ! and not stored) ! a(k,k) := d(k,k) = w(k,k) ! a(k+1:n,k) := l(k+1:n,k) = w(k+1:n,k)/d(k,k) ! (note: no need to use for hermitian matrix ! a( k, k ) = real( w( k, k),KIND=sp) to separately copy diagonal ! 
element d(k,k) from w (potentially saves only one load)) call stdlib${ii}$_ccopy( n-k+1, w( k, k ), 1_${ik}$, a( k, k ), 1_${ik}$ ) if( k<n ) then ! (note: no need to check if a(k,k) is not zero, ! since that was ensured earlier in pivot search: ! case a(k,k) = 0 falls into 2x2 pivot case(4)) r1 = one / real( a( k, k ),KIND=sp) call stdlib${ii}$_csscal( n-k, r1, a( k+1, k ), 1_${ik}$ ) ! (2) conjugate column w(k) call stdlib${ii}$_clacgv( n-k, w( k+1, k ), 1_${ik}$ ) end if else ! 2-by-2 pivot block d(k): columns k and k+1 of w now hold ! ( w(k) w(k+1) ) = ( l(k) l(k+1) )*d(k) ! where l(k) and l(k+1) are the k-th and (k+1)-th columns ! of l ! (1) store l(k+2:n,k) and l(k+2:n,k+1) and 2-by-2 ! block d(k:k+1,k:k+1) in columns k and k+1 of a. ! (note: 2-by-2 diagonal block l(k:k+1,k:k+1) is a unit ! block and not stored) ! a(k:k+1,k:k+1) := d(k:k+1,k:k+1) = w(k:k+1,k:k+1) ! a(k+2:n,k:k+1) := l(k+2:n,k:k+1) = ! = w(k+2:n,k:k+1) * ( d(k:k+1,k:k+1)**(-1) ) if( k<n-1 ) then ! factor out the columns of the inverse of 2-by-2 pivot ! block d, so that each column contains 1, to reduce the ! number of flops when we multiply panel ! ( w(kw-1) w(kw) ) by this inverse, i.e. by d**(-1). ! d**(-1) = ( d11 cj(d21) )**(-1) = ! ( d21 d22 ) ! = 1/(d11*d22-|d21|**2) * ( ( d22) (-cj(d21) ) ) = ! ( (-d21) ( d11 ) ) ! = 1/(|d21|**2) * 1/((d11/cj(d21))*(d22/d21)-1) * ! * ( d21*( d22/d21 ) conj(d21)*( - 1 ) ) = ! ( ( -1 ) ( d11/conj(d21) ) ) ! = 1/(|d21|**2) * 1/(d22*d11-1) * ! * ( d21*( d11 ) conj(d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = (1/|d21|**2) * t * ( d21*( d11 ) conj(d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = ( (t/conj(d21))*( d11 ) (t/d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = ( conj(d21)*( d11 ) d21*( -1 ) ) ! ( ( -1 ) ( d22 ) ) ! where d11 = d22/d21, ! d22 = d11/conj(d21), ! d21 = t/d21, ! t = 1/(d22*d11-1). ! (note: no need to check for division by zero, ! since that was ensured earlier in pivot search: ! (a) d21 != 0, since in 2x2 pivot case(4) ! 
|d21| should be larger than |d11| and |d22|; ! (b) (d22*d11 - 1) != 0, since from (a), ! both |d11| < 1, |d22| < 1, hence |d22*d11| << 1.) d21 = w( k+1, k ) d11 = w( k+1, k+1 ) / d21 d22 = w( k, k ) / conjg( d21 ) t = one / ( real( d11*d22,KIND=sp)-one ) d21 = t / d21 ! update elements in columns a(k) and a(k+1) as ! dot products of rows of ( w(k) w(k+1) ) and columns ! of d**(-1) do j = k + 2, n a( j, k ) = conjg( d21 )*( d11*w( j, k )-w( j, k+1 ) ) a( j, k+1 ) = d21*( d22*w( j, k+1 )-w( j, k ) ) end do end if ! copy d(k) to a a( k, k ) = w( k, k ) a( k+1, k ) = w( k+1, k ) a( k+1, k+1 ) = w( k+1, k+1 ) ! (2) conjugate columns w(k) and w(k+1) call stdlib${ii}$_clacgv( n-k, w( k+1, k ), 1_${ik}$ ) call stdlib${ii}$_clacgv( n-k-1, w( k+2, k+1 ), 1_${ik}$ ) end if end if ! store details of the interchanges in ipiv if( kstep==1_${ik}$ ) then ipiv( k ) = kp else ipiv( k ) = -kp ipiv( k+1 ) = -kp end if ! increase k and return to the start of the main loop k = k + kstep go to 70 90 continue ! update the lower triangle of a22 (= a(k:n,k:n)) as ! a22 := a22 - l21*d*l21**h = a22 - l21*w**h ! computing blocks of nb columns at a time (note that conjg(w) is ! actually stored) do j = k, n, nb jb = min( nb, n-j+1 ) ! update the lower triangle of the diagonal block do jj = j, j + jb - 1 a( jj, jj ) = real( a( jj, jj ),KIND=sp) call stdlib${ii}$_cgemv( 'NO TRANSPOSE', j+jb-jj, k-1, -cone,a( jj, 1_${ik}$ ), lda, w( jj,& 1_${ik}$ ), ldw, cone,a( jj, jj ), 1_${ik}$ ) a( jj, jj ) = real( a( jj, jj ),KIND=sp) end do ! update the rectangular subdiagonal block if( j+jb<=n )call stdlib${ii}$_cgemm( 'NO TRANSPOSE', 'TRANSPOSE', n-j-jb+1, jb,k-1, -& cone, a( j+jb, 1_${ik}$ ), lda, w( j, 1_${ik}$ ),ldw, cone, a( j+jb, j ), lda ) end do ! put l21 in standard form by partially undoing the interchanges ! of rows in columns 1:k-1 looping backwards from k-1 to 1 j = k - 1_${ik}$ 120 continue ! undo the interchanges (if any) of rows j and jp ! at each step j ! 
(here, j is a diagonal index) jj = j jp = ipiv( j ) if( jp<0_${ik}$ ) then jp = -jp ! (here, j is a diagonal index) j = j - 1_${ik}$ end if ! (note: here, j is used to determine row length. length j ! of the rows to swap back doesn't include diagonal element) j = j - 1_${ik}$ if( jp/=jj .and. j>=1_${ik}$ )call stdlib${ii}$_cswap( j, a( jp, 1_${ik}$ ), lda, a( jj, 1_${ik}$ ), lda ) if( j>=1 )go to 120 ! set kb to the number of columns factorized kb = k - 1_${ik}$ end if return end subroutine stdlib${ii}$_clahef pure module subroutine stdlib${ii}$_zlahef( uplo, n, nb, kb, a, lda, ipiv, w, ldw, info ) !! ZLAHEF computes a partial factorization of a complex Hermitian !! matrix A using the Bunch-Kaufman diagonal pivoting method. The !! partial factorization has the form: !! A = ( I U12 ) ( A11 0 ) ( I 0 ) if UPLO = 'U', or: !! ( 0 U22 ) ( 0 D ) ( U12**H U22**H ) !! A = ( L11 0 ) ( D 0 ) ( L11**H L21**H ) if UPLO = 'L' !! ( L21 I ) ( 0 A22 ) ( 0 I ) !! where the order of D is at most NB. The actual order is returned in !! the argument KB, and is either NB or NB-1, or N if N <= NB. !! Note that U**H denotes the conjugate transpose of U. !! ZLAHEF is an auxiliary routine called by ZHETRF. It uses blocked code !! (calling Level 3 BLAS) to update the submatrix A11 (if UPLO = 'U') or !! A22 (if UPLO = 'L'). !! On exit, KB holds the number of columns that were factorized. !! IPIV(k) = kp > 0 records a 1-by-1 pivot for which rows and columns k !! and kp were interchanged (kp = k means no interchange); two adjacent !! entries both equal to -kp record a 2-by-2 pivot. !! INFO is 0 unless a pivot column is found to be exactly zero, in which !! case INFO is the index k of the first such column met and the !! factorization carries on. W is workspace with leading dimension LDW. ! -- lapack computational routine -- ! -- lapack is a software package provided by univ. of tennessee, -- ! -- univ. of california berkeley, univ. of colorado denver and nag ltd..-- use stdlib_blas_constants_dp, only: negone, zero, half, one, two, three, four, eight, ten, czero, chalf, cone, cnegone ! Scalar Arguments character, intent(in) :: uplo integer(${ik}$), intent(out) :: info, kb integer(${ik}$), intent(in) :: lda, ldw, n, nb ! Array Arguments integer(${ik}$), intent(out) :: ipiv(*) complex(dp), intent(inout) :: a(lda,*) complex(dp), intent(out) :: w(ldw,*) ! ===================================================================== !
Parameters real(dp), parameter :: sevten = 17.0e+0_dp ! Local Scalars integer(${ik}$) :: imax, j, jb, jj, jmax, jp, k, kk, kkw, kp, kstep, kw real(dp) :: absakk, alpha, colmax, r1, rowmax, t complex(dp) :: d11, d21, d22, z ! Intrinsic Functions ! Statement Functions real(dp) :: cabs1 ! Statement Function Definitions ! (cabs1(z) = |re(z)| + |im(z)|, the magnitude used for colmax and rowmax) cabs1( z ) = abs( real( z,KIND=dp) ) + abs( aimag( z ) ) ! Executable Statements info = 0_${ik}$ ! initialize alpha for use in choosing pivot block size: ! alpha = (1+sqrt(17))/8 is the threshold of the pivot tests below. alpha = ( one+sqrt( sevten ) ) / eight if( stdlib_lsame( uplo, 'U' ) ) then ! factorize the trailing columns of a using the upper triangle ! of a and working backwards, and compute the matrix w = u12*d ! for use in updating a11 (note that conjg(w) is actually stored) ! k is the main loop index, decreasing from n in steps of 1 or 2 ! kw is the column of w which corresponds to column k of a k = n 10 continue kw = nb + k - n ! exit from loop: k<=n-nb+1 is the same as kw<=1, i.e. there is no ! column kw-1 of w left for the pivot search (tested only when nb<n); ! k<1 means every column has been processed if( ( k<=n-nb+1 .and. nb<n ) .or. k<1 )go to 30 kstep = 1_${ik}$ ! copy column k of a to column kw of w and update it ! (the diagonal entry is copied as a real number) call stdlib${ii}$_zcopy( k-1, a( 1_${ik}$, k ), 1_${ik}$, w( 1_${ik}$, kw ), 1_${ik}$ ) w( k, kw ) = real( a( k, k ),KIND=dp) if( k<n ) then call stdlib${ii}$_zgemv( 'NO TRANSPOSE', k, n-k, -cone, a( 1_${ik}$, k+1 ), lda,w( k, kw+1 ), & ldw, cone, w( 1_${ik}$, kw ), 1_${ik}$ ) w( k, kw ) = real( w( k, kw ),KIND=dp) end if ! determine rows and columns to be interchanged and whether ! a 1-by-1 or 2-by-2 pivot block will be used absakk = abs( real( w( k, kw ),KIND=dp) ) ! imax is the row-index of the largest off-diagonal element in ! column k, and colmax is its magnitude as measured by cabs1. ! determine both colmax and imax. if( k>1_${ik}$ ) then imax = stdlib${ii}$_izamax( k-1, w( 1_${ik}$, kw ), 1_${ik}$ ) colmax = cabs1( w( imax, kw ) ) else colmax = zero end if if( max( absakk, colmax )==zero ) then ! column k is zero or underflow: set info (first occurrence only) ! and continue with a 1-by-1 step without interchange if( info==0_${ik}$ )info = k kp = k a( k, k ) = real( a( k, k ),KIND=dp) else !
============================================================ ! begin pivot search ! case(1): the diagonal entry is at least alpha times the largest ! off-diagonal entry of column k if( absakk>=alpha*colmax ) then ! no interchange, use 1-by-1 pivot block kp = k else ! begin pivot search along imax row ! copy column imax to column kw-1 of w and update it ! (the part of row imax to the right of the diagonal is read from a ! with stride lda and then conjugated) call stdlib${ii}$_zcopy( imax-1, a( 1_${ik}$, imax ), 1_${ik}$, w( 1_${ik}$, kw-1 ), 1_${ik}$ ) w( imax, kw-1 ) = real( a( imax, imax ),KIND=dp) call stdlib${ii}$_zcopy( k-imax, a( imax, imax+1 ), lda,w( imax+1, kw-1 ), 1_${ik}$ ) call stdlib${ii}$_zlacgv( k-imax, w( imax+1, kw-1 ), 1_${ik}$ ) if( k<n ) then call stdlib${ii}$_zgemv( 'NO TRANSPOSE', k, n-k, -cone,a( 1_${ik}$, k+1 ), lda, w( imax,& kw+1 ), ldw,cone, w( 1_${ik}$, kw-1 ), 1_${ik}$ ) w( imax, kw-1 ) = real( w( imax, kw-1 ),KIND=dp) end if ! jmax is the column-index of the largest off-diagonal ! element in row imax, and rowmax is its magnitude (cabs1). ! determine only rowmax; jmax is just a scratch index here. jmax = imax + stdlib${ii}$_izamax( k-imax, w( imax+1, kw-1 ), 1_${ik}$ ) rowmax = cabs1( w( jmax, kw-1 ) ) if( imax>1_${ik}$ ) then jmax = stdlib${ii}$_izamax( imax-1, w( 1_${ik}$, kw-1 ), 1_${ik}$ ) rowmax = max( rowmax, cabs1( w( jmax, kw-1 ) ) ) end if ! case(2): same test as case(1) with the threshold scaled by ! colmax/rowmax if( absakk>=alpha*colmax*( colmax / rowmax ) ) then ! no interchange, use 1-by-1 pivot block kp = k ! case(3): the diagonal entry of column imax is at least ! alpha*rowmax else if( abs( real( w( imax, kw-1 ),KIND=dp) )>=alpha*rowmax )then ! interchange rows and columns k and imax, use 1-by-1 ! pivot block kp = imax ! copy column kw-1 of w to column kw of w call stdlib${ii}$_zcopy( k, w( 1_${ik}$, kw-1 ), 1_${ik}$, w( 1_${ik}$, kw ), 1_${ik}$ ) ! case(4): none of the tests above holds else ! interchange rows and columns k-1 and imax, use 2-by-2 ! pivot block kp = imax kstep = 2_${ik}$ end if ! end pivot search along imax row end if ! end pivot search ! ============================================================ ! kk is the column of a where pivoting step stopped ! (kk = k for a 1-by-1 pivot, kk = k-1 for a 2-by-2 pivot) kk = k - kstep + 1_${ik}$ ! kkw is the column of w which corresponds to column kk of a kkw = nb + kk - n !
interchange rows and columns kp and kk. ! updated column kp is already stored in column kkw of w. if( kp/=kk ) then ! copy non-updated column kk to column kp of submatrix a ! at step k. no need to copy element into column k ! (or k and k-1 for 2-by-2 pivot) of a, since these columns ! will be later overwritten. a( kp, kp ) = real( a( kk, kk ),KIND=dp) call stdlib${ii}$_zcopy( kk-1-kp, a( kp+1, kk ), 1_${ik}$, a( kp, kp+1 ),lda ) call stdlib${ii}$_zlacgv( kk-1-kp, a( kp, kp+1 ), lda ) if( kp>1_${ik}$ )call stdlib${ii}$_zcopy( kp-1, a( 1_${ik}$, kk ), 1_${ik}$, a( 1_${ik}$, kp ), 1_${ik}$ ) ! interchange rows kk and kp in last k+1 to n columns of a ! (columns k (or k and k-1 for 2-by-2 pivot) of a will be ! later overwritten). interchange rows kk and kp ! in last kkw to nb columns of w. if( k<n )call stdlib${ii}$_zswap( n-k, a( kk, k+1 ), lda, a( kp, k+1 ),lda ) call stdlib${ii}$_zswap( n-kk+1, w( kk, kkw ), ldw, w( kp, kkw ),ldw ) end if if( kstep==1_${ik}$ ) then ! 1-by-1 pivot block d(k): column kw of w now holds ! w(kw) = u(k)*d(k), ! where u(k) is the k-th column of u ! (1) store superdiag. elements of column u(k) ! and 1-by-1 block d(k) in column k of a. ! (note: diagonal element u(k,k) is a unit element ! and not stored) ! a(k,k) := d(k,k) = w(k,kw) ! a(1:k-1,k) := u(1:k-1,k) = w(1:k-1,kw)/d(k,k) ! (note: for a hermitian matrix there is no need to use ! a( k, k ) = real( w( k, kw ),KIND=dp) to separately copy diagonal ! element d(k,k) from w (potentially saves only one load)) call stdlib${ii}$_zcopy( k, w( 1_${ik}$, kw ), 1_${ik}$, a( 1_${ik}$, k ), 1_${ik}$ ) if( k>1_${ik}$ ) then ! (note: no need to check if a(k,k) is not zero, ! since that was ensured earlier in pivot search: ! case a(k,k) = 0 falls into 2x2 pivot case(4)) r1 = one / real( a( k, k ),KIND=dp) call stdlib${ii}$_zdscal( k-1, r1, a( 1_${ik}$, k ), 1_${ik}$ ) ! (2) conjugate column w(kw) call stdlib${ii}$_zlacgv( k-1, w( 1_${ik}$, kw ), 1_${ik}$ ) end if else !
2-by-2 pivot block d(k): columns kw and kw-1 of w now hold ! ( w(kw-1) w(kw) ) = ( u(k-1) u(k) )*d(k) ! where u(k) and u(k-1) are the k-th and (k-1)-th columns ! of u ! (1) store u(1:k-2,k-1) and u(1:k-2,k) and 2-by-2 ! block d(k-1:k,k-1:k) in columns k-1 and k of a. ! (note: 2-by-2 diagonal block u(k-1:k,k-1:k) is a unit ! block and not stored) ! a(k-1:k,k-1:k) := d(k-1:k,k-1:k) = w(k-1:k,kw-1:kw) ! a(1:k-2,k-1:k) := u(1:k-2,k-1:k) = ! = w(1:k-2,kw-1:kw) * ( d(k-1:k,k-1:k)**(-1) ) if( k>2_${ik}$ ) then ! factor out the columns of the inverse of 2-by-2 pivot ! block d, so that each column contains 1, to reduce the ! number of flops when we multiply panel ! ( w(kw-1) w(kw) ) by this inverse, i.e. by d**(-1). ! d**(-1) = ( d11 cj(d21) )**(-1) = ! ( d21 d22 ) ! = 1/(d11*d22-|d21|**2) * ( ( d22) (-cj(d21) ) ) = ! ( (-d21) ( d11 ) ) ! = 1/(|d21|**2) * 1/((d11/cj(d21))*(d22/d21)-1) * ! * ( d21*( d22/d21 ) conj(d21)*( - 1 ) ) = ! ( ( -1 ) ( d11/conj(d21) ) ) ! = 1/(|d21|**2) * 1/(d22*d11-1) * ! * ( d21*( d11 ) conj(d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = (1/|d21|**2) * t * ( d21*( d11 ) conj(d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = ( (t/conj(d21))*( d11 ) (t/d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = ( conj(d21)*( d11 ) d21*( -1 ) ) ! ( ( -1 ) ( d22 ) ), ! where d11 = d22/d21, ! d22 = d11/conj(d21), ! d21 = t/d21, ! t = 1/(d22*d11-1). ! (NOTE(review): in the where-clause the names on the left appear to ! be the rescaled local variables and those on the right the entries ! of d; the code below reads them from w as d21 <- w(k-1,kw), ! d11 <- w(k,kw)/conjg(d21), d22 <- w(k-1,kw-1)/d21.) ! (note: no need to check for division by zero, ! since that was ensured earlier in pivot search: ! (a) d21 != 0, since in 2x2 pivot case(4) ! |d21| should be larger than |d11| and |d22|; ! (b) (d22*d11 - 1) != 0, since from (a), ! both |d11| < 1, |d22| < 1, hence |d22*d11| << 1.) d21 = w( k-1, kw ) d11 = w( k, kw ) / conjg( d21 ) d22 = w( k-1, kw-1 ) / d21 t = one / ( real( d11*d22,KIND=dp)-one ) d21 = t / d21 ! update elements in columns a(k-1) and a(k) as ! dot products of rows of ( w(kw-1) w(kw) ) and columns !
of d**(-1) do j = 1, k - 2 a( j, k-1 ) = d21*( d11*w( j, kw-1 )-w( j, kw ) ) a( j, k ) = conjg( d21 )*( d22*w( j, kw )-w( j, kw-1 ) ) end do end if ! copy d(k) to a (only the upper triangle of the 2-by-2 block) a( k-1, k-1 ) = w( k-1, kw-1 ) a( k-1, k ) = w( k-1, kw ) a( k, k ) = w( k, kw ) ! (2) conjugate columns w(kw) and w(kw-1) call stdlib${ii}$_zlacgv( k-1, w( 1_${ik}$, kw ), 1_${ik}$ ) call stdlib${ii}$_zlacgv( k-2, w( 1_${ik}$, kw-1 ), 1_${ik}$ ) end if end if ! store details of the interchanges in ipiv ! (kp for a 1-by-1 pivot; -kp in both ipiv(k) and ipiv(k-1) for a ! 2-by-2 pivot) if( kstep==1_${ik}$ ) then ipiv( k ) = kp else ipiv( k ) = -kp ipiv( k-1 ) = -kp end if ! decrease k and return to the start of the main loop k = k - kstep go to 10 30 continue ! update the upper triangle of a11 (= a(1:k,1:k)) as ! a11 := a11 - u12*d*u12**h = a11 - u12*w**h ! computing blocks of nb columns at a time (note that conjg(w) is ! actually stored) do j = ( ( k-1 ) / nb )*nb + 1, 1, -nb jb = min( nb, k-j+1 ) ! update the upper triangle of the diagonal block ! (the imaginary part of each diagonal entry is discarded before and ! after its column update) do jj = j, j + jb - 1 a( jj, jj ) = real( a( jj, jj ),KIND=dp) call stdlib${ii}$_zgemv( 'NO TRANSPOSE', jj-j+1, n-k, -cone,a( j, k+1 ), lda, w( jj,& kw+1 ), ldw, cone,a( j, jj ), 1_${ik}$ ) a( jj, jj ) = real( a( jj, jj ),KIND=dp) end do ! update the rectangular superdiagonal block call stdlib${ii}$_zgemm( 'NO TRANSPOSE', 'TRANSPOSE', j-1, jb, n-k,-cone, a( 1_${ik}$, k+1 ), & lda, w( j, kw+1 ), ldw,cone, a( 1_${ik}$, j ), lda ) end do ! put u12 in standard form by partially undoing the interchanges ! in columns k+1:n, stepping forwards from k+1 to n (the reverse of ! the order in which the columns were factorized) j = k + 1_${ik}$ 60 continue ! undo the interchanges (if any) of rows jj and jp at each ! step j ! (here, j is a diagonal index) jj = j jp = ipiv( j ) if( jp<0_${ik}$ ) then jp = -jp ! (here, j is a diagonal index) j = j + 1_${ik}$ end if ! (note: here, j is used to determine row length. length n-j+1 ! of the rows to swap back doesn't include diagonal element) j = j + 1_${ik}$ if( jp/=jj .and. j<=n )call stdlib${ii}$_zswap( n-j+1, a( jp, j ), lda, a( jj, j ), & lda ) ! (a further pass starting at j = n could not swap anything, because j ! would exceed n after the increment, so testing j<n is sufficient) if( j<n )go to 60 !
set kb to the number of columns factorized kb = n - k else ! factorize the leading columns of a using the lower triangle ! of a and working forwards, and compute the matrix w = l21*d ! for use in updating a22 (note that conjg(w) is actually stored) ! k is the main loop index, increasing from 1 in steps of 1 or 2 k = 1_${ik}$ 70 continue ! exit from loop: k>=nb is tested only when nb<n ! (NOTE(review): presumably because the pivot search uses column k+1 ! of w as scratch and w has nb columns - confirm against the caller); ! k>n means every column has been processed if( ( k>=nb .and. nb<n ) .or. k>n )go to 90 kstep = 1_${ik}$ ! copy column k of a to column k of w and update it ! (the diagonal entry is copied as a real number) w( k, k ) = real( a( k, k ),KIND=dp) if( k<n )call stdlib${ii}$_zcopy( n-k, a( k+1, k ), 1_${ik}$, w( k+1, k ), 1_${ik}$ ) call stdlib${ii}$_zgemv( 'NO TRANSPOSE', n-k+1, k-1, -cone, a( k, 1_${ik}$ ), lda,w( k, 1_${ik}$ ), ldw,& cone, w( k, k ), 1_${ik}$ ) w( k, k ) = real( w( k, k ),KIND=dp) ! determine rows and columns to be interchanged and whether ! a 1-by-1 or 2-by-2 pivot block will be used absakk = abs( real( w( k, k ),KIND=dp) ) ! imax is the row-index of the largest off-diagonal element in ! column k, and colmax is its magnitude as measured by cabs1. ! determine both colmax and imax. if( k<n ) then imax = k + stdlib${ii}$_izamax( n-k, w( k+1, k ), 1_${ik}$ ) colmax = cabs1( w( imax, k ) ) else colmax = zero end if if( max( absakk, colmax )==zero ) then ! column k is zero or underflow: set info (first occurrence only) ! and continue with a 1-by-1 step without interchange if( info==0_${ik}$ )info = k kp = k a( k, k ) = real( a( k, k ),KIND=dp) else ! ============================================================ ! begin pivot search ! case(1): the diagonal entry is at least alpha times the largest ! off-diagonal entry of column k if( absakk>=alpha*colmax ) then ! no interchange, use 1-by-1 pivot block kp = k else ! begin pivot search along imax row !
copy column imax to column k+1 of w and update it call stdlib${ii}$_zcopy( imax-k, a( imax, k ), lda, w( k, k+1 ), 1_${ik}$ ) call stdlib${ii}$_zlacgv( imax-k, w( k, k+1 ), 1_${ik}$ ) w( imax, k+1 ) = real( a( imax, imax ),KIND=dp) if( imax<n )call stdlib${ii}$_zcopy( n-imax, a( imax+1, imax ), 1_${ik}$,w( imax+1, k+1 ), & 1_${ik}$ ) call stdlib${ii}$_zgemv( 'NO TRANSPOSE', n-k+1, k-1, -cone, a( k, 1_${ik}$ ),lda, w( imax, & 1_${ik}$ ), ldw, cone, w( k, k+1 ),1_${ik}$ ) w( imax, k+1 ) = real( w( imax, k+1 ),KIND=dp) ! jmax is the column-index of the largest off-diagonal ! element in row imax, and rowmax is its magnitude (cabs1). ! determine only rowmax; jmax is just a scratch index here. jmax = k - 1_${ik}$ + stdlib${ii}$_izamax( imax-k, w( k, k+1 ), 1_${ik}$ ) rowmax = cabs1( w( jmax, k+1 ) ) if( imax<n ) then jmax = imax + stdlib${ii}$_izamax( n-imax, w( imax+1, k+1 ), 1_${ik}$ ) rowmax = max( rowmax, cabs1( w( jmax, k+1 ) ) ) end if ! case(2): same test as case(1) with the threshold scaled by ! colmax/rowmax if( absakk>=alpha*colmax*( colmax / rowmax ) ) then ! no interchange, use 1-by-1 pivot block kp = k ! case(3): the diagonal entry of column imax is at least ! alpha*rowmax else if( abs( real( w( imax, k+1 ),KIND=dp) )>=alpha*rowmax )then ! interchange rows and columns k and imax, use 1-by-1 ! pivot block kp = imax ! copy column k+1 of w to column k of w call stdlib${ii}$_zcopy( n-k+1, w( k, k+1 ), 1_${ik}$, w( k, k ), 1_${ik}$ ) ! case(4): none of the tests above holds else ! interchange rows and columns k+1 and imax, use 2-by-2 ! pivot block kp = imax kstep = 2_${ik}$ end if ! end pivot search along imax row end if ! end pivot search ! ============================================================ ! kk is the column of a where pivoting step stopped ! (kk = k for a 1-by-1 pivot, kk = k+1 for a 2-by-2 pivot) kk = k + kstep - 1_${ik}$ ! interchange rows and columns kp and kk. ! updated column kp is already stored in column kk of w. if( kp/=kk ) then ! copy non-updated column kk to column kp of submatrix a ! at step k. no need to copy element into column k ! (or k and k+1 for 2-by-2 pivot) of a, since these columns ! will be later overwritten. !
a( kp, kp ) = real( a( kk, kk ),KIND=dp) call stdlib${ii}$_zcopy( kp-kk-1, a( kk+1, kk ), 1_${ik}$, a( kp, kk+1 ),lda ) call stdlib${ii}$_zlacgv( kp-kk-1, a( kp, kk+1 ), lda ) if( kp<n )call stdlib${ii}$_zcopy( n-kp, a( kp+1, kk ), 1_${ik}$, a( kp+1, kp ), 1_${ik}$ ) ! interchange rows kk and kp in first k-1 columns of a ! (columns k (or k and k+1 for 2-by-2 pivot) of a will be ! later overwritten). interchange rows kk and kp ! in first kk columns of w. if( k>1_${ik}$ )call stdlib${ii}$_zswap( k-1, a( kk, 1_${ik}$ ), lda, a( kp, 1_${ik}$ ), lda ) call stdlib${ii}$_zswap( kk, w( kk, 1_${ik}$ ), ldw, w( kp, 1_${ik}$ ), ldw ) end if if( kstep==1_${ik}$ ) then ! 1-by-1 pivot block d(k): column k of w now holds ! w(k) = l(k)*d(k), ! where l(k) is the k-th column of l ! (1) store subdiag. elements of column l(k) ! and 1-by-1 block d(k) in column k of a. ! (note: diagonal element l(k,k) is a unit element ! and not stored) ! a(k,k) := d(k,k) = w(k,k) ! a(k+1:n,k) := l(k+1:n,k) = w(k+1:n,k)/d(k,k) ! (note: for a hermitian matrix there is no need to use ! a( k, k ) = real( w( k, k),KIND=dp) to separately copy diagonal ! element d(k,k) from w (potentially saves only one load)) call stdlib${ii}$_zcopy( n-k+1, w( k, k ), 1_${ik}$, a( k, k ), 1_${ik}$ ) if( k<n ) then ! (note: no need to check if a(k,k) is not zero, ! since that was ensured earlier in pivot search: ! case a(k,k) = 0 falls into 2x2 pivot case(4)) r1 = one / real( a( k, k ),KIND=dp) call stdlib${ii}$_zdscal( n-k, r1, a( k+1, k ), 1_${ik}$ ) ! (2) conjugate column w(k) call stdlib${ii}$_zlacgv( n-k, w( k+1, k ), 1_${ik}$ ) end if else ! 2-by-2 pivot block d(k): columns k and k+1 of w now hold ! ( w(k) w(k+1) ) = ( l(k) l(k+1) )*d(k) ! where l(k) and l(k+1) are the k-th and (k+1)-th columns ! of l ! (1) store l(k+2:n,k) and l(k+2:n,k+1) and 2-by-2 ! block d(k:k+1,k:k+1) in columns k and k+1 of a. ! (note: 2-by-2 diagonal block l(k:k+1,k:k+1) is a unit ! block and not stored) !
a(k:k+1,k:k+1) := d(k:k+1,k:k+1) = w(k:k+1,k:k+1) ! a(k+2:n,k:k+1) := l(k+2:n,k:k+1) = ! = w(k+2:n,k:k+1) * ( d(k:k+1,k:k+1)**(-1) ) if( k<n-1 ) then ! factor out the columns of the inverse of 2-by-2 pivot ! block d, so that each column contains 1, to reduce the ! number of flops when we multiply panel ! ( w(k) w(k+1) ) by this inverse, i.e. by d**(-1). ! d**(-1) = ( d11 cj(d21) )**(-1) = ! ( d21 d22 ) ! = 1/(d11*d22-|d21|**2) * ( ( d22) (-cj(d21) ) ) = ! ( (-d21) ( d11 ) ) ! = 1/(|d21|**2) * 1/((d11/cj(d21))*(d22/d21)-1) * ! * ( d21*( d22/d21 ) conj(d21)*( - 1 ) ) = ! ( ( -1 ) ( d11/conj(d21) ) ) ! = 1/(|d21|**2) * 1/(d22*d11-1) * ! * ( d21*( d11 ) conj(d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = (1/|d21|**2) * t * ( d21*( d11 ) conj(d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = ( (t/conj(d21))*( d11 ) (t/d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = ( conj(d21)*( d11 ) d21*( -1 ) ) ! ( ( -1 ) ( d22 ) ), ! where d11 = d22/d21, ! d22 = d11/conj(d21), ! d21 = t/d21, ! t = 1/(d22*d11-1). ! (NOTE(review): in the where-clause the names on the left appear to ! be the rescaled local variables and those on the right the entries ! of d; the code below reads them from w as d21 <- w(k+1,k), ! d11 <- w(k+1,k+1)/d21, d22 <- w(k,k)/conjg(d21).) ! (note: no need to check for division by zero, ! since that was ensured earlier in pivot search: ! (a) d21 != 0, since in 2x2 pivot case(4) ! |d21| should be larger than |d11| and |d22|; ! (b) (d22*d11 - 1) != 0, since from (a), ! both |d11| < 1, |d22| < 1, hence |d22*d11| << 1.) d21 = w( k+1, k ) d11 = w( k+1, k+1 ) / d21 d22 = w( k, k ) / conjg( d21 ) t = one / ( real( d11*d22,KIND=dp)-one ) d21 = t / d21 ! update elements in columns a(k) and a(k+1) as ! dot products of rows of ( w(k) w(k+1) ) and columns ! of d**(-1) do j = k + 2, n a( j, k ) = conjg( d21 )*( d11*w( j, k )-w( j, k+1 ) ) a( j, k+1 ) = d21*( d22*w( j, k+1 )-w( j, k ) ) end do end if ! copy d(k) to a (only the lower triangle of the 2-by-2 block) a( k, k ) = w( k, k ) a( k+1, k ) = w( k+1, k ) a( k+1, k+1 ) = w( k+1, k+1 ) ! (2) conjugate columns w(k) and w(k+1) call stdlib${ii}$_zlacgv( n-k, w( k+1, k ), 1_${ik}$ ) call stdlib${ii}$_zlacgv( n-k-1, w( k+2, k+1 ), 1_${ik}$ ) end if end if !
store details of the interchanges in ipiv if( kstep==1_${ik}$ ) then ipiv( k ) = kp else ipiv( k ) = -kp ipiv( k+1 ) = -kp end if ! increase k and return to the start of the main loop k = k + kstep go to 70 90 continue ! update the lower triangle of a22 (= a(k:n,k:n)) as ! a22 := a22 - l21*d*l21**h = a22 - l21*w**h ! computing blocks of nb columns at a time (note that conjg(w) is ! actually stored) do j = k, n, nb jb = min( nb, n-j+1 ) ! update the lower triangle of the diagonal block ! (the imaginary part of each diagonal entry is discarded before and ! after its column update) do jj = j, j + jb - 1 a( jj, jj ) = real( a( jj, jj ),KIND=dp) call stdlib${ii}$_zgemv( 'NO TRANSPOSE', j+jb-jj, k-1, -cone,a( jj, 1_${ik}$ ), lda, w( jj,& 1_${ik}$ ), ldw, cone,a( jj, jj ), 1_${ik}$ ) a( jj, jj ) = real( a( jj, jj ),KIND=dp) end do ! update the rectangular subdiagonal block if( j+jb<=n )call stdlib${ii}$_zgemm( 'NO TRANSPOSE', 'TRANSPOSE', n-j-jb+1, jb,k-1, -& cone, a( j+jb, 1_${ik}$ ), lda, w( j, 1_${ik}$ ),ldw, cone, a( j+jb, j ), lda ) end do ! put l21 in standard form by partially undoing the interchanges ! of rows in columns 1:k-1, stepping backwards from k-1 to 1 (the ! reverse of the order in which the columns were factorized) j = k - 1_${ik}$ 120 continue ! undo the interchanges (if any) of rows jj and jp at each ! step j ! (here, j is a diagonal index) jj = j jp = ipiv( j ) if( jp<0_${ik}$ ) then jp = -jp ! (here, j is a diagonal index) j = j - 1_${ik}$ end if ! (note: here, j is used to determine row length. length j ! of the rows to swap back doesn't include diagonal element) j = j - 1_${ik}$ if( jp/=jj .and. j>=1_${ik}$ )call stdlib${ii}$_zswap( j, a( jp, 1_${ik}$ ), lda, a( jj, 1_${ik}$ ), lda ) ! (a further pass starting at j = 1 could not swap anything, because j ! would drop below 1 after the decrement, so testing j>1 is sufficient) if( j>1 )go to 120 ! set kb to the number of columns factorized kb = k - 1_${ik}$ end if return end subroutine stdlib${ii}$_zlahef #:for ck,ct,ci in CMPLX_KINDS_TYPES #:if not ck in ["sp","dp"] pure module subroutine stdlib${ii}$_${ci}$lahef( uplo, n, nb, kb, a, lda, ipiv, w, ldw, info ) !! ZLAHEF: computes a partial factorization of a complex Hermitian !! matrix A using the Bunch-Kaufman diagonal pivoting method. The !!
partial factorization has the form: !! A = ( I U12 ) ( A11 0 ) ( I 0 ) if UPLO = 'U', or: !! ( 0 U22 ) ( 0 D ) ( U12**H U22**H ) !! A = ( L11 0 ) ( D 0 ) ( L11**H L21**H ) if UPLO = 'L' !! ( L21 I ) ( 0 A22 ) ( 0 I ) !! where the order of D is at most NB. The actual order is returned in !! the argument KB, and is either NB or NB-1, or N if N <= NB. !! Note that U**H denotes the conjugate transpose of U. !! ZLAHEF is an auxiliary routine called by ZHETRF. It uses blocked code !! (calling Level 3 BLAS) to update the submatrix A11 (if UPLO = 'U') or !! A22 (if UPLO = 'L'). ! -- lapack computational routine -- ! -- lapack is a software package provided by univ. of tennessee, -- ! -- univ. of california berkeley, univ. of colorado denver and nag ltd..-- use stdlib_blas_constants_${ck}$, only: negone, zero, half, one, two, three, four, eight, ten, czero, chalf, cone, cnegone ! Scalar Arguments character, intent(in) :: uplo integer(${ik}$), intent(out) :: info, kb integer(${ik}$), intent(in) :: lda, ldw, n, nb ! Array Arguments integer(${ik}$), intent(out) :: ipiv(*) complex(${ck}$), intent(inout) :: a(lda,*) complex(${ck}$), intent(out) :: w(ldw,*) ! ===================================================================== ! Parameters real(${ck}$), parameter :: sevten = 17.0e+0_${ck}$ ! Local Scalars integer(${ik}$) :: imax, j, jb, jj, jmax, jp, k, kk, kkw, kp, kstep, kw real(${ck}$) :: absakk, alpha, colmax, r1, rowmax, t complex(${ck}$) :: d11, d21, d22, z ! Intrinsic Functions ! Statement Functions real(${ck}$) :: cabs1 ! Statement Function Definitions cabs1( z ) = abs( real( z,KIND=${ck}$) ) + abs( aimag( z ) ) ! Executable Statements info = 0_${ik}$ ! initialize alpha for use in choosing pivot block size. alpha = ( one+sqrt( sevten ) ) / eight if( stdlib_lsame( uplo, 'U' ) ) then ! factorize the trailing columns of a using the upper triangle ! of a and working backwards, and compute the matrix w = u12*d ! 
for use in updating a11 (note that conjg(w) is actually stored) ! k is the main loop index, decreasing from n in steps of 1 or 2 ! kw is the column of w which corresponds to column k of a k = n 10 continue kw = nb + k - n ! exit from loop if( ( k<=n-nb+1 .and. nb<n ) .or. k<1 )go to 30 kstep = 1_${ik}$ ! copy column k of a to column kw of w and update it call stdlib${ii}$_${ci}$copy( k-1, a( 1_${ik}$, k ), 1_${ik}$, w( 1_${ik}$, kw ), 1_${ik}$ ) w( k, kw ) = real( a( k, k ),KIND=${ck}$) if( k<n ) then call stdlib${ii}$_${ci}$gemv( 'NO TRANSPOSE', k, n-k, -cone, a( 1_${ik}$, k+1 ), lda,w( k, kw+1 ), & ldw, cone, w( 1_${ik}$, kw ), 1_${ik}$ ) w( k, kw ) = real( w( k, kw ),KIND=${ck}$) end if ! determine rows and columns to be interchanged and whether ! a 1-by-1 or 2-by-2 pivot block will be used absakk = abs( real( w( k, kw ),KIND=${ck}$) ) ! imax is the row-index of the largest off-diagonal element in ! column k, and colmax is its absolute value. ! determine both colmax and imax. if( k>1_${ik}$ ) then imax = stdlib${ii}$_i${ci}$amax( k-1, w( 1_${ik}$, kw ), 1_${ik}$ ) colmax = cabs1( w( imax, kw ) ) else colmax = zero end if if( max( absakk, colmax )==zero ) then ! column k is zero or underflow: set info and continue if( info==0_${ik}$ )info = k kp = k a( k, k ) = real( a( k, k ),KIND=${ck}$) else ! ============================================================ ! begin pivot search ! case(1) if( absakk>=alpha*colmax ) then ! no interchange, use 1-by-1 pivot block kp = k else ! begin pivot search along imax row ! 
copy column imax to column kw-1 of w and update it call stdlib${ii}$_${ci}$copy( imax-1, a( 1_${ik}$, imax ), 1_${ik}$, w( 1_${ik}$, kw-1 ), 1_${ik}$ ) w( imax, kw-1 ) = real( a( imax, imax ),KIND=${ck}$) call stdlib${ii}$_${ci}$copy( k-imax, a( imax, imax+1 ), lda,w( imax+1, kw-1 ), 1_${ik}$ ) call stdlib${ii}$_${ci}$lacgv( k-imax, w( imax+1, kw-1 ), 1_${ik}$ ) if( k<n ) then call stdlib${ii}$_${ci}$gemv( 'NO TRANSPOSE', k, n-k, -cone,a( 1_${ik}$, k+1 ), lda, w( imax,& kw+1 ), ldw,cone, w( 1_${ik}$, kw-1 ), 1_${ik}$ ) w( imax, kw-1 ) = real( w( imax, kw-1 ),KIND=${ck}$) end if ! jmax is the column-index of the largest off-diagonal ! element in row imax, and rowmax is its absolute value. ! determine only rowmax. jmax = imax + stdlib${ii}$_i${ci}$amax( k-imax, w( imax+1, kw-1 ), 1_${ik}$ ) rowmax = cabs1( w( jmax, kw-1 ) ) if( imax>1_${ik}$ ) then jmax = stdlib${ii}$_i${ci}$amax( imax-1, w( 1_${ik}$, kw-1 ), 1_${ik}$ ) rowmax = max( rowmax, cabs1( w( jmax, kw-1 ) ) ) end if ! case(2) if( absakk>=alpha*colmax*( colmax / rowmax ) ) then ! no interchange, use 1-by-1 pivot block kp = k ! case(3) else if( abs( real( w( imax, kw-1 ),KIND=${ck}$) )>=alpha*rowmax )then ! interchange rows and columns k and imax, use 1-by-1 ! pivot block kp = imax ! copy column kw-1 of w to column kw of w call stdlib${ii}$_${ci}$copy( k, w( 1_${ik}$, kw-1 ), 1_${ik}$, w( 1_${ik}$, kw ), 1_${ik}$ ) ! case(4) else ! interchange rows and columns k-1 and imax, use 2-by-2 ! pivot block kp = imax kstep = 2_${ik}$ end if ! end pivot search along imax row end if ! end pivot search ! ============================================================ ! kk is the column of a where pivoting step stopped kk = k - kstep + 1_${ik}$ ! kkw is the column of w which corresponds to column kk of a kkw = nb + kk - n ! interchange rows and columns kp and kk. ! updated column kp is already stored in column kkw of w. if( kp/=kk ) then ! copy non-updated column kk to column kp of submatrix a ! at step k. 
no need to copy element into column k ! (or k and k-1 for 2-by-2 pivot) of a, since these columns ! will be later overwritten. a( kp, kp ) = real( a( kk, kk ),KIND=${ck}$) call stdlib${ii}$_${ci}$copy( kk-1-kp, a( kp+1, kk ), 1_${ik}$, a( kp, kp+1 ),lda ) call stdlib${ii}$_${ci}$lacgv( kk-1-kp, a( kp, kp+1 ), lda ) if( kp>1_${ik}$ )call stdlib${ii}$_${ci}$copy( kp-1, a( 1_${ik}$, kk ), 1_${ik}$, a( 1_${ik}$, kp ), 1_${ik}$ ) ! interchange rows kk and kp in last k+1 to n columns of a ! (columns k (or k and k-1 for 2-by-2 pivot) of a will be ! later overwritten). interchange rows kk and kp ! in last kkw to nb columns of w. if( k<n )call stdlib${ii}$_${ci}$swap( n-k, a( kk, k+1 ), lda, a( kp, k+1 ),lda ) call stdlib${ii}$_${ci}$swap( n-kk+1, w( kk, kkw ), ldw, w( kp, kkw ),ldw ) end if if( kstep==1_${ik}$ ) then ! 1-by-1 pivot block d(k): column kw of w now holds ! w(kw) = u(k)*d(k), ! where u(k) is the k-th column of u ! (1) store subdiag. elements of column u(k) ! and 1-by-1 block d(k) in column k of a. ! (note: diagonal element u(k,k) is a unit element ! and not stored) ! a(k,k) := d(k,k) = w(k,kw) ! a(1:k-1,k) := u(1:k-1,k) = w(1:k-1,kw)/d(k,k) ! (note: no need to use for hermitian matrix ! a( k, k ) = real( w( k, k),KIND=${ck}$) to separately copy diagonal ! element d(k,k) from w (potentially saves only one load)) call stdlib${ii}$_${ci}$copy( k, w( 1_${ik}$, kw ), 1_${ik}$, a( 1_${ik}$, k ), 1_${ik}$ ) if( k>1_${ik}$ ) then ! (note: no need to check if a(k,k) is not zero, ! since that was ensured earlier in pivot search: ! case a(k,k) = 0 falls into 2x2 pivot case(4)) r1 = one / real( a( k, k ),KIND=${ck}$) call stdlib${ii}$_${ci}$dscal( k-1, r1, a( 1_${ik}$, k ), 1_${ik}$ ) ! (2) conjugate column w(kw) call stdlib${ii}$_${ci}$lacgv( k-1, w( 1_${ik}$, kw ), 1_${ik}$ ) end if else ! 2-by-2 pivot block d(k): columns kw and kw-1 of w now hold ! ( w(kw-1) w(kw) ) = ( u(k-1) u(k) )*d(k) ! where u(k) and u(k-1) are the k-th and (k-1)-th columns ! of u ! 
(1) store u(1:k-2,k-1) and u(1:k-2,k) and 2-by-2 ! block d(k-1:k,k-1:k) in columns k-1 and k of a. ! (note: 2-by-2 diagonal block u(k-1:k,k-1:k) is a unit ! block and not stored) ! a(k-1:k,k-1:k) := d(k-1:k,k-1:k) = w(k-1:k,kw-1:kw) ! a(1:k-2,k-1:k) := u(1:k-2,k:k-1:k) = ! = w(1:k-2,kw-1:kw) * ( d(k-1:k,k-1:k)**(-1) ) if( k>2_${ik}$ ) then ! factor out the columns of the inverse of 2-by-2 pivot ! block d, so that each column contains 1, to reduce the ! number of flops when we multiply panel ! ( w(kw-1) w(kw) ) by this inverse, i.e. by d**(-1). ! d**(-1) = ( d11 cj(d21) )**(-1) = ! ( d21 d22 ) ! = 1/(d11*d22-|d21|**2) * ( ( d22) (-cj(d21) ) ) = ! ( (-d21) ( d11 ) ) ! = 1/(|d21|**2) * 1/((d11/cj(d21))*(d22/d21)-1) * ! * ( d21*( d22/d21 ) conj(d21)*( - 1 ) ) = ! ( ( -1 ) ( d11/conj(d21) ) ) ! = 1/(|d21|**2) * 1/(d22*d11-1) * ! * ( d21*( d11 ) conj(d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = (1/|d21|**2) * t * ( d21*( d11 ) conj(d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = ( (t/conj(d21))*( d11 ) (t/d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = ( conj(d21)*( d11 ) d21*( -1 ) ) ! ( ( -1 ) ( d22 ) ), ! where d11 = d22/d21, ! d22 = d11/conj(d21), ! d21 = t/d21, ! t = 1/(d22*d11-1). ! (note: no need to check for division by zero, ! since that was ensured earlier in pivot search: ! (a) d21 != 0, since in 2x2 pivot case(4) ! |d21| should be larger than |d11| and |d22|; ! (b) (d22*d11 - 1) != 0, since from (a), ! both |d11| < 1, |d22| < 1, hence |d22*d11| << 1.) d21 = w( k-1, kw ) d11 = w( k, kw ) / conjg( d21 ) d22 = w( k-1, kw-1 ) / d21 t = one / ( real( d11*d22,KIND=${ck}$)-one ) d21 = t / d21 ! update elements in columns a(k-1) and a(k) as ! dot products of rows of ( w(kw-1) w(kw) ) and columns ! of d**(-1) do j = 1, k - 2 a( j, k-1 ) = d21*( d11*w( j, kw-1 )-w( j, kw ) ) a( j, k ) = conjg( d21 )*( d22*w( j, kw )-w( j, kw-1 ) ) end do end if ! copy d(k) to a a( k-1, k-1 ) = w( k-1, kw-1 ) a( k-1, k ) = w( k-1, kw ) a( k, k ) = w( k, kw ) ! 
(2) conjugate columns w(kw) and w(kw-1) call stdlib${ii}$_${ci}$lacgv( k-1, w( 1_${ik}$, kw ), 1_${ik}$ ) call stdlib${ii}$_${ci}$lacgv( k-2, w( 1_${ik}$, kw-1 ), 1_${ik}$ ) end if end if ! store details of the interchanges in ipiv if( kstep==1_${ik}$ ) then ipiv( k ) = kp else ipiv( k ) = -kp ipiv( k-1 ) = -kp end if ! decrease k and return to the start of the main loop k = k - kstep go to 10 30 continue ! update the upper triangle of a11 (= a(1:k,1:k)) as ! a11 := a11 - u12*d*u12**h = a11 - u12*w**h ! computing blocks of nb columns at a time (note that conjg(w) is ! actually stored) do j = ( ( k-1 ) / nb )*nb + 1, 1, -nb jb = min( nb, k-j+1 ) ! update the upper triangle of the diagonal block do jj = j, j + jb - 1 a( jj, jj ) = real( a( jj, jj ),KIND=${ck}$) call stdlib${ii}$_${ci}$gemv( 'NO TRANSPOSE', jj-j+1, n-k, -cone,a( j, k+1 ), lda, w( jj,& kw+1 ), ldw, cone,a( j, jj ), 1_${ik}$ ) a( jj, jj ) = real( a( jj, jj ),KIND=${ck}$) end do ! update the rectangular superdiagonal block call stdlib${ii}$_${ci}$gemm( 'NO TRANSPOSE', 'TRANSPOSE', j-1, jb, n-k,-cone, a( 1_${ik}$, k+1 ), & lda, w( j, kw+1 ), ldw,cone, a( 1_${ik}$, j ), lda ) end do ! put u12 in standard form by partially undoing the interchanges ! in columns k+1:n looping backwards from k+1 to n j = k + 1_${ik}$ 60 continue ! undo the interchanges (if any) of rows jj and jp at each ! step j ! (here, j is a diagonal index) jj = j jp = ipiv( j ) if( jp<0_${ik}$ ) then jp = -jp ! (here, j is a diagonal index) j = j + 1_${ik}$ end if ! (note: here, j is used to determine row length. length n-j+1 ! of the rows to swap back doesn't include diagonal element) j = j + 1_${ik}$ if( jp/=jj .and. j<=n )call stdlib${ii}$_${ci}$swap( n-j+1, a( jp, j ), lda, a( jj, j ), & lda ) if( j<n )go to 60 ! set kb to the number of columns factorized kb = n - k else ! factorize the leading columns of a using the lower triangle ! of a and working forwards, and compute the matrix w = l21*d ! 
for use in updating a22 (note that conjg(w) is actually stored) ! k is the main loop index, increasing from 1 in steps of 1 or 2 k = 1_${ik}$ 70 continue ! exit from loop if( ( k>=nb .and. nb<n ) .or. k>n )go to 90 kstep = 1_${ik}$ ! copy column k of a to column k of w and update it w( k, k ) = real( a( k, k ),KIND=${ck}$) if( k<n )call stdlib${ii}$_${ci}$copy( n-k, a( k+1, k ), 1_${ik}$, w( k+1, k ), 1_${ik}$ ) call stdlib${ii}$_${ci}$gemv( 'NO TRANSPOSE', n-k+1, k-1, -cone, a( k, 1_${ik}$ ), lda,w( k, 1_${ik}$ ), ldw,& cone, w( k, k ), 1_${ik}$ ) w( k, k ) = real( w( k, k ),KIND=${ck}$) ! determine rows and columns to be interchanged and whether ! a 1-by-1 or 2-by-2 pivot block will be used absakk = abs( real( w( k, k ),KIND=${ck}$) ) ! imax is the row-index of the largest off-diagonal element in ! column k, and colmax is its absolute value. ! determine both colmax and imax. if( k<n ) then imax = k + stdlib${ii}$_i${ci}$amax( n-k, w( k+1, k ), 1_${ik}$ ) colmax = cabs1( w( imax, k ) ) else colmax = zero end if if( max( absakk, colmax )==zero ) then ! column k is zero or underflow: set info and continue if( info==0_${ik}$ )info = k kp = k a( k, k ) = real( a( k, k ),KIND=${ck}$) else ! ============================================================ ! begin pivot search ! case(1) if( absakk>=alpha*colmax ) then ! no interchange, use 1-by-1 pivot block kp = k else ! begin pivot search along imax row ! copy column imax to column k+1 of w and update it call stdlib${ii}$_${ci}$copy( imax-k, a( imax, k ), lda, w( k, k+1 ), 1_${ik}$ ) call stdlib${ii}$_${ci}$lacgv( imax-k, w( k, k+1 ), 1_${ik}$ ) w( imax, k+1 ) = real( a( imax, imax ),KIND=${ck}$) if( imax<n )call stdlib${ii}$_${ci}$copy( n-imax, a( imax+1, imax ), 1_${ik}$,w( imax+1, k+1 ), & 1_${ik}$ ) call stdlib${ii}$_${ci}$gemv( 'NO TRANSPOSE', n-k+1, k-1, -cone, a( k, 1_${ik}$ ),lda, w( imax, & 1_${ik}$ ), ldw, cone, w( k, k+1 ),1_${ik}$ ) w( imax, k+1 ) = real( w( imax, k+1 ),KIND=${ck}$) ! 
jmax is the column-index of the largest off-diagonal ! element in row imax, and rowmax is its absolute value. ! determine only rowmax. jmax = k - 1_${ik}$ + stdlib${ii}$_i${ci}$amax( imax-k, w( k, k+1 ), 1_${ik}$ ) rowmax = cabs1( w( jmax, k+1 ) ) if( imax<n ) then jmax = imax + stdlib${ii}$_i${ci}$amax( n-imax, w( imax+1, k+1 ), 1_${ik}$ ) rowmax = max( rowmax, cabs1( w( jmax, k+1 ) ) ) end if ! case(2) if( absakk>=alpha*colmax*( colmax / rowmax ) ) then ! no interchange, use 1-by-1 pivot block kp = k ! case(3) else if( abs( real( w( imax, k+1 ),KIND=${ck}$) )>=alpha*rowmax )then ! interchange rows and columns k and imax, use 1-by-1 ! pivot block kp = imax ! copy column k+1 of w to column k of w call stdlib${ii}$_${ci}$copy( n-k+1, w( k, k+1 ), 1_${ik}$, w( k, k ), 1_${ik}$ ) ! case(4) else ! interchange rows and columns k+1 and imax, use 2-by-2 ! pivot block kp = imax kstep = 2_${ik}$ end if ! end pivot search along imax row end if ! end pivot search ! ============================================================ ! kk is the column of a where pivoting step stopped kk = k + kstep - 1_${ik}$ ! interchange rows and columns kp and kk. ! updated column kp is already stored in column kk of w. if( kp/=kk ) then ! copy non-updated column kk to column kp of submatrix a ! at step k. no need to copy element into column k ! (or k and k+1 for 2-by-2 pivot) of a, since these columns ! will be later overwritten. a( kp, kp ) = real( a( kk, kk ),KIND=${ck}$) call stdlib${ii}$_${ci}$copy( kp-kk-1, a( kk+1, kk ), 1_${ik}$, a( kp, kk+1 ),lda ) call stdlib${ii}$_${ci}$lacgv( kp-kk-1, a( kp, kk+1 ), lda ) if( kp<n )call stdlib${ii}$_${ci}$copy( n-kp, a( kp+1, kk ), 1_${ik}$, a( kp+1, kp ), 1_${ik}$ ) ! interchange rows kk and kp in first k-1 columns of a ! (columns k (or k and k+1 for 2-by-2 pivot) of a will be ! later overwritten). interchange rows kk and kp ! in first kk columns of w. 
if( k>1_${ik}$ )call stdlib${ii}$_${ci}$swap( k-1, a( kk, 1_${ik}$ ), lda, a( kp, 1_${ik}$ ), lda ) call stdlib${ii}$_${ci}$swap( kk, w( kk, 1_${ik}$ ), ldw, w( kp, 1_${ik}$ ), ldw ) end if if( kstep==1_${ik}$ ) then ! 1-by-1 pivot block d(k): column k of w now holds ! w(k) = l(k)*d(k), ! where l(k) is the k-th column of l ! (1) store subdiag. elements of column l(k) ! and 1-by-1 block d(k) in column k of a. ! (note: diagonal element l(k,k) is a unit element ! and not stored) ! a(k,k) := d(k,k) = w(k,k) ! a(k+1:n,k) := l(k+1:n,k) = w(k+1:n,k)/d(k,k) ! (note: no need to use for hermitian matrix ! a( k, k ) = real( w( k, k),KIND=${ck}$) to separately copy diagonal ! element d(k,k) from w (potentially saves only one load)) call stdlib${ii}$_${ci}$copy( n-k+1, w( k, k ), 1_${ik}$, a( k, k ), 1_${ik}$ ) if( k<n ) then ! (note: no need to check if a(k,k) is not zero, ! since that was ensured earlier in pivot search: ! case a(k,k) = 0 falls into 2x2 pivot case(4)) r1 = one / real( a( k, k ),KIND=${ck}$) call stdlib${ii}$_${ci}$dscal( n-k, r1, a( k+1, k ), 1_${ik}$ ) ! (2) conjugate column w(k) call stdlib${ii}$_${ci}$lacgv( n-k, w( k+1, k ), 1_${ik}$ ) end if else ! 2-by-2 pivot block d(k): columns k and k+1 of w now hold ! ( w(k) w(k+1) ) = ( l(k) l(k+1) )*d(k) ! where l(k) and l(k+1) are the k-th and (k+1)-th columns ! of l ! (1) store l(k+2:n,k) and l(k+2:n,k+1) and 2-by-2 ! block d(k:k+1,k:k+1) in columns k and k+1 of a. ! (note: 2-by-2 diagonal block l(k:k+1,k:k+1) is a unit ! block and not stored) ! a(k:k+1,k:k+1) := d(k:k+1,k:k+1) = w(k:k+1,k:k+1) ! a(k+2:n,k:k+1) := l(k+2:n,k:k+1) = ! = w(k+2:n,k:k+1) * ( d(k:k+1,k:k+1)**(-1) ) if( k<n-1 ) then ! factor out the columns of the inverse of 2-by-2 pivot ! block d, so that each column contains 1, to reduce the ! number of flops when we multiply panel ! ( w(kw-1) w(kw) ) by this inverse, i.e. by d**(-1). ! d**(-1) = ( d11 cj(d21) )**(-1) = ! ( d21 d22 ) ! = 1/(d11*d22-|d21|**2) * ( ( d22) (-cj(d21) ) ) = ! 
( (-d21) ( d11 ) ) ! = 1/(|d21|**2) * 1/((d11/cj(d21))*(d22/d21)-1) * ! * ( d21*( d22/d21 ) conj(d21)*( - 1 ) ) = ! ( ( -1 ) ( d11/conj(d21) ) ) ! = 1/(|d21|**2) * 1/(d22*d11-1) * ! * ( d21*( d11 ) conj(d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = (1/|d21|**2) * t * ( d21*( d11 ) conj(d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = ( (t/conj(d21))*( d11 ) (t/d21)*( -1 ) ) = ! ( ( -1 ) ( d22 ) ) ! = ( conj(d21)*( d11 ) d21*( -1 ) ) ! ( ( -1 ) ( d22 ) ), ! where d11 = d22/d21, ! d22 = d11/conj(d21), ! d21 = t/d21, ! t = 1/(d22*d11-1). ! (note: no need to check for division by zero, ! since that was ensured earlier in pivot search: ! (a) d21 != 0, since in 2x2 pivot case(4) ! |d21| should be larger than |d11| and |d22|; ! (b) (d22*d11 - 1) != 0, since from (a), ! both |d11| < 1, |d22| < 1, hence |d22*d11| << 1.) d21 = w( k+1, k ) d11 = w( k+1, k+1 ) / d21 d22 = w( k, k ) / conjg( d21 ) t = one / ( real( d11*d22,KIND=${ck}$)-one ) d21 = t / d21 ! update elements in columns a(k) and a(k+1) as ! dot products of rows of ( w(k) w(k+1) ) and columns ! of d**(-1) do j = k + 2, n a( j, k ) = conjg( d21 )*( d11*w( j, k )-w( j, k+1 ) ) a( j, k+1 ) = d21*( d22*w( j, k+1 )-w( j, k ) ) end do end if ! copy d(k) to a a( k, k ) = w( k, k ) a( k+1, k ) = w( k+1, k ) a( k+1, k+1 ) = w( k+1, k+1 ) ! (2) conjugate columns w(k) and w(k+1) call stdlib${ii}$_${ci}$lacgv( n-k, w( k+1, k ), 1_${ik}$ ) call stdlib${ii}$_${ci}$lacgv( n-k-1, w( k+2, k+1 ), 1_${ik}$ ) end if end if ! store details of the interchanges in ipiv if( kstep==1_${ik}$ ) then ipiv( k ) = kp else ipiv( k ) = -kp ipiv( k+1 ) = -kp end if ! increase k and return to the start of the main loop k = k + kstep go to 70 90 continue ! update the lower triangle of a22 (= a(k:n,k:n)) as ! a22 := a22 - l21*d*l21**h = a22 - l21*w**h ! computing blocks of nb columns at a time (note that conjg(w) is ! actually stored) do j = k, n, nb jb = min( nb, n-j+1 ) ! 
! update the lower triangle of the diagonal block
                 do jj = j, j + jb - 1
                    a( jj, jj ) = real( a( jj, jj ),KIND=${ck}$)
                    call stdlib${ii}$_${ci}$gemv( 'NO TRANSPOSE', j+jb-jj, k-1, -cone,a( jj, 1_${ik}$ ), lda, w( jj,&
                              1_${ik}$ ), ldw, cone,a( jj, jj ), 1_${ik}$ )
                    a( jj, jj ) = real( a( jj, jj ),KIND=${ck}$)
                 end do
                 ! update the rectangular subdiagonal block
                 if( j+jb<=n )call stdlib${ii}$_${ci}$gemm( 'NO TRANSPOSE', 'TRANSPOSE', n-j-jb+1, jb,k-1, -&
                           cone, a( j+jb, 1_${ik}$ ), lda, w( j, 1_${ik}$ ),ldw, cone, a( j+jb, j ), lda )
              end do
              ! put l21 in standard form by partially undoing the interchanges
              ! of rows in columns 1:k-1 looping backwards from k-1 to 1
              j = k - 1_${ik}$
              120 continue
                 ! undo the interchanges (if any) of rows jj and jp at each
                 ! step j
                 ! (here, j is a diagonal index)
                 jj = j
                 jp = ipiv( j )
                 if( jp<0_${ik}$ ) then
                    jp = -jp
                    ! (here, j is a diagonal index)
                    j = j - 1_${ik}$
                 end if
                 ! (note: here, j is used to determine row length. length j
                 ! of the rows to swap back doesn't include diagonal element)
                 j = j - 1_${ik}$
                 if( jp/=jj .and. j>=1_${ik}$ )call stdlib${ii}$_${ci}$swap( j, a( jp, 1_${ik}$ ), lda, a( jj, 1_${ik}$ ), lda )
              if( j>1 )go to 120
              ! set kb to the number of columns factorized
              kb = k - 1_${ik}$
           end if
           return
     end subroutine stdlib${ii}$_${ci}$lahef

#:endif
#:endfor

     pure module subroutine stdlib${ii}$_chetf2( uplo, n, a, lda, ipiv, info )
     !! CHETF2 factorizes a complex Hermitian matrix A by the Bunch-Kaufman
     !! diagonal pivoting method:
     !!    A = U*D*U**H  or  A = L*D*L**H
     !! Here U (or L) is a product of permutation and unit upper (lower)
     !! triangular matrices, U**H is the conjugate transpose of U, and D is
     !! Hermitian and block diagonal with 1-by-1 and 2-by-2 diagonal blocks.
     !! This is the unblocked variant, built on Level 2 BLAS calls.
     !! UPLO ('U' or 'L') selects which triangle of A is factorized in place.
     !! IPIV(k) = kp records a 1-by-1 pivot taken from row/column kp; for a
     !! 2-by-2 pivot both IPIV entries of the block are set to -kp.
     !! INFO = 0 on success, -1/-2/-4 when UPLO/N/LDA is invalid, and k > 0
     !! for the first column k whose pivot column is exactly zero or whose
     !! diagonal entry is a NaN.
        ! -- lapack computational routine --
        ! -- lapack is a software package provided by univ. of tennessee,    --
        ! -- univ. of california berkeley, univ. of colorado denver and nag ltd..--
           use stdlib_blas_constants_sp, only: negone, zero, half, one, two, three, four, eight, &
                     ten, czero, chalf, cone, cnegone
           ! Scalar Arguments
           character, intent(in) :: uplo
           integer(${ik}$), intent(out) :: info
           integer(${ik}$), intent(in) :: lda, n
           ! Array Arguments
           integer(${ik}$), intent(out) :: ipiv(*)
           complex(sp), intent(inout) :: a(lda,*)
        ! =====================================================================
           ! Parameters
           real(sp), parameter :: sevten = 17.0e+0_sp
           ! Local Scalars
           logical(lk) :: upper
           integer(${ik}$) :: i, ipk, j, jpk, k, kdst, kpiv, bsize
           real(sp) :: diag_abs, alpha, col_peak, scl, d11, d22, rdiag, dinv, row_peak, tinv
           complex(sp) :: d12, d21, ztmp, wcol, wprev, wnext, zarg
           ! Statement Functions
           real(sp) :: cabs1
           ! Statement Function Definitions
           ! cabs1 is the 1-norm style magnitude |re| + |im| of a complex value
           cabs1( zarg ) = abs( real( zarg,KIND=sp) ) + abs( aimag( zarg ) )
           ! Executable Statements
           ! validate the arguments; the first offending one determines info
           upper = stdlib_lsame( uplo, 'U' )
           info = 0_${ik}$
           if( .not.( upper .or. stdlib_lsame( uplo, 'L' ) ) ) then
              info = -1_${ik}$
           else if( n<0_${ik}$ ) then
              info = -2_${ik}$
           else if( lda<max( 1_${ik}$, n ) ) then
              info = -4_${ik}$
           end if
           if( info/=0_${ik}$ ) then
              call stdlib${ii}$_xerbla( 'CHETF2', -info )
              return
           end if
           ! threshold used to decide between 1-by-1 and 2-by-2 pivot blocks
           alpha = ( one+sqrt( sevten ) ) / eight
           if( upper ) then
              ! u*d*u**h from the upper triangle: k runs from n down to 1 and
              ! each pass consumes bsize (1 or 2) columns
              k = n
              do while( k>=1_${ik}$ )
                 bsize = 1_${ik}$
                 ! magnitude of the diagonal candidate
                 diag_abs = abs( real( a( k, k ),KIND=sp) )
                 ! ipk: row of the largest off-diagonal entry of column k,
                 ! col_peak: its magnitude
                 if( k>1_${ik}$ ) then
                    ipk = stdlib${ii}$_icamax( k-1, a( 1_${ik}$, k ), 1_${ik}$ )
                    col_peak = cabs1( a( ipk, k ) )
                 else
                    col_peak = zero
                 end if
                 if( (max( diag_abs, col_peak )==zero) .or. stdlib${ii}$_sisnan(diag_abs) ) then
                    ! column k is zero or underflow, or its diagonal is a nan:
                    ! remember the first such column in info and move on
                    if( info==0_${ik}$ )info = k
                    kpiv = k
                    a( k, k ) = real( a( k, k ),KIND=sp)
                 else
                    if( diag_abs>=alpha*col_peak ) then
                       ! diagonal is large enough: 1-by-1 block, no interchange
                       kpiv = k
                    else
                       ! row_peak: largest off-diagonal magnitude in row ipk
                       ! (jpk is only a scratch index for locating it)
                       jpk = ipk + stdlib${ii}$_icamax( k-ipk, a( ipk, ipk+1 ), lda )
                       row_peak = cabs1( a( ipk, jpk ) )
                       if( ipk>1_${ik}$ ) then
                          jpk = stdlib${ii}$_icamax( ipk-1, a( 1_${ik}$, ipk ), 1_${ik}$ )
                          row_peak = max( row_peak, cabs1( a( jpk, ipk ) ) )
                       end if
                       if( diag_abs>=alpha*col_peak*( col_peak / row_peak ) ) then
                          ! 1-by-1 block, no interchange
                          kpiv = k
                       else
                          ! pivot comes from row/column ipk; it is a 1-by-1
                          ! block (swap with k) when a(ipk,ipk) dominates its
                          ! row, otherwise a 2-by-2 block (swap with k-1)
                          kpiv = ipk
                          if( .not.( abs( real( a( ipk, ipk ),KIND=sp) )>=alpha*row_peak ) ) bsize = 2_${ik}$
                       end if
                    end if
                    ! kdst is the row/column that trades places with kpiv
                    kdst = k - bsize + 1_${ik}$
                    if( kpiv/=kdst ) then
                       ! symmetric interchange of kdst and kpiv inside the
                       ! leading submatrix a(1:k,1:k)
                       call stdlib${ii}$_cswap( kpiv-1, a( 1_${ik}$, kdst ), 1_${ik}$, a( 1_${ik}$, kpiv ), 1_${ik}$ )
                       do j = kpiv + 1, kdst - 1
                          ztmp = conjg( a( j, kdst ) )
                          a( j, kdst ) = conjg( a( kpiv, j ) )
                          a( kpiv, j ) = ztmp
                       end do
                       a( kpiv, kdst ) = conjg( a( kpiv, kdst ) )
                       rdiag = real( a( kdst, kdst ),KIND=sp)
                       a( kdst, kdst ) = real( a( kpiv, kpiv ),KIND=sp)
                       a( kpiv, kpiv ) = rdiag
                       if( bsize==2_${ik}$ ) then
                          a( k, k ) = real( a( k, k ),KIND=sp)
                          ztmp = a( k-1, k )
                          a( k-1, k ) = a( kpiv, k )
                          a( kpiv, k ) = ztmp
                       end if
                    else
                       ! no interchange: only force the pivot diagonal real
                       a( k, k ) = real( a( k, k ),KIND=sp)
                       if( bsize==2_${ik}$ )a( k-1, k-1 ) = real( a( k-1, k-1 ),KIND=sp)
                    end if
                    ! update the leading submatrix
                    if( bsize==1_${ik}$ ) then
                       ! 1-by-1 block d(k): column k holds w(k) = u(k)*d(k);
                       ! rank-1 update a := a - w(k)*(1/d(k))*w(k)**h
                       dinv = one / real( a( k, k ),KIND=sp)
                       call stdlib${ii}$_cher( uplo, k-1, -dinv, a( 1_${ik}$, k ), 1_${ik}$, a, lda )
                       ! scale w(k) into u(k), stored in column k
                       call stdlib${ii}$_csscal( k-1, dinv, a( 1_${ik}$, k ), 1_${ik}$ )
                    else if( k>2_${ik}$ ) then
                       ! 2-by-2 block d(k): columns k-1 and k hold
                       ! ( w(k-1) w(k) ) = ( u(k-1) u(k) )*d(k);
                       ! rank-2 update of a(1:k-2,1:k-2) as
                       ! a := a - ( w(k-1) w(k) )*inv(d(k))*( w(k-1) w(k) )**h
                       scl = stdlib${ii}$_slapy2( real( a( k-1, k ),KIND=sp),aimag( a( k-1, k ) ) )
                       d22 = real( a( k-1, k-1 ),KIND=sp) / scl
                       d11 = real( a( k, k ),KIND=sp) / scl
                       tinv = one / ( d11*d22-one )
                       d12 = a( k-1, k ) / scl
                       scl = tinv / scl
                       ! j must run downwards: rows above j of columns k-1 and
                       ! k are still needed unscaled by later iterations
                       do j = k - 2, 1, -1
                          wprev = scl*( d11*a( j, k-1 )-conjg( d12 )*a( j, k ) )
                          wcol = scl*( d22*a( j, k )-d12*a( j, k-1 ) )
                          do i = j, 1, -1
                             a( i, j ) = a( i, j ) - a( i, k )*conjg( wcol ) -a( i, k-1 )*conjg( &
                                       wprev )
                          end do
                          a( j, k ) = wcol
                          a( j, k-1 ) = wprev
                          a( j, j ) = cmplx( real( a( j, j ),KIND=sp), zero,KIND=sp)
                       end do
                    end if
                 end if
                 ! record the interchange: kpiv for a 1-by-1 block, -kpiv in
                 ! both entries for a 2-by-2 block
                 if( bsize==1_${ik}$ ) then
                    ipiv( k ) = kpiv
                 else
                    ipiv( k ) = -kpiv
                    ipiv( k-1 ) = -kpiv
                 end if
                 k = k - bsize
              end do
           else
              ! l*d*l**h from the lower triangle: k runs from 1 up to n and
              ! each pass consumes bsize (1 or 2) columns
              k = 1_${ik}$
              do while( k<=n )
                 bsize = 1_${ik}$
                 ! magnitude of the diagonal candidate
                 diag_abs = abs( real( a( k, k ),KIND=sp) )
                 ! ipk: row of the largest off-diagonal entry of column k,
                 ! col_peak: its magnitude
                 if( k<n ) then
                    ipk = k + stdlib${ii}$_icamax( n-k, a( k+1, k ), 1_${ik}$ )
                    col_peak = cabs1( a( ipk, k ) )
                 else
                    col_peak = zero
                 end if
                 if( (max( diag_abs, col_peak )==zero) .or. stdlib${ii}$_sisnan(diag_abs) ) then
                    ! column k is zero or underflow, or its diagonal is a nan:
                    ! remember the first such column in info and move on
                    if( info==0_${ik}$ )info = k
                    kpiv = k
                    a( k, k ) = real( a( k, k ),KIND=sp)
                 else
                    if( diag_abs>=alpha*col_peak ) then
                       ! diagonal is large enough: 1-by-1 block, no interchange
                       kpiv = k
                    else
                       ! row_peak: largest off-diagonal magnitude in row ipk
                       ! (jpk is only a scratch index for locating it)
                       jpk = k - 1_${ik}$ + stdlib${ii}$_icamax( ipk-k, a( ipk, k ), lda )
                       row_peak = cabs1( a( ipk, jpk ) )
                       if( ipk<n ) then
                          jpk = ipk + stdlib${ii}$_icamax( n-ipk, a( ipk+1, ipk ), 1_${ik}$ )
                          row_peak = max( row_peak, cabs1( a( jpk, ipk ) ) )
                       end if
                       if( diag_abs>=alpha*col_peak*( col_peak / row_peak ) ) then
                          ! 1-by-1 block, no interchange
                          kpiv = k
                       else
                          ! pivot comes from row/column ipk; it is a 1-by-1
                          ! block (swap with k) when a(ipk,ipk) dominates its
                          ! row, otherwise a 2-by-2 block (swap with k+1)
                          kpiv = ipk
                          if( .not.( abs( real( a( ipk, ipk ),KIND=sp) )>=alpha*row_peak ) ) bsize = 2_${ik}$
                       end if
                    end if
                    ! kdst is the row/column that trades places with kpiv
                    kdst = k + bsize - 1_${ik}$
                    if( kpiv/=kdst ) then
                       ! symmetric interchange of kdst and kpiv inside the
                       ! trailing submatrix a(k:n,k:n)
                       if( kpiv<n )call stdlib${ii}$_cswap( n-kpiv, a( kpiv+1, kdst ), 1_${ik}$, a( kpiv+1, kpiv ), 1_${ik}$ )
                       do j = kdst + 1, kpiv - 1
                          ztmp = conjg( a( j, kdst ) )
                          a( j, kdst ) = conjg( a( kpiv, j ) )
                          a( kpiv, j ) = ztmp
                       end do
                       a( kpiv, kdst ) = conjg( a( kpiv, kdst ) )
                       rdiag = real( a( kdst, kdst ),KIND=sp)
                       a( kdst, kdst ) = real( a( kpiv, kpiv ),KIND=sp)
                       a( kpiv, kpiv ) = rdiag
                       if( bsize==2_${ik}$ ) then
                          a( k, k ) = real( a( k, k ),KIND=sp)
                          ztmp = a( k+1, k )
                          a( k+1, k ) = a( kpiv, k )
                          a( kpiv, k ) = ztmp
                       end if
                    else
                       ! no interchange: only force the pivot diagonal real
                       a( k, k ) = real( a( k, k ),KIND=sp)
                       if( bsize==2_${ik}$ )a( k+1, k+1 ) = real( a( k+1, k+1 ),KIND=sp)
                    end if
                    ! update the trailing submatrix
                    if( bsize==1_${ik}$ ) then
                       ! 1-by-1 block d(k): column k holds w(k) = l(k)*d(k)
                       if( k<n ) then
                          ! rank-1 update of a(k+1:n,k+1:n) as
                          ! a := a - w(k)*(1/d(k))*w(k)**h
                          dinv = one / real( a( k, k ),KIND=sp)
                          call stdlib${ii}$_cher( uplo, n-k, -dinv, a( k+1, k ), 1_${ik}$,a( k+1, k+1 ), lda )
                          ! scale w(k) into l(k), stored in column k
                          call stdlib${ii}$_csscal( n-k, dinv, a( k+1, k ), 1_${ik}$ )
                       end if
                    else if( k<n-1 ) then
                       ! 2-by-2 block d(k): rank-2 update of a(k+2:n,k+2:n) as
                       ! a := a - ( w(k) w(k+1) )*inv(d(k))*( w(k) w(k+1) )**h
                       ! where l(k) and l(k+1) are the k-th and (k+1)-th
                       ! columns of l
                       scl = stdlib${ii}$_slapy2( real( a( k+1, k ),KIND=sp),aimag( a( k+1, k ) ) )
                       d11 = real( a( k+1, k+1 ),KIND=sp) / scl
                       d22 = real( a( k, k ),KIND=sp) / scl
                       tinv = one / ( d11*d22-one )
                       d21 = a( k+1, k ) / scl
                       scl = tinv / scl
                       do j = k + 2, n
                          wcol = scl*( d11*a( j, k )-d21*a( j, k+1 ) )
                          wnext = scl*( d22*a( j, k+1 )-conjg( d21 )*a( j, k ) )
                          do i = j, n
                             a( i, j ) = a( i, j ) - a( i, k )*conjg( wcol ) -a( i, k+1 )*conjg( &
                                       wnext )
                          end do
                          a( j, k ) = wcol
                          a( j, k+1 ) = wnext
                          a( j, j ) = cmplx( real( a( j, j ),KIND=sp), zero,KIND=sp)
                       end do
                    end if
                 end if
                 ! record the interchange: kpiv for a 1-by-1 block, -kpiv in
                 ! both entries for a 2-by-2 block
                 if( bsize==1_${ik}$ ) then
                    ipiv( k ) = kpiv
                 else
                    ipiv( k ) = -kpiv
                    ipiv( k+1 ) = -kpiv
                 end if
                 k = k + bsize
              end do
           end if
     end subroutine stdlib${ii}$_chetf2

     pure module subroutine stdlib${ii}$_zhetf2( uplo, n, a, lda, ipiv, info )
     !! ZHETF2 computes the factorization of a complex Hermitian matrix A
     !! using the Bunch-Kaufman diagonal pivoting method:
     !! A = U*D*U**H or A = L*D*L**H
     !! where U (or L) is a product of permutation and unit upper (lower)
     !! triangular matrices, U**H is the conjugate transpose of U, and D is
     !! Hermitian and block diagonal with 1-by-1 and 2-by-2 diagonal blocks.
     !! This is the unblocked version of the algorithm, calling Level 2 BLAS.
        ! -- lapack computational routine --
        !
-- lapack is a software package provided by univ. of tennessee, -- ! -- univ. of california berkeley, univ. of colorado denver and nag ltd..-- use stdlib_blas_constants_dp, only: negone, zero, half, one, two, three, four, eight, ten, czero, chalf, cone, cnegone ! Scalar Arguments character, intent(in) :: uplo integer(${ik}$), intent(out) :: info integer(${ik}$), intent(in) :: lda, n ! Array Arguments integer(${ik}$), intent(out) :: ipiv(*) complex(dp), intent(inout) :: a(lda,*) ! ===================================================================== ! Parameters real(dp), parameter :: sevten = 17.0e+0_dp ! Local Scalars logical(lk) :: upper integer(${ik}$) :: i, imax, j, jmax, k, kk, kp, kstep real(dp) :: absakk, alpha, colmax, d, d11, d22, r1, rowmax, tt complex(dp) :: d12, d21, t, wk, wkm1, wkp1, zdum ! Intrinsic Functions ! Statement Functions real(dp) :: cabs1 ! Statement Function Definitions cabs1( zdum ) = abs( real( zdum,KIND=dp) ) + abs( aimag( zdum ) ) ! Executable Statements ! test the input parameters. info = 0_${ik}$ upper = stdlib_lsame( uplo, 'U' ) if( .not.upper .and. .not.stdlib_lsame( uplo, 'L' ) ) then info = -1_${ik}$ else if( n<0_${ik}$ ) then info = -2_${ik}$ else if( lda<max( 1_${ik}$, n ) ) then info = -4_${ik}$ end if if( info/=0_${ik}$ ) then call stdlib${ii}$_xerbla( 'ZHETF2', -info ) return end if ! initialize alpha for use in choosing pivot block size. alpha = ( one+sqrt( sevten ) ) / eight if( upper ) then ! factorize a as u*d*u**h using the upper triangle of a ! k is the main loop index, decreasing from n to 1 in steps of ! 1 or 2 k = n 10 continue ! if k < 1, exit from loop if( k<1 )go to 90 kstep = 1_${ik}$ ! determine rows and columns to be interchanged and whether ! a 1-by-1 or 2-by-2 pivot block will be used absakk = abs( real( a( k, k ),KIND=dp) ) ! imax is the row-index of the largest off-diagonal element in ! column k, and colmax is its absolute value. ! determine both colmax and imax. 
if( k>1_${ik}$ ) then imax = stdlib${ii}$_izamax( k-1, a( 1_${ik}$, k ), 1_${ik}$ ) colmax = cabs1( a( imax, k ) ) else colmax = zero end if if( (max( absakk, colmax )==zero) .or. stdlib${ii}$_disnan(absakk) ) then ! column k is zero or underflow, or contains a nan: ! set info and continue if( info==0_${ik}$ )info = k kp = k a( k, k ) = real( a( k, k ),KIND=dp) else ! ============================================================ ! test for interchange if( absakk>=alpha*colmax ) then ! no interchange, use 1-by-1 pivot block kp = k else ! jmax is the column-index of the largest off-diagonal ! element in row imax, and rowmax is its absolute value. ! determine only rowmax. jmax = imax + stdlib${ii}$_izamax( k-imax, a( imax, imax+1 ), lda ) rowmax = cabs1( a( imax, jmax ) ) if( imax>1_${ik}$ ) then jmax = stdlib${ii}$_izamax( imax-1, a( 1_${ik}$, imax ), 1_${ik}$ ) rowmax = max( rowmax, cabs1( a( jmax, imax ) ) ) end if if( absakk>=alpha*colmax*( colmax / rowmax ) ) then ! no interchange, use 1-by-1 pivot block kp = k else if( abs( real( a( imax, imax ),KIND=dp) )>=alpha*rowmax )then ! interchange rows and columns k and imax, use 1-by-1 ! pivot block kp = imax else ! interchange rows and columns k-1 and imax, use 2-by-2 ! pivot block kp = imax kstep = 2_${ik}$ end if end if ! ============================================================ kk = k - kstep + 1_${ik}$ if( kp/=kk ) then ! interchange rows and columns kk and kp in the leading ! 
submatrix a(1:k,1:k) call stdlib${ii}$_zswap( kp-1, a( 1_${ik}$, kk ), 1_${ik}$, a( 1_${ik}$, kp ), 1_${ik}$ ) do j = kp + 1, kk - 1 t = conjg( a( j, kk ) ) a( j, kk ) = conjg( a( kp, j ) ) a( kp, j ) = t end do a( kp, kk ) = conjg( a( kp, kk ) ) r1 = real( a( kk, kk ),KIND=dp) a( kk, kk ) = real( a( kp, kp ),KIND=dp) a( kp, kp ) = r1 if( kstep==2_${ik}$ ) then a( k, k ) = real( a( k, k ),KIND=dp) t = a( k-1, k ) a( k-1, k ) = a( kp, k ) a( kp, k ) = t end if else a( k, k ) = real( a( k, k ),KIND=dp) if( kstep==2_${ik}$ )a( k-1, k-1 ) = real( a( k-1, k-1 ),KIND=dp) end if ! update the leading submatrix if( kstep==1_${ik}$ ) then ! 1-by-1 pivot block d(k): column k now holds ! w(k) = u(k)*d(k) ! where u(k) is the k-th column of u ! perform a rank-1 update of a(1:k-1,1:k-1) as ! a := a - u(k)*d(k)*u(k)**h = a - w(k)*1/d(k)*w(k)**h r1 = one / real( a( k, k ),KIND=dp) call stdlib${ii}$_zher( uplo, k-1, -r1, a( 1_${ik}$, k ), 1_${ik}$, a, lda ) ! store u(k) in column k call stdlib${ii}$_zdscal( k-1, r1, a( 1_${ik}$, k ), 1_${ik}$ ) else ! 2-by-2 pivot block d(k): columns k and k-1 now hold ! ( w(k-1) w(k) ) = ( u(k-1) u(k) )*d(k) ! where u(k) and u(k-1) are the k-th and (k-1)-th columns ! of u ! perform a rank-2 update of a(1:k-2,1:k-2) as ! a := a - ( u(k-1) u(k) )*d(k)*( u(k-1) u(k) )**h ! = a - ( w(k-1) w(k) )*inv(d(k))*( w(k-1) w(k) )**h if( k>2_${ik}$ ) then d = stdlib${ii}$_dlapy2( real( a( k-1, k ),KIND=dp),aimag( a( k-1, k ) ) ) d22 = real( a( k-1, k-1 ),KIND=dp) / d d11 = real( a( k, k ),KIND=dp) / d tt = one / ( d11*d22-one ) d12 = a( k-1, k ) / d d = tt / d do j = k - 2, 1, -1 wkm1 = d*( d11*a( j, k-1 )-conjg( d12 )*a( j, k ) ) wk = d*( d22*a( j, k )-d12*a( j, k-1 ) ) do i = j, 1, -1 a( i, j ) = a( i, j ) - a( i, k )*conjg( wk ) -a( i, k-1 )*conjg( & wkm1 ) end do a( j, k ) = wk a( j, k-1 ) = wkm1 a( j, j ) = cmplx( real( a( j, j ),KIND=dp), zero,KIND=dp) end do end if end if end if ! 
store details of the interchanges in ipiv if( kstep==1_${ik}$ ) then ipiv( k ) = kp else ipiv( k ) = -kp ipiv( k-1 ) = -kp end if ! decrease k and return to the start of the main loop k = k - kstep go to 10 else ! factorize a as l*d*l**h using the lower triangle of a ! k is the main loop index, increasing from 1 to n in steps of ! 1 or 2 k = 1_${ik}$ 50 continue ! if k > n, exit from loop if( k>n )go to 90 kstep = 1_${ik}$ ! determine rows and columns to be interchanged and whether ! a 1-by-1 or 2-by-2 pivot block will be used absakk = abs( real( a( k, k ),KIND=dp) ) ! imax is the row-index of the largest off-diagonal element in ! column k, and colmax is its absolute value. ! determine both colmax and imax. if( k<n ) then imax = k + stdlib${ii}$_izamax( n-k, a( k+1, k ), 1_${ik}$ ) colmax = cabs1( a( imax, k ) ) else colmax = zero end if if( (max( absakk, colmax )==zero) .or. stdlib${ii}$_disnan(absakk) ) then ! column k is zero or underflow, or contains a nan: ! set info and continue if( info==0_${ik}$ )info = k kp = k a( k, k ) = real( a( k, k ),KIND=dp) else ! ============================================================ ! test for interchange if( absakk>=alpha*colmax ) then ! no interchange, use 1-by-1 pivot block kp = k else ! jmax is the column-index of the largest off-diagonal ! element in row imax, and rowmax is its absolute value. ! determine only rowmax. jmax = k - 1_${ik}$ + stdlib${ii}$_izamax( imax-k, a( imax, k ), lda ) rowmax = cabs1( a( imax, jmax ) ) if( imax<n ) then jmax = imax + stdlib${ii}$_izamax( n-imax, a( imax+1, imax ), 1_${ik}$ ) rowmax = max( rowmax, cabs1( a( jmax, imax ) ) ) end if if( absakk>=alpha*colmax*( colmax / rowmax ) ) then ! no interchange, use 1-by-1 pivot block kp = k else if( abs( real( a( imax, imax ),KIND=dp) )>=alpha*rowmax )then ! interchange rows and columns k and imax, use 1-by-1 ! pivot block kp = imax else ! interchange rows and columns k+1 and imax, use 2-by-2 ! 
pivot block kp = imax kstep = 2_${ik}$ end if end if ! ============================================================ kk = k + kstep - 1_${ik}$ if( kp/=kk ) then ! interchange rows and columns kk and kp in the trailing ! submatrix a(k:n,k:n) if( kp<n )call stdlib${ii}$_zswap( n-kp, a( kp+1, kk ), 1_${ik}$, a( kp+1, kp ), 1_${ik}$ ) do j = kk + 1, kp - 1 t = conjg( a( j, kk ) ) a( j, kk ) = conjg( a( kp, j ) ) a( kp, j ) = t end do a( kp, kk ) = conjg( a( kp, kk ) ) r1 = real( a( kk, kk ),KIND=dp) a( kk, kk ) = real( a( kp, kp ),KIND=dp) a( kp, kp ) = r1 if( kstep==2_${ik}$ ) then a( k, k ) = real( a( k, k ),KIND=dp) t = a( k+1, k ) a( k+1, k ) = a( kp, k ) a( kp, k ) = t end if else a( k, k ) = real( a( k, k ),KIND=dp) if( kstep==2_${ik}$ )a( k+1, k+1 ) = real( a( k+1, k+1 ),KIND=dp) end if ! update the trailing submatrix if( kstep==1_${ik}$ ) then ! 1-by-1 pivot block d(k): column k now holds ! w(k) = l(k)*d(k) ! where l(k) is the k-th column of l if( k<n ) then ! perform a rank-1 update of a(k+1:n,k+1:n) as ! a := a - l(k)*d(k)*l(k)**h = a - w(k)*(1/d(k))*w(k)**h r1 = one / real( a( k, k ),KIND=dp) call stdlib${ii}$_zher( uplo, n-k, -r1, a( k+1, k ), 1_${ik}$,a( k+1, k+1 ), lda ) ! store l(k) in column k call stdlib${ii}$_zdscal( n-k, r1, a( k+1, k ), 1_${ik}$ ) end if else ! 2-by-2 pivot block d(k) if( k<n-1 ) then ! perform a rank-2 update of a(k+2:n,k+2:n) as ! a := a - ( l(k) l(k+1) )*d(k)*( l(k) l(k+1) )**h ! = a - ( w(k) w(k+1) )*inv(d(k))*( w(k) w(k+1) )**h ! where l(k) and l(k+1) are the k-th and (k+1)-th ! 
columns of l d = stdlib${ii}$_dlapy2( real( a( k+1, k ),KIND=dp),aimag( a( k+1, k ) ) ) d11 = real( a( k+1, k+1 ),KIND=dp) / d d22 = real( a( k, k ),KIND=dp) / d tt = one / ( d11*d22-one ) d21 = a( k+1, k ) / d d = tt / d do j = k + 2, n wk = d*( d11*a( j, k )-d21*a( j, k+1 ) ) wkp1 = d*( d22*a( j, k+1 )-conjg( d21 )*a( j, k ) ) do i = j, n a( i, j ) = a( i, j ) - a( i, k )*conjg( wk ) -a( i, k+1 )*conjg( & wkp1 ) end do a( j, k ) = wk a( j, k+1 ) = wkp1 a( j, j ) = cmplx( real( a( j, j ),KIND=dp), zero,KIND=dp) end do end if end if end if ! store details of the interchanges in ipiv if( kstep==1_${ik}$ ) then ipiv( k ) = kp else ipiv( k ) = -kp ipiv( k+1 ) = -kp end if ! increase k and return to the start of the main loop k = k + kstep go to 50 end if 90 continue return end subroutine stdlib${ii}$_zhetf2 #:for ck,ct,ci in CMPLX_KINDS_TYPES #:if not ck in ["sp","dp"] pure module subroutine stdlib${ii}$_${ci}$hetf2( uplo, n, a, lda, ipiv, info ) !! ZHETF2: computes the factorization of a complex Hermitian matrix A !! using the Bunch-Kaufman diagonal pivoting method: !! A = U*D*U**H or A = L*D*L**H !! where U (or L) is a product of permutation and unit upper (lower) !! triangular matrices, U**H is the conjugate transpose of U, and D is !! Hermitian and block diagonal with 1-by-1 and 2-by-2 diagonal blocks. !! This is the unblocked version of the algorithm, calling Level 2 BLAS. ! -- lapack computational routine -- ! -- lapack is a software package provided by univ. of tennessee, -- ! -- univ. of california berkeley, univ. of colorado denver and nag ltd..-- use stdlib_blas_constants_${ck}$, only: negone, zero, half, one, two, three, four, eight, ten, czero, chalf, cone, cnegone ! Scalar Arguments character, intent(in) :: uplo integer(${ik}$), intent(out) :: info integer(${ik}$), intent(in) :: lda, n ! Array Arguments integer(${ik}$), intent(out) :: ipiv(*) complex(${ck}$), intent(inout) :: a(lda,*) ! 
===================================================================== ! Parameters real(${ck}$), parameter :: sevten = 17.0e+0_${ck}$ ! Local Scalars logical(lk) :: upper integer(${ik}$) :: i, imax, j, jmax, k, kk, kp, kstep real(${ck}$) :: absakk, alpha, colmax, d, d11, d22, r1, rowmax, tt complex(${ck}$) :: d12, d21, t, wk, wkm1, wkp1, zdum ! Intrinsic Functions ! Statement Functions real(${ck}$) :: cabs1 ! Statement Function Definitions cabs1( zdum ) = abs( real( zdum,KIND=${ck}$) ) + abs( aimag( zdum ) ) ! Executable Statements ! test the input parameters. info = 0_${ik}$ upper = stdlib_lsame( uplo, 'U' ) if( .not.upper .and. .not.stdlib_lsame( uplo, 'L' ) ) then info = -1_${ik}$ else if( n<0_${ik}$ ) then info = -2_${ik}$ else if( lda<max( 1_${ik}$, n ) ) then info = -4_${ik}$ end if if( info/=0_${ik}$ ) then call stdlib${ii}$_xerbla( 'ZHETF2', -info ) return end if ! initialize alpha for use in choosing pivot block size. alpha = ( one+sqrt( sevten ) ) / eight if( upper ) then ! factorize a as u*d*u**h using the upper triangle of a ! k is the main loop index, decreasing from n to 1 in steps of ! 1 or 2 k = n 10 continue ! if k < 1, exit from loop if( k<1 )go to 90 kstep = 1_${ik}$ ! determine rows and columns to be interchanged and whether ! a 1-by-1 or 2-by-2 pivot block will be used absakk = abs( real( a( k, k ),KIND=${ck}$) ) ! imax is the row-index of the largest off-diagonal element in ! column k, and colmax is its absolute value. ! determine both colmax and imax. if( k>1_${ik}$ ) then imax = stdlib${ii}$_i${ci