Functions
subroutine	dlahrd (n, k, nb, a, lda, tau, t, ldt, y, ldy)
	DLAHRD reduces the first nb columns of a general rectangular matrix A so that elements below the k-th subdiagonal are zero, and returns auxiliary matrices which are needed to apply the transformation to the unreduced part of A.
subroutine	dlabrd (m, n, nb, a, lda, d, e, tauq, taup, x, ldx, y, ldy)
	DLABRD reduces the first nb rows and columns of a general matrix to a bidiagonal form.
subroutine	dlacn2 (n, v, x, isgn, est, kase, isave)
	DLACN2 estimates the 1-norm of a square matrix, using reverse communication for evaluating matrix-vector products.
subroutine	dlacon (n, v, x, isgn, est, kase)
	DLACON estimates the 1-norm of a square matrix, using reverse communication for evaluating matrix-vector products.
subroutine	dladiv (a, b, c, d, p, q)
	DLADIV performs complex division in real arithmetic, avoiding unnecessary overflow.
subroutine	dladiv1 (a, b, c, d, p, q)
double precision function	dladiv2 (a, b, c, d, r, t)
subroutine	dlaein (rightv, noinit, n, h, ldh, wr, wi, vr, vi, b, ldb, work, eps3, smlnum, bignum, info)
	DLAEIN computes a specified right or left eigenvector of an upper Hessenberg matrix by inverse iteration.
subroutine	dlaexc (wantq, n, t, ldt, q, ldq, j1, n1, n2, work, info)
	DLAEXC swaps adjacent diagonal blocks of a real upper quasi-triangular matrix in Schur canonical form, by an orthogonal similarity transformation.
subroutine	dlag2 (a, lda, b, ldb, safmin, scale1, scale2, wr1, wr2, wi)
	DLAG2 computes the eigenvalues of a 2-by-2 generalized eigenvalue problem, with scaling as necessary to avoid over-/underflow.
subroutine	dlag2s (m, n, a, lda, sa, ldsa, info)
	DLAG2S converts a double precision matrix to a single precision matrix.
subroutine	dlags2 (upper, a1, a2, a3, b1, b2, b3, csu, snu, csv, snv, csq, snq)
	DLAGS2 computes 2-by-2 orthogonal matrices U, V, and Q, and applies them to matrices A and B such that the rows of the transformed A and B are parallel.
subroutine	dlagtm (trans, n, nrhs, alpha, dl, d, du, x, ldx, beta, b, ldb)
	DLAGTM performs a matrix-matrix product of the form C = αAB+βC, where A is a tridiagonal matrix, B and C are rectangular matrices, and α and β are scalars, which may be 0, 1, or -1.
subroutine	dlagv2 (a, lda, b, ldb, alphar, alphai, beta, csl, snl, csr, snr)
	DLAGV2 computes the Generalized Schur factorization of a real 2-by-2 matrix pencil (A,B) where B is upper triangular.
subroutine	dlahqr (wantt, wantz, n, ilo, ihi, h, ldh, wr, wi, iloz, ihiz, z, ldz, info)
	DLAHQR computes the eigenvalues and Schur factorization of an upper Hessenberg matrix, using the double-shift/single-shift QR algorithm.
subroutine	dlahr2 (n, k, nb, a, lda, tau, t, ldt, y, ldy)
	DLAHR2 reduces the specified number of first columns of a general rectangular matrix A so that elements below the specified subdiagonal are zero, and returns auxiliary matrices which are needed to apply the transformation to the unreduced part of A.
subroutine	dlaic1 (job, j, x, sest, w, gamma, sestpr, s, c)
	DLAIC1 applies one step of incremental condition estimation.
subroutine	dlaln2 (ltrans, na, nw, smin, ca, a, lda, d1, d2, b, ldb, wr, wi, x, ldx, scale, xnorm, info)
	DLALN2 solves a 1-by-1 or 2-by-2 linear system of equations of the specified form.
double precision function	dlangt (norm, n, dl, d, du)
	DLANGT returns the value of the 1-norm, Frobenius norm, infinity-norm, or the largest absolute value of any element of a general tridiagonal matrix.
double precision function	dlanhs (norm, n, a, lda, work)
	DLANHS returns the value of the 1-norm, Frobenius norm, infinity-norm, or the largest absolute value of any element of an upper Hessenberg matrix.
double precision function	dlansb (norm, uplo, n, k, ab, ldab, work)
	DLANSB returns the value of the 1-norm, or the Frobenius norm, or the infinity norm, or the element of largest absolute value of a symmetric band matrix.
double precision function	dlansp (norm, uplo, n, ap, work)
	DLANSP returns the value of the 1-norm, or the Frobenius norm, or the infinity norm, or the element of largest absolute value of a symmetric matrix supplied in packed form.
double precision function	dlantb (norm, uplo, diag, n, k, ab, ldab, work)
	DLANTB returns the value of the 1-norm, or the Frobenius norm, or the infinity norm, or the element of largest absolute value of a triangular band matrix.
double precision function	dlantp (norm, uplo, diag, n, ap, work)
	DLANTP returns the value of the 1-norm, or the Frobenius norm, or the infinity norm, or the element of largest absolute value of a triangular matrix supplied in packed form.
double precision function	dlantr (norm, uplo, diag, m, n, a, lda, work)
	DLANTR returns the value of the 1-norm, or the Frobenius norm, or the infinity norm, or the element of largest absolute value of a trapezoidal or triangular matrix.
subroutine	dlanv2 (a, b, c, d, rt1r, rt1i, rt2r, rt2i, cs, sn)
	DLANV2 computes the Schur factorization of a real 2-by-2 nonsymmetric matrix in standard form.
subroutine	dlapll (n, x, incx, y, incy, ssmin)
	DLAPLL measures the linear dependence of two vectors.
subroutine	dlapmr (forwrd, m, n, x, ldx, k)
	DLAPMR rearranges rows of a matrix as specified by a permutation vector.
subroutine	dlapmt (forwrd, m, n, x, ldx, k)
	DLAPMT performs a forward or backward permutation of the columns of a matrix.
subroutine	dlaqp2 (m, n, offset, a, lda, jpvt, tau, vn1, vn2, work)
	DLAQP2 computes a QR factorization with column pivoting of the matrix block.
subroutine	dlaqps (m, n, offset, nb, kb, a, lda, jpvt, tau, vn1, vn2, auxv, f, ldf)
	DLAQPS computes a step of QR factorization with column pivoting of a real m-by-n matrix A by using BLAS level 3.
subroutine	dlaqr0 (wantt, wantz, n, ilo, ihi, h, ldh, wr, wi, iloz, ihiz, z, ldz, work, lwork, info)
	DLAQR0 computes the eigenvalues of a Hessenberg matrix, and optionally the matrices from the Schur decomposition.
subroutine	dlaqr1 (n, h, ldh, sr1, si1, sr2, si2, v)
	DLAQR1 sets a scalar multiple of the first column of the product of 2-by-2 or 3-by-3 matrix H and specified shifts.
subroutine	dlaqr2 (wantt, wantz, n, ktop, kbot, nw, h, ldh, iloz, ihiz, z, ldz, ns, nd, sr, si, v, ldv, nh, t, ldt, nv, wv, ldwv, work, lwork)
	DLAQR2 performs the orthogonal similarity transformation of a Hessenberg matrix to detect and deflate fully converged eigenvalues from a trailing principal submatrix (aggressive early deflation).
subroutine	dlaqr3 (wantt, wantz, n, ktop, kbot, nw, h, ldh, iloz, ihiz, z, ldz, ns, nd, sr, si, v, ldv, nh, t, ldt, nv, wv, ldwv, work, lwork)
	DLAQR3 performs the orthogonal similarity transformation of a Hessenberg matrix to detect and deflate fully converged eigenvalues from a trailing principal submatrix (aggressive early deflation).
subroutine	dlaqr4 (wantt, wantz, n, ilo, ihi, h, ldh, wr, wi, iloz, ihiz, z, ldz, work, lwork, info)
	DLAQR4 computes the eigenvalues of a Hessenberg matrix, and optionally the matrices from the Schur decomposition.
subroutine	dlaqr5 (wantt, wantz, kacc22, n, ktop, kbot, nshfts, sr, si, h, ldh, iloz, ihiz, z, ldz, v, ldv, u, ldu, nv, wv, ldwv, nh, wh, ldwh)
	DLAQR5 performs a single small-bulge multi-shift QR sweep.
subroutine	dlaqsb (uplo, n, kd, ab, ldab, s, scond, amax, equed)
	DLAQSB scales a symmetric/Hermitian band matrix, using scaling factors computed by dpbequ.
subroutine	dlaqsp (uplo, n, ap, s, scond, amax, equed)
	DLAQSP scales a symmetric/Hermitian matrix in packed storage, using scaling factors computed by dppequ.
subroutine	dlaqtr (ltran, lreal, n, t, ldt, b, w, scale, x, work, info)
	DLAQTR solves a real quasi-triangular system of equations, or a complex quasi-triangular system of special form, in real arithmetic.
subroutine	dlar1v (n, b1, bn, lambda, d, l, ld, lld, pivmin, gaptol, z, wantnc, negcnt, ztz, mingma, r, isuppz, nrminv, resid, rqcorr, work)
	DLAR1V computes the (scaled) r-th column of the inverse of the submatrix in rows b1 through bn of the tridiagonal matrix L*D*L**T - λ*I.
subroutine	dlar2v (n, x, y, z, incx, c, s, incc)
	DLAR2V applies a vector of plane rotations with real cosines and real sines from both sides to a sequence of 2-by-2 symmetric/Hermitian matrices.
subroutine	dlarf (side, m, n, v, incv, tau, c, ldc, work)
	DLARF applies an elementary reflector to a general rectangular matrix.
subroutine	dlarfb (side, trans, direct, storev, m, n, k, v, ldv, t, ldt, c, ldc, work, ldwork)
	DLARFB applies a block reflector or its transpose to a general rectangular matrix.
subroutine	dlarfb_gett (ident, m, n, k, t, ldt, a, lda, b, ldb, work, ldwork)
	DLARFB_GETT
subroutine	dlarfg (n, alpha, x, incx, tau)
	DLARFG generates an elementary reflector (Householder matrix).
subroutine	dlarfgp (n, alpha, x, incx, tau)
	DLARFGP generates an elementary reflector (Householder matrix) with non-negative beta.
subroutine	dlarft (direct, storev, n, k, v, ldv, tau, t, ldt)
	DLARFT forms the triangular factor T of a block reflector H = I - V*T*V**H.
subroutine	dlarfx (side, m, n, v, tau, c, ldc, work)
	DLARFX applies an elementary reflector to a general rectangular matrix, with loop unrolling when the reflector has order ≤ 10.
subroutine	dlarfy (uplo, n, v, incv, tau, c, ldc, work)
	DLARFY
subroutine	dlargv (n, x, incx, y, incy, c, incc)
	DLARGV generates a vector of plane rotations with real cosines and real sines.
subroutine	dlarrv (n, vl, vu, d, l, pivmin, isplit, m, dol, dou, minrgp, rtol1, rtol2, w, werr, wgap, iblock, indexw, gers, z, ldz, isuppz, work, iwork, info)
	DLARRV computes the eigenvectors of the tridiagonal matrix T = L*D*L**T given L, D and the eigenvalues of L*D*L**T.
subroutine	dlartv (n, x, incx, y, incy, c, s, incc)
	DLARTV applies a vector of plane rotations with real cosines and real sines to the elements of a pair of vectors.
subroutine	dlaswp (n, a, lda, k1, k2, ipiv, incx)
	DLASWP performs a series of row interchanges on a general rectangular matrix.
subroutine	dlat2s (uplo, n, a, lda, sa, ldsa, info)
	DLAT2S converts a double-precision triangular matrix to a single-precision triangular matrix.
subroutine	dlatbs (uplo, trans, diag, normin, n, kd, ab, ldab, x, scale, cnorm, info)
	DLATBS solves a triangular banded system of equations.
subroutine	dlatdf (ijob, n, z, ldz, rhs, rdsum, rdscal, ipiv, jpiv)
	DLATDF uses the LU factorization of the n-by-n matrix computed by dgetc2 and computes a contribution to the reciprocal Dif-estimate.
subroutine	dlatps (uplo, trans, diag, normin, n, ap, x, scale, cnorm, info)
	DLATPS solves a triangular system of equations with the matrix held in packed storage.
subroutine	dlatrd (uplo, n, nb, a, lda, e, tau, w, ldw)
	DLATRD reduces the first nb rows and columns of a symmetric/Hermitian matrix A to real tridiagonal form by an orthogonal similarity transformation.
subroutine	dlatrs (uplo, trans, diag, normin, n, a, lda, x, scale, cnorm, info)
	DLATRS solves a triangular system of equations with the scale factor set to prevent overflow.
subroutine	dlauu2 (uplo, n, a, lda, info)
	DLAUU2 computes the product U*U**H or L**H*L, where U and L are upper or lower triangular matrices (unblocked algorithm).
subroutine	dlauum (uplo, n, a, lda, info)
	DLAUUM computes the product U*U**H or L**H*L, where U and L are upper or lower triangular matrices (blocked algorithm).
subroutine	drscl (n, sa, sx, incx)
	DRSCL multiplies a vector by the reciprocal of a real scalar.
subroutine	dtprfb (side, trans, direct, storev, m, n, k, l, v, ldv, t, ldt, a, lda, b, ldb, work, ldwork)
	DTPRFB applies a real or complex "triangular-pentagonal" blocked reflector to a real or complex matrix, which is composed of two blocks.
subroutine	slatrd (uplo, n, nb, a, lda, e, tau, w, ldw)
	SLATRD reduces the first nb rows and columns of a symmetric/Hermitian matrix A to real tridiagonal form by an orthogonal similarity transformation.

Detailed Description

This is the group of other double-precision auxiliary routines.

Function Documentation

◆ dlabrd()

subroutine dlabrd	(	integer	m,
		integer	n,
		integer	nb,
		double precision, dimension( lda, * )	a,
		integer	lda,
		double precision, dimension( * )	d,
		double precision, dimension( * )	e,
		double precision, dimension( * )	tauq,
		double precision, dimension( * )	taup,
		double precision, dimension( ldx, * )	x,
		integer	ldx,
		double precision, dimension( ldy, * )	y,
		integer	ldy )

DLABRD reduces the first nb rows and columns of a general matrix to a bidiagonal form.

Download DLABRD + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLABRD reduces the first NB rows and columns of a real general
!> m by n matrix A to upper or lower bidiagonal form by an orthogonal
!> transformation Q**T * A * P, and returns the matrices X and Y which
!> are needed to apply the transformation to the unreduced part of A.
!>
!> If m >= n, A is reduced to upper bidiagonal form; if m < n, to lower
!> bidiagonal form.
!>
!> This is an auxiliary routine called by DGEBRD
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows in the matrix A. !>
[in]	N	!> N is INTEGER !> The number of columns in the matrix A. !>
[in]	NB	!> NB is INTEGER !> The number of leading rows and columns of A to be reduced. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> On entry, the m by n general matrix to be reduced. !> On exit, the first NB rows and columns of the matrix are !> overwritten; the rest of the array is unchanged. !> If m >= n, elements on and below the diagonal in the first NB !> columns, with the array TAUQ, represent the orthogonal !> matrix Q as a product of elementary reflectors; and !> elements above the diagonal in the first NB rows, with the !> array TAUP, represent the orthogonal matrix P as a product !> of elementary reflectors. !> If m < n, elements below the diagonal in the first NB !> columns, with the array TAUQ, represent the orthogonal !> matrix Q as a product of elementary reflectors, and !> elements on and above the diagonal in the first NB rows, !> with the array TAUP, represent the orthogonal matrix P as !> a product of elementary reflectors. !> See Further Details. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	D	!> D is DOUBLE PRECISION array, dimension (NB) !> The diagonal elements of the first NB rows and columns of !> the reduced matrix. D(i) = A(i,i). !>
[out]	E	!> E is DOUBLE PRECISION array, dimension (NB) !> The off-diagonal elements of the first NB rows and columns of !> the reduced matrix. !>
[out]	TAUQ	!> TAUQ is DOUBLE PRECISION array, dimension (NB) !> The scalar factors of the elementary reflectors which !> represent the orthogonal matrix Q. See Further Details. !>
[out]	TAUP	!> TAUP is DOUBLE PRECISION array, dimension (NB) !> The scalar factors of the elementary reflectors which !> represent the orthogonal matrix P. See Further Details. !>
[out]	X	!> X is DOUBLE PRECISION array, dimension (LDX,NB) !> The m-by-nb matrix X required to update the unreduced part !> of A. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the array X. LDX >= max(1,M). !>
[out]	Y	!> Y is DOUBLE PRECISION array, dimension (LDY,NB) !> The n-by-nb matrix Y required to update the unreduced part !> of A. !>
[in]	LDY	!> LDY is INTEGER !> The leading dimension of the array Y. LDY >= max(1,N). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The matrices Q and P are represented as products of elementary
!>  reflectors:
!>
!>     Q = H(1) H(2) . . . H(nb)  and  P = G(1) G(2) . . . G(nb)
!>
!>  Each H(i) and G(i) has the form:
!>
!>     H(i) = I - tauq * v * v**T  and G(i) = I - taup * u * u**T
!>
!>  where tauq and taup are real scalars, and v and u are real vectors.
!>
!>  If m >= n, v(1:i-1) = 0, v(i) = 1, and v(i:m) is stored on exit in
!>  A(i:m,i); u(1:i) = 0, u(i+1) = 1, and u(i+1:n) is stored on exit in
!>  A(i,i+1:n); tauq is stored in TAUQ(i) and taup in TAUP(i).
!>
!>  If m < n, v(1:i) = 0, v(i+1) = 1, and v(i+1:m) is stored on exit in
!>  A(i+1:m,i); u(1:i-1) = 0, u(i) = 1, and u(i:n) is stored on exit in
!>  A(i,i:n); tauq is stored in TAUQ(i) and taup in TAUP(i).
!>
!>  The elements of the vectors v and u together form the m-by-nb matrix
!>  V and the nb-by-n matrix U**T which are needed, with X and Y, to apply
!>  the transformation to the unreduced part of the matrix, using a block
!>  update of the form:  A := A - V*Y**T - X*U**T.
!>
!>  The contents of A on exit are illustrated by the following examples
!>  with nb = 2:
!>
!>  m = 6 and n = 5 (m > n):          m = 5 and n = 6 (m < n):
!>
!>    (  1   1   u1  u1  u1 )           (  1   u1  u1  u1  u1  u1 )
!>    (  v1  1   1   u2  u2 )           (  1   1   u2  u2  u2  u2 )
!>    (  v1  v2  a   a   a  )           (  v1  1   a   a   a   a  )
!>    (  v1  v2  a   a   a  )           (  v1  v2  a   a   a   a  )
!>    (  v1  v2  a   a   a  )           (  v1  v2  a   a   a   a  )
!>    (  v1  v2  a   a   a  )
!>
!>  where a denotes an element of the original matrix which is unchanged,
!>  vi denotes an element of the vector defining H(i), and ui an element
!>  of the vector defining G(i).
!>

Definition at line 208 of file dlabrd.f.

*
*  Body of DLABRD: reduces the first NB rows and columns of the
*  M-by-N array A to bidiagonal form (upper if M >= N, lower
*  otherwise).  D and E receive the diagonal and off-diagonal
*  entries, TAUQ and TAUP the reflector scalars, and X and Y the
*  matrices needed later to update the unreduced part of A.
*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            LDA, LDX, LDY, M, N, NB
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * ), D( * ), E( * ), TAUP( * ),
     $                   TAUQ( * ), X( LDX, * ), Y( LDY, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d0, one = 1.0d0 )
*     ..
*     .. Local Scalars ..
      INTEGER            I
*     ..
*     .. External Subroutines ..
      EXTERNAL           dgemv, dlarfg, dscal
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          min
*     ..
*     .. Executable Statements ..
*
*     Quick return if possible
*     (only M and N are tested; NB is not validated here)
*
      IF( m.LE.0 .OR. n.LE.0 )
     $   RETURN
*
      IF( m.GE.n ) THEN
*
*        Reduce to upper bidiagonal form
*        (one pass per reduced column/row pair, i = 1..NB)
*
         DO 10 i = 1, nb
*
*           Update A(i:m,i)
*           Both calls accumulate into A(i:m,i) (beta = ONE); for
*           i = 1 the inner dimension i-1 is zero.
*
            CALL dgemv( 'No transpose', m-i+1, i-1, -one, a( i, 1 ),
     $                  lda, y( i, 1 ), ldy, one, a( i, i ), 1 )
            CALL dgemv( 'No transpose', m-i+1, i-1, -one, x( i, 1 ),
     $                  ldx, a( 1, i ), 1, one, a( i, i ), 1 )
*
*           Generate reflection Q(i) to annihilate A(i+1:m,i)
*           MIN( i+1, m ) keeps the row index inside A when i = m.
*
            CALL dlarfg( m-i+1, a( i, i ), a( min( i+1, m ), i ), 1,
     $                   tauq( i ) )
*
*           Keep the new diagonal entry in D; when i < n the array
*           element itself is overwritten with ONE just below.
*
            d( i ) = a( i, i )
*
*           The row step is skipped for i = n, where n-i = 0 and
*           there is no column to the right of the diagonal.
*
            IF( i.LT.n ) THEN
*
*              With the unit entry in place, A(i:m,i) is passed as
*              the vector operand of the products below.
*
               a( i, i ) = one
*
*              Compute Y(i+1:n,i)
*              Y(1:i-1,i) is used as scratch: it is written with
*              beta = ZERO and consumed by the call that follows.
*
               CALL dgemv( 'Transpose', m-i+1, n-i, one, a( i, i+1 ),
     $                     lda, a( i, i ), 1, zero, y( i+1, i ), 1 )
               CALL dgemv( 'Transpose', m-i+1, i-1, one, a( i, 1 ), lda,
     $                     a( i, i ), 1, zero, y( 1, i ), 1 )
               CALL dgemv( 'No transpose', n-i, i-1, -one, y( i+1, 1 ),
     $                     ldy, y( 1, i ), 1, one, y( i+1, i ), 1 )
               CALL dgemv( 'Transpose', m-i+1, i-1, one, x( i, 1 ), ldx,
     $                     a( i, i ), 1, zero, y( 1, i ), 1 )
               CALL dgemv( 'Transpose', i-1, n-i, -one, a( 1, i+1 ),
     $                     lda, y( 1, i ), 1, one, y( i+1, i ), 1 )
               CALL dscal( n-i, tauq( i ), y( i+1, i ), 1 )
*
*              Update A(i,i+1:n)
*              The row of A is addressed with stride LDA.
*
               CALL dgemv( 'No transpose', n-i, i, -one, y( i+1, 1 ),
     $                     ldy, a( i, 1 ), lda, one, a( i, i+1 ), lda )
               CALL dgemv( 'Transpose', i-1, n-i, -one, a( 1, i+1 ),
     $                     lda, x( i, 1 ), ldx, one, a( i, i+1 ), lda )
*
*              Generate reflection P(i) to annihilate A(i,i+2:n)
*              MIN( i+2, n ) keeps the column index inside A when
*              i = n-1.
*
               CALL dlarfg( n-i, a( i, i+1 ), a( i, min( i+2, n ) ),
     $                      lda, taup( i ) )
*
*              Save the superdiagonal entry in E, then overwrite it
*              with ONE so A(i,i+1:n) can be used as a vector operand.
*
               e( i ) = a( i, i+1 )
               a( i, i+1 ) = one
*
*              Compute X(i+1:m,i)
*              X(1:i,i) is used as scratch in the same way as
*              Y(1:i-1,i) above.
*
               CALL dgemv( 'No transpose', m-i, n-i, one, a( i+1, i+1 ),
     $                     lda, a( i, i+1 ), lda, zero, x( i+1, i ), 1 )
               CALL dgemv( 'Transpose', n-i, i, one, y( i+1, 1 ), ldy,
     $                     a( i, i+1 ), lda, zero, x( 1, i ), 1 )
               CALL dgemv( 'No transpose', m-i, i, -one, a( i+1, 1 ),
     $                     lda, x( 1, i ), 1, one, x( i+1, i ), 1 )
               CALL dgemv( 'No transpose', i-1, n-i, one, a( 1, i+1 ),
     $                     lda, a( i, i+1 ), lda, zero, x( 1, i ), 1 )
               CALL dgemv( 'No transpose', m-i, i-1, -one, x( i+1, 1 ),
     $                     ldx, x( 1, i ), 1, one, x( i+1, i ), 1 )
               CALL dscal( m-i, taup( i ), x( i+1, i ), 1 )
            END IF
   10    CONTINUE
      ELSE
*
*        Reduce to lower bidiagonal form
*        (same scheme as above with the row step performed first)
*
         DO 20 i = 1, nb
*
*           Update A(i,i:n)
*           Both calls accumulate into row i of A (stride LDA).
*
            CALL dgemv( 'No transpose', n-i+1, i-1, -one, y( i, 1 ),
     $                  ldy, a( i, 1 ), lda, one, a( i, i ), lda )
            CALL dgemv( 'Transpose', i-1, n-i+1, -one, a( 1, i ), lda,
     $                  x( i, 1 ), ldx, one, a( i, i ), lda )
*
*           Generate reflection P(i) to annihilate A(i,i+1:n)
*           MIN( i+1, n ) keeps the column index inside A.
*
            CALL dlarfg( n-i+1, a( i, i ), a( i, min( i+1, n ) ), lda,
     $                   taup( i ) )
*
*           Keep the new diagonal entry in D; when i < m the array
*           element itself is overwritten with ONE just below.
*
            d( i ) = a( i, i )
*
*           The column step is skipped for i = m, where m-i = 0 and
*           there is no row below the diagonal.
*
            IF( i.LT.m ) THEN
               a( i, i ) = one
*
*              Compute X(i+1:m,i)
*              X(1:i-1,i) is used as scratch: written with
*              beta = ZERO, then consumed by the next call.
*
               CALL dgemv( 'No transpose', m-i, n-i+1, one, a( i+1, i ),
     $                     lda, a( i, i ), lda, zero, x( i+1, i ), 1 )
               CALL dgemv( 'Transpose', n-i+1, i-1, one, y( i, 1 ), ldy,
     $                     a( i, i ), lda, zero, x( 1, i ), 1 )
               CALL dgemv( 'No transpose', m-i, i-1, -one, a( i+1, 1 ),
     $                     lda, x( 1, i ), 1, one, x( i+1, i ), 1 )
               CALL dgemv( 'No transpose', i-1, n-i+1, one, a( 1, i ),
     $                     lda, a( i, i ), lda, zero, x( 1, i ), 1 )
               CALL dgemv( 'No transpose', m-i, i-1, -one, x( i+1, 1 ),
     $                     ldx, x( 1, i ), 1, one, x( i+1, i ), 1 )
               CALL dscal( m-i, taup( i ), x( i+1, i ), 1 )
*
*              Update A(i+1:m,i)
*
               CALL dgemv( 'No transpose', m-i, i-1, -one, a( i+1, 1 ),
     $                     lda, y( i, 1 ), ldy, one, a( i+1, i ), 1 )
               CALL dgemv( 'No transpose', m-i, i, -one, x( i+1, 1 ),
     $                     ldx, a( 1, i ), 1, one, a( i+1, i ), 1 )
*
*              Generate reflection Q(i) to annihilate A(i+2:m,i)
*              MIN( i+2, m ) keeps the row index inside A when
*              i = m-1.
*
               CALL dlarfg( m-i, a( i+1, i ), a( min( i+2, m ), i ), 1,
     $                      tauq( i ) )
*
*              Save the subdiagonal entry in E, then overwrite it
*              with ONE so A(i+1:m,i) can be used as a vector operand.
*
               e( i ) = a( i+1, i )
               a( i+1, i ) = one
*
*              Compute Y(i+1:n,i)
*              Y(1:i,i) is used as scratch for the intermediate
*              products.
*
               CALL dgemv( 'Transpose', m-i, n-i, one, a( i+1, i+1 ),
     $                     lda, a( i+1, i ), 1, zero, y( i+1, i ), 1 )
               CALL dgemv( 'Transpose', m-i, i-1, one, a( i+1, 1 ), lda,
     $                     a( i+1, i ), 1, zero, y( 1, i ), 1 )
               CALL dgemv( 'No transpose', n-i, i-1, -one, y( i+1, 1 ),
     $                     ldy, y( 1, i ), 1, one, y( i+1, i ), 1 )
               CALL dgemv( 'Transpose', m-i, i, one, x( i+1, 1 ), ldx,
     $                     a( i+1, i ), 1, zero, y( 1, i ), 1 )
               CALL dgemv( 'Transpose', i, n-i, -one, a( 1, i+1 ), lda,
     $                     y( 1, i ), 1, one, y( i+1, i ), 1 )
               CALL dscal( n-i, tauq( i ), y( i+1, i ), 1 )
            END IF
   20    CONTINUE
      END IF
      RETURN
*
*     End of DLABRD
*

◆ dlacn2()

subroutine dlacn2	(	integer	n,
		double precision, dimension( * )	v,
		double precision, dimension( * )	x,
		integer, dimension( * )	isgn,
		double precision	est,
		integer	kase,
		integer, dimension( 3 )	isave )

DLACN2 estimates the 1-norm of a square matrix, using reverse communication for evaluating matrix-vector products.

Download DLACN2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLACN2 estimates the 1-norm of a square, real matrix A.
!> Reverse communication is used for evaluating matrix-vector products.
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the matrix. N >= 1. !>
[out]	V	!> V is DOUBLE PRECISION array, dimension (N) !> On the final return, V = A*W, where EST = norm(V)/norm(W) !> (W is not returned). !>
[in,out]	X	!> X is DOUBLE PRECISION array, dimension (N) !> On an intermediate return, X should be overwritten by !> A * X, if KASE=1, !> A**T * X, if KASE=2, !> and DLACN2 must be re-called with all the other parameters !> unchanged. !>
[out]	ISGN	!> ISGN is INTEGER array, dimension (N) !>
[in,out]	EST	!> EST is DOUBLE PRECISION !> On entry with KASE = 1 or 2 and ISAVE(1) = 3, EST should be !> unchanged from the previous call to DLACN2. !> On exit, EST is an estimate (a lower bound) for norm(A). !>
[in,out]	KASE	!> KASE is INTEGER !> On the initial call to DLACN2, KASE should be 0. !> On an intermediate return, KASE will be 1 or 2, indicating !> whether X should be overwritten by A * X or A**T * X. !> On the final return from DLACN2, KASE will again be 0. !>
[in,out]	ISAVE	!> ISAVE is INTEGER array, dimension (3) !> ISAVE is used to save variables between calls to DLACN2 !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  Originally named SONEST, dated March 16, 1988.
!>
!>  This is a thread safe version of DLACON, which uses the array ISAVE
!>  in place of a SAVE statement, as follows:
!>
!>     DLACON     DLACN2
!>      JUMP     ISAVE(1)
!>      J        ISAVE(2)
!>      ITER     ISAVE(3)
!>

Contributors: Nick Higham, University of Manchester

References: N.J. Higham, "FORTRAN codes for estimating the one-norm of a real or complex matrix, with applications to condition estimation", ACM Trans. Math. Soft., vol. 14, no. 4, pp. 381-396, December 1988.

Definition at line 135 of file dlacn2.f.

*
*  Body of DLACN2: reverse-communication estimator for the 1-norm of
*  a square real matrix.  Each call either returns with KASE = 1 or 2
*  to request a product from the caller, or returns with KASE = 0
*  when EST holds the final estimate.  All state carried between
*  calls lives in ISAVE: ISAVE(1) is the re-entry point, ISAVE(2) the
*  current index J, ISAVE(3) the iteration count.
*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            KASE, N
      DOUBLE PRECISION   EST
*     ..
*     .. Array Arguments ..
      INTEGER            ISGN( * ), ISAVE( 3 )
      DOUBLE PRECISION   V( * ), X( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
*     ITMAX bounds the value ISAVE(3) may reach in the main loop.
      INTEGER            ITMAX
      parameter( itmax = 5 )
      DOUBLE PRECISION   ZERO, ONE, TWO
      parameter( zero = 0.0d+0, one = 1.0d+0, two = 2.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            I, JLAST
      DOUBLE PRECISION   ALTSGN, ESTOLD, TEMP, XS
*     ..
*     .. External Functions ..
      INTEGER            IDAMAX
      DOUBLE PRECISION   DASUM
      EXTERNAL           idamax, dasum
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, dble, nint
*     ..
*     .. Executable Statements ..
*
*     Initial call (KASE = 0): start from the vector with every entry
*     equal to 1/N and ask the caller for A*X.
*
      IF( kase.EQ.0 ) THEN
         DO 10 i = 1, n
            x( i ) = one / dble( n )
   10    CONTINUE
         kase = 1
         isave( 1 ) = 1
         RETURN
      END IF
*
*     Re-entry: resume at the label selected by ISAVE(1)
*     (1 -> 20, 2 -> 40, 3 -> 70, 4 -> 110, 5 -> 140).
*
      GO TO ( 20, 40, 70, 110, 140 )isave( 1 )
*
*     ................ ENTRY   (ISAVE( 1 ) = 1)
*     FIRST ITERATION.  X HAS BEEN OVERWRITTEN BY A*X.
*
   20 CONTINUE
*     For N = 1 the single product already gives the result.
      IF( n.EQ.1 ) THEN
         v( 1 ) = x( 1 )
         est = abs( v( 1 ) )
*        ... QUIT
         GO TO 150
      END IF
      est = dasum( n, x, 1 )
*
*     Replace X by its sign vector (zero counts as +1) and record
*     the signs in ISGN; the caller is then asked for A**T * X.
*
      DO 30 i = 1, n
         IF( x(i).GE.zero ) THEN
            x(i) = one
         ELSE
            x(i) = -one
         END IF
         isgn( i ) = nint( x( i ) )
   30 CONTINUE
      kase = 2
      isave( 1 ) = 2
      RETURN
*
*     ................ ENTRY   (ISAVE( 1 ) = 2)
*     FIRST ITERATION.  X HAS BEEN OVERWRITTEN BY TRANSPOSE(A)*X.
*
   40 CONTINUE
*     ISAVE(2) = index returned by IDAMAX; ISAVE(3) starts at 2.
      isave( 2 ) = idamax( n, x, 1 )
      isave( 3 ) = 2
*
*     MAIN LOOP - ITERATIONS 2,3,...,ITMAX.
*
   50 CONTINUE
*     Set X to the unit vector with a ONE in position ISAVE(2) and
*     ask the caller for A*X.
      DO 60 i = 1, n
         x( i ) = zero
   60 CONTINUE
      x( isave( 2 ) ) = one
      kase = 1
      isave( 1 ) = 3
      RETURN
*
*     ................ ENTRY   (ISAVE( 1 ) = 3)
*     X HAS BEEN OVERWRITTEN BY A*X.
*
   70 CONTINUE
*     Keep the product in V and take its absolute sum as the new
*     estimate, remembering the previous one in ESTOLD.
      CALL dcopy( n, x, 1, v, 1 )
      estold = est
      est = dasum( n, v, 1 )
*     Compare the sign of every entry with the stored ISGN; the
*     first mismatch leaves the loop through label 90.
      DO 80 i = 1, n
         IF( x(i).GE.zero ) THEN
            xs = one
         ELSE
            xs = -one
         END IF
         IF( nint( xs ).NE.isgn( i ) )
     $      GO TO 90
   80 CONTINUE
*     REPEATED SIGN VECTOR DETECTED, HENCE ALGORITHM HAS CONVERGED.
      GO TO 120
*
   90 CONTINUE
*     TEST FOR CYCLING.
*     (the estimate did not increase, so stop iterating)
      IF( est.LE.estold )
     $   GO TO 120
*
*     Store the new sign vector in X and ISGN and ask the caller
*     for A**T * X.
*
      DO 100 i = 1, n
         IF( x(i).GE.zero ) THEN
            x(i) = one
         ELSE
            x(i) = -one
         END IF
         isgn( i ) = nint( x( i ) )
  100 CONTINUE
      kase = 2
      isave( 1 ) = 4
      RETURN
*
*     ................ ENTRY   (ISAVE( 1 ) = 4)
*     X HAS BEEN OVERWRITTEN BY TRANSPOSE(A)*X.
*
  110 CONTINUE
*     Iterate again from label 50 only if X(JLAST) differs from
*     ABS( X( new index ) ) and ISAVE(3) is still below ITMAX.
      jlast = isave( 2 )
      isave( 2 ) = idamax( n, x, 1 )
      IF( ( x( jlast ).NE.abs( x( isave( 2 ) ) ) ) .AND.
     $    ( isave( 3 ).LT.itmax ) ) THEN
         isave( 3 ) = isave( 3 ) + 1
         GO TO 50
      END IF
*
*     ITERATION COMPLETE.  FINAL STAGE.
*
  120 CONTINUE
*     Build the alternating-sign vector
*     X(i) = (+/-)( 1 + (i-1)/(n-1) ) and ask the caller for A*X.
*     N = 1 exits at label 20, so DBLE( n-1 ) is nonzero here
*     provided the caller left N and ISAVE unchanged between calls.
      altsgn = one
      DO 130 i = 1, n
         x( i ) = altsgn*( one+dble( i-1 ) / dble( n-1 ) )
         altsgn = -altsgn
  130 CONTINUE
      kase = 1
      isave( 1 ) = 5
      RETURN
*
*     ................ ENTRY   (ISAVE( 1 ) = 5)
*     X HAS BEEN OVERWRITTEN BY A*X.
*
  140 CONTINUE
*     Adopt the alternative estimate only when it exceeds EST; V is
*     then replaced by the corresponding product.
      temp = two*( dasum( n, x, 1 ) / dble( 3*n ) )
      IF( temp.GT.est ) THEN
         CALL dcopy( n, x, 1, v, 1 )
         est = temp
      END IF
*
  150 CONTINUE
*     KASE = 0 signals the final return to the caller.
      kase = 0
      RETURN
*
*     End of DLACN2
*

◆ dlacon()

subroutine dlacon	(	integer	n,
		double precision, dimension( * )	v,
		double precision, dimension( * )	x,
		integer, dimension( * )	isgn,
		double precision	est,
		integer	kase )

DLACON estimates the 1-norm of a square matrix, using reverse communication for evaluating matrix-vector products.

Download DLACON + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLACON estimates the 1-norm of a square, real matrix A.
!> Reverse communication is used for evaluating matrix-vector products.
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the matrix. N >= 1. !>
[out]	V	!> V is DOUBLE PRECISION array, dimension (N) !> On the final return, V = A*W, where EST = norm(V)/norm(W) !> (W is not returned). !>
[in,out]	X	!> X is DOUBLE PRECISION array, dimension (N) !> On an intermediate return, X should be overwritten by !> A * X, if KASE=1, !> A**T * X, if KASE=2, !> and DLACON must be re-called with all the other parameters !> unchanged. !>
[out]	ISGN	!> ISGN is INTEGER array, dimension (N) !>
[in,out]	EST	!> EST is DOUBLE PRECISION !> On entry with KASE = 1 or 2 and JUMP = 3, EST should be !> unchanged from the previous call to DLACON. !> On exit, EST is an estimate (a lower bound) for norm(A). !>
[in,out]	KASE	!> KASE is INTEGER !> On the initial call to DLACON, KASE should be 0. !> On an intermediate return, KASE will be 1 or 2, indicating !> whether X should be overwritten by A * X or A**T * X. !> On the final return from DLACON, KASE will again be 0. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Nick Higham, University of Manchester.
Originally named SONEST, dated March 16, 1988.

References: N.J. Higham, "FORTRAN codes for estimating the one-norm of a real or complex matrix, with applications to condition estimation", ACM Trans. Math. Soft., vol. 14, no. 4, pp. 381-396, December 1988.

Definition at line 114 of file dlacon.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            KASE, N
      DOUBLE PRECISION   EST
*     ..
*     .. Array Arguments ..
      INTEGER            ISGN( * )
      DOUBLE PRECISION   V( * ), X( * )
*     ..
*
*  =====================================================================
*
*     Reverse-communication 1-norm estimator.  Every RETURN that leaves
*     KASE = 1 or 2 asks the caller to overwrite X by A*X or A**T*X and
*     to call again; ISTAGE records the point at which to resume.  All
*     local variables are retained between calls by the blanket SAVE
*     below, so only one estimation can be in progress at a time.
*
*     .. Parameters ..
      INTEGER            ITMAX
      PARAMETER          ( ITMAX = 5 )
      DOUBLE PRECISION   ZERO, ONE, TWO
      PARAMETER          ( ZERO = 0.0D+0, ONE = 1.0D+0, TWO = 2.0D+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            SAMESG
      INTEGER            K, NITER, JMAX, JPREV, ISTAGE
      DOUBLE PRECISION   SGN, ESTPRV, CAND
*     ..
*     .. External Functions ..
      INTEGER            IDAMAX
      DOUBLE PRECISION   DASUM
      EXTERNAL           IDAMAX, DASUM
*     ..
*     .. External Subroutines ..
      EXTERNAL           DCOPY
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          ABS, DBLE, NINT, SIGN
*     ..
*     .. Save statement ..
      SAVE
*     ..
*     .. Executable Statements ..
*
      IF( KASE.EQ.0 ) THEN
*
*        Initial call: start from the vector whose entries are all 1/N.
*
         DO K = 1, N
            X( K ) = ONE / DBLE( N )
         END DO
         KASE = 1
         ISTAGE = 1
         RETURN
      END IF
*
*     Resume at the stage recorded on the previous return.
*
      GO TO ( 20, 40, 70, 110, 140 )ISTAGE
*
*     ISTAGE = 1.  First iteration; X now holds A*X.
*
   20 CONTINUE
      IF( N.EQ.1 ) THEN
*        Order-one case: the estimate is |X(1)|; finish at once.
         V( 1 ) = X( 1 )
         EST = ABS( V( 1 ) )
         GO TO 150
      END IF
      EST = DASUM( N, X, 1 )
*
*     Replace X by its sign vector and remember it in ISGN.
*
      DO K = 1, N
         X( K ) = SIGN( ONE, X( K ) )
         ISGN( K ) = NINT( X( K ) )
      END DO
      KASE = 2
      ISTAGE = 2
      RETURN
*
*     ISTAGE = 2.  First iteration; X now holds TRANSPOSE(A)*X.
*
   40 CONTINUE
      JMAX = IDAMAX( N, X, 1 )
      NITER = 2
*
*     Main loop, iterations 2,3,...,ITMAX: request A times the unit
*     vector selected by JMAX.
*
   50 CONTINUE
      DO K = 1, N
         X( K ) = ZERO
      END DO
      X( JMAX ) = ONE
      KASE = 1
      ISTAGE = 3
      RETURN
*
*     ISTAGE = 3.  X now holds A*X.
*
   70 CONTINUE
      CALL DCOPY( N, X, 1, V, 1 )
      ESTPRV = EST
      EST = DASUM( N, V, 1 )
*
*     Compare the sign pattern of X with the one stored in ISGN.
*
      SAMESG = .TRUE.
      DO K = 1, N
         IF( NINT( SIGN( ONE, X( K ) ) ).NE.ISGN( K ) ) THEN
            SAMESG = .FALSE.
            EXIT
         END IF
      END DO
*
*     A repeated sign vector means the algorithm has converged; an
*     estimate that did not increase is the test for cycling.  Either
*     way go to the final stage.
*
      IF( SAMESG .OR. EST.LE.ESTPRV )
     $   GO TO 120
*
      DO K = 1, N
         X( K ) = SIGN( ONE, X( K ) )
         ISGN( K ) = NINT( X( K ) )
      END DO
      KASE = 2
      ISTAGE = 4
      RETURN
*
*     ISTAGE = 4.  X now holds TRANSPOSE(A)*X.
*
  110 CONTINUE
      JPREV = JMAX
      JMAX = IDAMAX( N, X, 1 )
      IF( ( X( JPREV ).NE.ABS( X( JMAX ) ) ) .AND.
     $    ( NITER.LT.ITMAX ) ) THEN
         NITER = NITER + 1
         GO TO 50
      END IF
*
*     Iteration complete.  Final stage: request A times a vector of
*     alternating sign whose magnitudes grow linearly with the index.
*
  120 CONTINUE
      SGN = ONE
      DO K = 1, N
         X( K ) = SGN*( ONE+DBLE( K-1 ) / DBLE( N-1 ) )
         SGN = -SGN
      END DO
      KASE = 1
      ISTAGE = 5
      RETURN
*
*     ISTAGE = 5.  X now holds A*X; keep this candidate only if it
*     gives a larger estimate than the one already found.
*
  140 CONTINUE
      CAND = TWO*( DASUM( N, X, 1 ) / DBLE( 3*N ) )
      IF( CAND.GT.EST ) THEN
         CALL DCOPY( N, X, 1, V, 1 )
         EST = CAND
      END IF
*
*     Final return: KASE = 0 tells the caller that EST is ready.
*
  150 CONTINUE
      KASE = 0
      RETURN
*
*     End of DLACON
*

◆ dladiv()

subroutine dladiv	(	double precision	a,
		double precision	b,
		double precision	c,
		double precision	d,
		double precision	p,
		double precision	q )

DLADIV performs complex division in real arithmetic, avoiding unnecessary overflow.

Download DLADIV + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLADIV performs complex division in  real arithmetic
!>
!>                       a + i*b
!>            p + i*q = ---------
!>                       c + i*d
!>
!> The algorithm is due to Michael Baudin and Robert L. Smith
!> and can be found in the paper
!> "A Robust Complex Division in Scilab"
!>

Parameters

[in]	A	!> A is DOUBLE PRECISION !>
[in]	B	!> B is DOUBLE PRECISION !>
[in]	C	!> C is DOUBLE PRECISION !>
[in]	D	!> D is DOUBLE PRECISION !> The scalars a, b, c, and d in the above expression. !>
[out]	P	!> P is DOUBLE PRECISION !>
[out]	Q	!> Q is DOUBLE PRECISION !> The scalars p and q in the above expression. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 90 of file dladiv.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      DOUBLE PRECISION   A, B, C, D, P, Q
*     ..
*
*  =====================================================================
*
*     Forms p + i*q = ( a + i*b ) / ( c + i*d ).  Working copies of the
*     numerator and denominator are rescaled when their largest
*     component is very large or very small, the quotient of the scaled
*     operands is obtained from DLADIV1, and the accumulated scale
*     factor is applied to P and Q at the end.
*
*     .. Parameters ..
      DOUBLE PRECISION   BS, HALF, TWO
      PARAMETER          ( BS = 2.0D0, HALF = 0.5D0, TWO = 2.0D0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   NUMRE, NUMIM, DENRE, DENIM, NUMMAX, DENMAX,
     $                   FACTOR, OVFL, SAFMIN, ULP, BOOST, HUGEV,
     $                   TINYV
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           DLAMCH
*     ..
*     .. External Subroutines ..
      EXTERNAL           DLADIV1
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          ABS, MAX
*     ..
*     .. Executable Statements ..
*
*     Work on copies so that A, B, C and D are left untouched.
*
      NUMRE = A
      NUMIM = B
      DENRE = C
      DENIM = D
      NUMMAX = MAX( ABS( A ), ABS( B ) )
      DENMAX = MAX( ABS( C ), ABS( D ) )
      FACTOR = 1.0D0
*
*     Machine constants and the two scaling thresholds.
*
      OVFL = DLAMCH( 'Overflow threshold' )
      SAFMIN = DLAMCH( 'Safe minimum' )
      ULP = DLAMCH( 'Epsilon' )
      BOOST = BS / ( ULP*ULP )
      HUGEV = HALF*OVFL
      TINYV = SAFMIN*BS / ULP
*
*     Halve operands that are at least half the overflow threshold.
*
      IF( NUMMAX.GE.HUGEV ) THEN
         NUMRE = HALF*NUMRE
         NUMIM = HALF*NUMIM
         FACTOR = TWO*FACTOR
      END IF
      IF( DENMAX.GE.HUGEV ) THEN
         DENRE = HALF*DENRE
         DENIM = HALF*DENIM
         FACTOR = HALF*FACTOR
      END IF
*
*     Scale up operands that do not exceed the small threshold.
*
      IF( NUMMAX.LE.TINYV ) THEN
         NUMRE = NUMRE*BOOST
         NUMIM = NUMIM*BOOST
         FACTOR = FACTOR / BOOST
      END IF
      IF( DENMAX.LE.TINYV ) THEN
         DENRE = DENRE*BOOST
         DENIM = DENIM*BOOST
         FACTOR = FACTOR*BOOST
      END IF
*
*     DLADIV1 divides by its third argument, so pass the denominator
*     component of larger magnitude there.  In the swapped call the
*     imaginary part comes back with the opposite sign.
*
      IF( ABS( D ).LE.ABS( C ) ) THEN
         CALL DLADIV1( NUMRE, NUMIM, DENRE, DENIM, P, Q )
      ELSE
         CALL DLADIV1( NUMIM, NUMRE, DENIM, DENRE, P, Q )
         Q = -Q
      END IF
*
*     Undo the scaling.
*
      P = P*FACTOR
      Q = Q*FACTOR
*
      RETURN
*
*     End of DLADIV
*

◆ dladiv1()

subroutine dladiv1	(	double precision	a,
		double precision	b,
		double precision	c,
		double precision	d,
		double precision	p,
		double precision	q )

Definition at line 176 of file dladiv.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      DOUBLE PRECISION   A, B, C, D, P, Q
*     ..
*
*  =====================================================================
*
*     Helper for DLADIV.  With RATIO = D/C and RDENOM = 1/(C + D*RATIO)
*     it returns P and Q from two calls to DLADIV2.
*     Note that A is overwritten by -A on exit.
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE
      PARAMETER          ( ONE = 1.0D0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   RATIO, RDENOM
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLADIV2
      EXTERNAL           DLADIV2
*     ..
*     .. Executable Statements ..
*
      RATIO = D / C
      RDENOM = ONE / ( C + D*RATIO )
*
*     Real part.
*
      P = DLADIV2( A, B, C, D, RATIO, RDENOM )
*
*     Imaginary part: same kernel with the roles of A and B exchanged
*     and A negated (the negation is visible to the caller).
*
      A = -A
      Q = DLADIV2( B, A, C, D, RATIO, RDENOM )
*
      RETURN
*
*     End of DLADIV1
*

◆ dladiv2()

double precision function dladiv2	(	double precision	a,
		double precision	b,
		double precision	c,
		double precision	d,
		double precision	r,
		double precision	t )

Definition at line 215 of file dladiv.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      DOUBLE PRECISION   A, B, C, D, R, T
*     ..
*
*  =====================================================================
*
*     Helper for DLADIV1.  Returns ( A + B*R )*T, choosing among three
*     algebraically equivalent forms depending on whether R or the
*     product B*R is exactly zero.
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO
      PARAMETER          ( ZERO = 0.0D0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   PROD
*     ..
*     .. Executable Statements ..
*
      IF( R.EQ.ZERO ) THEN
*
*        R is zero: form the correction term as D*( B/C ) instead.
*
         DLADIV2 = ( A + D*( B / C ) )*T
      ELSE
         PROD = B*R
         IF( PROD.EQ.ZERO ) THEN
*
*           B*R is zero although R is not: multiply by T first.
*
            DLADIV2 = A*T + ( B*T )*R
         ELSE
            DLADIV2 = ( A + PROD )*T
         END IF
      END IF
*
      RETURN
*
*     End of DLADIV2
*

◆ dlaein()

subroutine dlaein	(	logical	rightv,
		logical	noinit,
		integer	n,
		double precision, dimension( ldh, * )	h,
		integer	ldh,
		double precision	wr,
		double precision	wi,
		double precision, dimension( * )	vr,
		double precision, dimension( * )	vi,
		double precision, dimension( ldb, * )	b,
		integer	ldb,
		double precision, dimension( * )	work,
		double precision	eps3,
		double precision	smlnum,
		double precision	bignum,
		integer	info )

DLAEIN computes a specified right or left eigenvector of an upper Hessenberg matrix by inverse iteration.

Download DLAEIN + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAEIN uses inverse iteration to find a right or left eigenvector
!> corresponding to the eigenvalue (WR,WI) of a real upper Hessenberg
!> matrix H.
!>

Parameters

[in]	RIGHTV	!> RIGHTV is LOGICAL !> = .TRUE. : compute right eigenvector; !> = .FALSE.: compute left eigenvector. !>
[in]	NOINIT	!> NOINIT is LOGICAL !> = .TRUE. : no initial vector supplied in (VR,VI). !> = .FALSE.: initial vector supplied in (VR,VI). !>
[in]	N	!> N is INTEGER !> The order of the matrix H. N >= 0. !>
[in]	H	!> H is DOUBLE PRECISION array, dimension (LDH,N) !> The upper Hessenberg matrix H. !>
[in]	LDH	!> LDH is INTEGER !> The leading dimension of the array H. LDH >= max(1,N). !>
[in]	WR	!> WR is DOUBLE PRECISION !>
[in]	WI	!> WI is DOUBLE PRECISION !> The real and imaginary parts of the eigenvalue of H whose !> corresponding right or left eigenvector is to be computed. !>
[in,out]	VR	!> VR is DOUBLE PRECISION array, dimension (N) !>
[in,out]	VI	!> VI is DOUBLE PRECISION array, dimension (N) !> On entry, if NOINIT = .FALSE. and WI = 0.0, VR must contain !> a real starting vector for inverse iteration using the real !> eigenvalue WR; if NOINIT = .FALSE. and WI.ne.0.0, VR and VI !> must contain the real and imaginary parts of a complex !> starting vector for inverse iteration using the complex !> eigenvalue (WR,WI); otherwise VR and VI need not be set. !> On exit, if WI = 0.0 (real eigenvalue), VR contains the !> computed real eigenvector; if WI.ne.0.0 (complex eigenvalue), !> VR and VI contain the real and imaginary parts of the !> computed complex eigenvector. The eigenvector is normalized !> so that the component of largest magnitude has magnitude 1; !> here the magnitude of a complex number (x,y) is taken to be !> |x| + |y|. !> VI is not referenced if WI = 0.0. !>
[out]	B	!> B is DOUBLE PRECISION array, dimension (LDB,N) !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= N+1. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (N) !>
[in]	EPS3	!> EPS3 is DOUBLE PRECISION !> A small machine-dependent value which is used to perturb !> close eigenvalues, and to replace zero pivots. !>
[in]	SMLNUM	!> SMLNUM is DOUBLE PRECISION !> A machine-dependent value close to the underflow threshold. !>
[in]	BIGNUM	!> BIGNUM is DOUBLE PRECISION !> A machine-dependent value close to the overflow threshold. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> = 1: inverse iteration did not converge; VR is set to the !> last iterate, and so is VI if WI.ne.0.0. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 170 of file dlaein.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      LOGICAL            NOINIT, RIGHTV
      INTEGER            INFO, LDB, LDH, N
      DOUBLE PRECISION   BIGNUM, EPS3, SMLNUM, WI, WR
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   B( LDB, * ), H( LDH, * ), VI( * ), VR( * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     Outline:
*       1. Copy the upper triangle of H - WR*I into B.
*       2. Set or rescale the starting vector.
*       3. Factor B in place (LU for a right eigenvector, UL for a left
*          one), taking the subdiagonal entries directly from H.
*       4. Solve with the triangular factor up to N times, replacing
*          the starting vector after each attempt that fails the
*          growth test; INFO = 1 if every attempt fails.
*       5. Normalize the resulting vector.
*     The WI = 0 branch works in real arithmetic and solves with
*     DLATRS; the WI.ne.0 branch carries real and imaginary parts
*     separately and performs the triangular solve inline.
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE, TENTH
      parameter( zero = 0.0d+0, one = 1.0d+0, tenth = 1.0d-1 )
*     ..
*     .. Local Scalars ..
      CHARACTER          NORMIN, TRANS
      INTEGER            I, I1, I2, I3, IERR, ITS, J
      DOUBLE PRECISION   ABSBII, ABSBJJ, EI, EJ, GROWTO, NORM, NRMSML,
     $                   REC, ROOTN, SCALE, TEMP, VCRIT, VMAX, VNORM, W,
     $                   W1, X, XI, XR, Y
*     ..
*     .. External Functions ..
      INTEGER            IDAMAX
      DOUBLE PRECISION   DASUM, DLAPY2, DNRM2
      EXTERNAL           idamax, dasum, dlapy2, dnrm2
*     ..
*     .. External Subroutines ..
      EXTERNAL           dladiv, dlatrs, dscal
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, dble, max, sqrt
*     ..
*     .. Executable Statements ..
*
      info = 0
*
*     GROWTO is the threshold used in the acceptance test for an
*     eigenvector.
*
*     NRMSML is the floor applied to the norm of a supplied starting
*     vector when it is rescaled below.
*
      rootn = sqrt( dble( n ) )
      growto = tenth / rootn
      nrmsml = max( one, eps3*rootn )*smlnum
*
*     Form B = H - (WR,WI)*I (except that the subdiagonal elements and
*     the imaginary parts of the diagonal elements are not stored).
*
      DO 20 j = 1, n
         DO 10 i = 1, j - 1
            b( i, j ) = h( i, j )
   10    CONTINUE
         b( j, j ) = h( j, j ) - wr
   20 CONTINUE
*
      IF( wi.EQ.zero ) THEN
*
*        Real eigenvalue.
*
         IF( noinit ) THEN
*
*           Set initial vector.
*
            DO 30 i = 1, n
               vr( i ) = eps3
   30       CONTINUE
         ELSE
*
*           Scale supplied initial vector.
*
            vnorm = dnrm2( n, vr, 1 )
            CALL dscal( n, ( eps3*rootn ) / max( vnorm, nrmsml ), vr,
     $                  1 )
         END IF
*
         IF( rightv ) THEN
*
*           LU decomposition with partial pivoting of B, replacing zero
*           pivots by EPS3.
*
            DO 60 i = 1, n - 1
*              EI is the subdiagonal entry below the pivot; it is read
*              from H because B holds only the upper triangle.
               ei = h( i+1, i )
               IF( abs( b( i, i ) ).LT.abs( ei ) ) THEN
*
*                 Interchange rows and eliminate.
*
                  x = b( i, i ) / ei
                  b( i, i ) = ei
                  DO 40 j = i + 1, n
                     temp = b( i+1, j )
                     b( i+1, j ) = b( i, j ) - x*temp
                     b( i, j ) = temp
   40             CONTINUE
               ELSE
*
*                 Eliminate without interchange.
*
                  IF( b( i, i ).EQ.zero )
     $               b( i, i ) = eps3
                  x = ei / b( i, i )
                  IF( x.NE.zero ) THEN
                     DO 50 j = i + 1, n
                        b( i+1, j ) = b( i+1, j ) - x*b( i, j )
   50                CONTINUE
                  END IF
               END IF
   60       CONTINUE
            IF( b( n, n ).EQ.zero )
     $         b( n, n ) = eps3
*
            trans = 'N'
*
         ELSE
*
*           UL decomposition with partial pivoting of B, replacing zero
*           pivots by EPS3.
*
            DO 90 j = n, 2, -1
*              EJ is the subdiagonal entry to the left of the pivot,
*              again read from H.
               ej = h( j, j-1 )
               IF( abs( b( j, j ) ).LT.abs( ej ) ) THEN
*
*                 Interchange columns and eliminate.
*
                  x = b( j, j ) / ej
                  b( j, j ) = ej
                  DO 70 i = 1, j - 1
                     temp = b( i, j-1 )
                     b( i, j-1 ) = b( i, j ) - x*temp
                     b( i, j ) = temp
   70             CONTINUE
               ELSE
*
*                 Eliminate without interchange.
*
                  IF( b( j, j ).EQ.zero )
     $               b( j, j ) = eps3
                  x = ej / b( j, j )
                  IF( x.NE.zero ) THEN
                     DO 80 i = 1, j - 1
                        b( i, j-1 ) = b( i, j-1 ) - x*b( i, j )
   80                CONTINUE
                  END IF
               END IF
   90       CONTINUE
            IF( b( 1, 1 ).EQ.zero )
     $         b( 1, 1 ) = eps3
*
            trans = 'T'
*
         END IF
*
*        NORMIN = 'N' on the first DLATRS call only; it is switched to
*        'Y' afterwards so later calls receive WORK as left by the
*        first one.
*
         normin = 'N'
         DO 110 its = 1, n
*
*           Solve U*x = scale*v for a right eigenvector
*             or U**T*x = scale*v for a left eigenvector,
*           overwriting x on v.
*
            CALL dlatrs( 'Upper', trans, 'Nonunit', normin, n, b, ldb,
     $                   vr, scale, work, ierr )
            normin = 'Y'
*
*           Test for sufficient growth in the norm of v.
*
            vnorm = dasum( n, vr, 1 )
            IF( vnorm.GE.growto*scale )
     $         GO TO 120
*
*           Choose new orthogonal starting vector and try again.
*
*           The new vector has EPS3 in position 1 and TEMP elsewhere,
*           with EPS3*ROOTN subtracted from component N-ITS+1, so a
*           different component is lowered on each pass.
*
            temp = eps3 / ( rootn+one )
            vr( 1 ) = eps3
            DO 100 i = 2, n
               vr( i ) = temp
  100       CONTINUE
            vr( n-its+1 ) = vr( n-its+1 ) - eps3*rootn
  110    CONTINUE
*
*        Failure to find eigenvector in N iterations.
*
         info = 1
*
  120    CONTINUE
*
*        Normalize eigenvector.
*
*        The vector is divided by the magnitude of the entry selected
*        by IDAMAX.
*
         i = idamax( n, vr, 1 )
         CALL dscal( n, one / abs( vr( i ) ), vr, 1 )
      ELSE
*
*        Complex eigenvalue.
*
         IF( noinit ) THEN
*
*           Set initial vector.
*
            DO 130 i = 1, n
               vr( i ) = eps3
               vi( i ) = zero
  130       CONTINUE
         ELSE
*
*           Scale supplied initial vector.
*
            norm = dlapy2( dnrm2( n, vr, 1 ), dnrm2( n, vi, 1 ) )
            rec = ( eps3*rootn ) / max( norm, nrmsml )
            CALL dscal( n, rec, vr, 1 )
            CALL dscal( n, rec, vi, 1 )
         END IF
*
         IF( rightv ) THEN
*
*           LU decomposition with partial pivoting of B, replacing zero
*           pivots by EPS3.
*
*           The imaginary part of the (i,j)-th element of U is stored in
*           B(j+1,i).
*
*           Initialise the imaginary parts of the first row: -WI on the
*           diagonal, zero elsewhere.  Row N+1 of B is written here,
*           which is why LDB must be at least N+1.
*
            b( 2, 1 ) = -wi
            DO 140 i = 2, n
               b( i+1, 1 ) = zero
  140       CONTINUE
*
            DO 170 i = 1, n - 1
*              ABSBII is the modulus of the complex pivot.
               absbii = dlapy2( b( i, i ), b( i+1, i ) )
               ei = h( i+1, i )
               IF( absbii.LT.abs( ei ) ) THEN
*
*                 Interchange rows and eliminate.
*
*                 (XR,XI) is the complex multiplier pivot/EI.
*
                  xr = b( i, i ) / ei
                  xi = b( i+1, i ) / ei
                  b( i, i ) = ei
                  b( i+1, i ) = zero
                  DO 150 j = i + 1, n
                     temp = b( i+1, j )
                     b( i+1, j ) = b( i, j ) - xr*temp
                     b( j+1, i+1 ) = b( j+1, i ) - xi*temp
                     b( i, j ) = temp
                     b( j+1, i ) = zero
  150             CONTINUE
*                 Account for the -i*WI diagonal term of the row that
*                 was swapped in, which is not held in B.
                  b( i+2, i ) = -wi
                  b( i+1, i+1 ) = b( i+1, i+1 ) - xi*wi
                  b( i+2, i+1 ) = b( i+2, i+1 ) + xr*wi
               ELSE
*
*                 Eliminate without interchanging rows.
*
                  IF( absbii.EQ.zero ) THEN
                     b( i, i ) = eps3
                     b( i+1, i ) = zero
                     absbii = eps3
                  END IF
*                 (XR,XI) = EI / pivot, formed as EI*conjg(pivot)
*                 divided by ABSBII**2 in two steps.
                  ei = ( ei / absbii ) / absbii
                  xr = b( i, i )*ei
                  xi = -b( i+1, i )*ei
                  DO 160 j = i + 1, n
                     b( i+1, j ) = b( i+1, j ) - xr*b( i, j ) +
     $                             xi*b( j+1, i )
                     b( j+1, i+1 ) = -xr*b( j+1, i ) - xi*b( i, j )
  160             CONTINUE
                  b( i+2, i+1 ) = b( i+2, i+1 ) - wi
               END IF
*
*              Compute 1-norm of offdiagonal elements of i-th row.
*
               work( i ) = dasum( n-i, b( i, i+1 ), ldb ) +
     $                     dasum( n-i, b( i+2, i ), 1 )
  170       CONTINUE
            IF( b( n, n ).EQ.zero .AND. b( n+1, n ).EQ.zero )
     $         b( n, n ) = eps3
            work( n ) = zero
*
*           Back substitution order for the solve below: I = N,...,1.
*
            i1 = n
            i2 = 1
            i3 = -1
         ELSE
*
*           UL decomposition with partial pivoting of conjg(B),
*           replacing zero pivots by EPS3.
*
*           The imaginary part of the (i,j)-th element of U is stored in
*           B(j+1,i).
*
*           Initialise the imaginary parts of the last column: +WI on
*           the diagonal (conjugate), zero elsewhere.
*
            b( n+1, n ) = wi
            DO 180 j = 1, n - 1
               b( n+1, j ) = zero
  180       CONTINUE
*
            DO 210 j = n, 2, -1
               ej = h( j, j-1 )
*              ABSBJJ is the modulus of the complex pivot.
               absbjj = dlapy2( b( j, j ), b( j+1, j ) )
               IF( absbjj.LT.abs( ej ) ) THEN
*
*                 Interchange columns and eliminate
*
                  xr = b( j, j ) / ej
                  xi = b( j+1, j ) / ej
                  b( j, j ) = ej
                  b( j+1, j ) = zero
                  DO 190 i = 1, j - 1
                     temp = b( i, j-1 )
                     b( i, j-1 ) = b( i, j ) - xr*temp
                     b( j, i ) = b( j+1, i ) - xi*temp
                     b( i, j ) = temp
                     b( j+1, i ) = zero
  190             CONTINUE
                  b( j+1, j-1 ) = wi
                  b( j-1, j-1 ) = b( j-1, j-1 ) + xi*wi
                  b( j, j-1 ) = b( j, j-1 ) - xr*wi
               ELSE
*
*                 Eliminate without interchange.
*
                  IF( absbjj.EQ.zero ) THEN
                     b( j, j ) = eps3
                     b( j+1, j ) = zero
                     absbjj = eps3
                  END IF
                  ej = ( ej / absbjj ) / absbjj
                  xr = b( j, j )*ej
                  xi = -b( j+1, j )*ej
                  DO 200 i = 1, j - 1
                     b( i, j-1 ) = b( i, j-1 ) - xr*b( i, j ) +
     $                             xi*b( j+1, i )
                     b( j, i ) = -xr*b( j+1, i ) - xi*b( i, j )
  200             CONTINUE
                  b( j, j-1 ) = b( j, j-1 ) + wi
               END IF
*
*              Compute 1-norm of offdiagonal elements of j-th column.
*
               work( j ) = dasum( j-1, b( 1, j ), 1 ) +
     $                     dasum( j-1, b( j+1, 1 ), ldb )
  210       CONTINUE
            IF( b( 1, 1 ).EQ.zero .AND. b( 2, 1 ).EQ.zero )
     $         b( 1, 1 ) = eps3
            work( 1 ) = zero
*
*           Forward substitution order for the solve below: I = 1,...,N.
*
            i1 = 1
            i2 = n
            i3 = 1
         END IF
*
         DO 270 its = 1, n
*           SCALE accumulates the rescalings applied to (VR,VI) during
*           this solve; VMAX tracks the largest component computed so
*           far and VCRIT = BIGNUM/VMAX is the rescaling trigger.
            scale = one
            vmax = one
            vcrit = bignum
*
*           Solve U*(xr,xi) = scale*(vr,vi) for a right eigenvector,
*             or U**T*(xr,xi) = scale*(vr,vi) for a left eigenvector,
*           overwriting (xr,xi) on (vr,vi).
*
            DO 250 i = i1, i2, i3
*
*              Rescale the whole vector by 1/VMAX when the off-diagonal
*              norm WORK(I) exceeds VCRIT (presumably to keep the
*              update below from overflowing).
*
               IF( work( i ).GT.vcrit ) THEN
                  rec = one / vmax
                  CALL dscal( n, rec, vr, 1 )
                  CALL dscal( n, rec, vi, 1 )
                  scale = scale*rec
                  vmax = one
                  vcrit = bignum
               END IF
*
*              Subtract the contribution of the components already
*              solved for from the right-hand side entry.
*
               xr = vr( i )
               xi = vi( i )
               IF( rightv ) THEN
                  DO 220 j = i + 1, n
                     xr = xr - b( i, j )*vr( j ) + b( j+1, i )*vi( j )
                     xi = xi - b( i, j )*vi( j ) - b( j+1, i )*vr( j )
  220             CONTINUE
               ELSE
                  DO 230 j = 1, i - 1
                     xr = xr - b( j, i )*vr( j ) + b( i+1, j )*vi( j )
                     xi = xi - b( j, i )*vi( j ) - b( i+1, j )*vr( j )
  230             CONTINUE
               END IF
*
*              W is the magnitude |re| + |im| of the diagonal element.
*
               w = abs( b( i, i ) ) + abs( b( i+1, i ) )
               IF( w.GT.smlnum ) THEN
                  IF( w.LT.one ) THEN
*                    Rescale first if the quotient would exceed BIGNUM.
                     w1 = abs( xr ) + abs( xi )
                     IF( w1.GT.w*bignum ) THEN
                        rec = one / w1
                        CALL dscal( n, rec, vr, 1 )
                        CALL dscal( n, rec, vi, 1 )
                        xr = vr( i )
                        xi = vi( i )
                        scale = scale*rec
                        vmax = vmax*rec
                     END IF
                  END IF
*
*                 Divide by diagonal element of B.
*
                  CALL dladiv( xr, xi, b( i, i ), b( i+1, i ), vr( i ),
     $                         vi( i ) )
                  vmax = max( abs( vr( i ) )+abs( vi( i ) ), vmax )
                  vcrit = bignum / vmax
               ELSE
*
*                 Diagonal element no larger than SMLNUM: replace the
*                 iterate by a vector whose only nonzero entry is
*                 (1,1) in position I and set SCALE to zero, so the
*                 growth test below compares VNORM with zero.
*
                  DO 240 j = 1, n
                     vr( j ) = zero
                     vi( j ) = zero
  240             CONTINUE
                  vr( i ) = one
                  vi( i ) = one
                  scale = zero
                  vmax = one
                  vcrit = bignum
               END IF
  250       CONTINUE
*
*           Test for sufficient growth in the norm of (VR,VI).
*
            vnorm = dasum( n, vr, 1 ) + dasum( n, vi, 1 )
            IF( vnorm.GE.growto*scale )
     $         GO TO 280
*
*           Choose a new orthogonal starting vector and try again.
*
*           Same construction as in the real case, with zero imaginary
*           part.
*
            y = eps3 / ( rootn+one )
            vr( 1 ) = eps3
            vi( 1 ) = zero
*
            DO 260 i = 2, n
               vr( i ) = y
               vi( i ) = zero
  260       CONTINUE
            vr( n-its+1 ) = vr( n-its+1 ) - eps3*rootn
  270    CONTINUE
*
*        Failure to find eigenvector in N iterations
*
         info = 1
*
  280    CONTINUE
*
*        Normalize eigenvector.
*
*        The scaling uses the largest |VR(I)| + |VI(I)|.
*
         vnorm = zero
         DO 290 i = 1, n
            vnorm = max( vnorm, abs( vr( i ) )+abs( vi( i ) ) )
  290    CONTINUE
         CALL dscal( n, one / vnorm, vr, 1 )
         CALL dscal( n, one / vnorm, vi, 1 )
*
      END IF
*
      RETURN
*
*     End of DLAEIN
*

◆ dlaexc()

subroutine dlaexc	(	logical	wantq,
		integer	n,
		double precision, dimension( ldt, * )	t,
		integer	ldt,
		double precision, dimension( ldq, * )	q,
		integer	ldq,
		integer	j1,
		integer	n1,
		integer	n2,
		double precision, dimension( * )	work,
		integer	info )

DLAEXC swaps adjacent diagonal blocks of a real upper quasi-triangular matrix in Schur canonical form, by an orthogonal similarity transformation.

Download DLAEXC + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAEXC swaps adjacent diagonal blocks T11 and T22 of order 1 or 2 in
!> an upper quasi-triangular matrix T by an orthogonal similarity
!> transformation.
!>
!> T must be in Schur canonical form, that is, block upper triangular
!> with 1-by-1 and 2-by-2 diagonal blocks; each 2-by-2 diagonal block
!> has its diagonal elements equal and its off-diagonal elements of
!> opposite sign.
!>

Parameters

[in]	WANTQ	!> WANTQ is LOGICAL !> = .TRUE. : accumulate the transformation in the matrix Q; !> = .FALSE.: do not accumulate the transformation. !>
[in]	N	!> N is INTEGER !> The order of the matrix T. N >= 0. !>
[in,out]	T	!> T is DOUBLE PRECISION array, dimension (LDT,N) !> On entry, the upper quasi-triangular matrix T, in Schur !> canonical form. !> On exit, the updated matrix T, again in Schur canonical form. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= max(1,N). !>
[in,out]	Q	!> Q is DOUBLE PRECISION array, dimension (LDQ,N) !> On entry, if WANTQ is .TRUE., the orthogonal matrix Q. !> On exit, if WANTQ is .TRUE., the updated matrix Q. !> If WANTQ is .FALSE., Q is not referenced. !>
[in]	LDQ	!> LDQ is INTEGER !> The leading dimension of the array Q. !> LDQ >= 1; and if WANTQ is .TRUE., LDQ >= N. !>
[in]	J1	!> J1 is INTEGER !> The index of the first row of the first block T11. !>
[in]	N1	!> N1 is INTEGER !> The order of the first block T11. N1 = 0, 1 or 2. !>
[in]	N2	!> N2 is INTEGER !> The order of the second block T22. N2 = 0, 1 or 2. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> = 1: the transformed matrix T would be too far from Schur !> form; the blocks are not swapped and T and Q are !> unchanged. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 136 of file dlaexc.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      LOGICAL            WANTQ
      INTEGER            INFO, J1, LDQ, LDT, N, N1, N2
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   Q( LDQ, * ), T( LDT, * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d+0, one = 1.0d+0 )
      DOUBLE PRECISION   TEN
      parameter( ten = 1.0d+1 )
      INTEGER            LDD, LDX
      parameter( ldd = 4, ldx = 2 )
*     ..
*     .. Local Scalars ..
      INTEGER            IERR, J2, J3, J4, K, ND
      DOUBLE PRECISION   CS, DNORM, EPS, SCALE, SMLNUM, SN, T11, T22,
     $                   T33, TAU, TAU1, TAU2, TEMP, THRESH, WI1, WI2,
     $                   WR1, WR2, XNORM
*     ..
*     .. Local Arrays ..
      DOUBLE PRECISION   D( LDD, 4 ), U( 3 ), U1( 3 ), U2( 3 ),
     $                   X( LDX, 2 )
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH, DLANGE
      EXTERNAL           dlamch, dlange
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlacpy, dlanv2, dlarfg, dlarfx, dlartg, dlasy2,
     $                   drot
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max
*     ..
*     .. Executable Statements ..
*
      info = 0
*
*     Quick return if possible
*
      IF( n.EQ.0 .OR. n1.EQ.0 .OR. n2.EQ.0 )
     $   RETURN
      IF( j1+n1.GT.n )
     $   RETURN
*
      j2 = j1 + 1
      j3 = j1 + 2
      j4 = j1 + 3
*
      IF( n1.EQ.1 .AND. n2.EQ.1 ) THEN
*
*        Swap two 1-by-1 blocks.
*
         t11 = t( j1, j1 )
         t22 = t( j2, j2 )
*
*        Determine the transformation to perform the interchange.
*
         CALL dlartg( t( j1, j2 ), t22-t11, cs, sn, temp )
*
*        Apply transformation to the matrix T.
*
         IF( j3.LE.n )
     $      CALL drot( n-j1-1, t( j1, j3 ), ldt, t( j2, j3 ), ldt, cs,
     $                 sn )
         CALL drot( j1-1, t( 1, j1 ), 1, t( 1, j2 ), 1, cs, sn )
*
         t( j1, j1 ) = t22
         t( j2, j2 ) = t11
*
         IF( wantq ) THEN
*
*           Accumulate transformation in the matrix Q.
*
            CALL drot( n, q( 1, j1 ), 1, q( 1, j2 ), 1, cs, sn )
         END IF
*
      ELSE
*
*        Swapping involves at least one 2-by-2 block.
*
*        Copy the diagonal block of order N1+N2 to the local array D
*        and compute its norm.
*
         nd = n1 + n2
         CALL dlacpy( 'Full', nd, nd, t( j1, j1 ), ldt, d, ldd )
         dnorm = dlange( 'Max', nd, nd, d, ldd, work )
*
*        Compute machine-dependent threshold for test for accepting
*        swap.
*
         eps = dlamch( 'P' )
         smlnum = dlamch( 'S' ) / eps
         thresh = max( ten*eps*dnorm, smlnum )
*
*        Solve T11*X - X*T22 = scale*T12 for X.
*
         CALL dlasy2( .false., .false., -1, n1, n2, d, ldd,
     $                d( n1+1, n1+1 ), ldd, d( 1, n1+1 ), ldd, scale, x,
     $                ldx, xnorm, ierr )
*
*        Swap the adjacent diagonal blocks.
*
         k = n1 + n1 + n2 - 3
         GO TO ( 10, 20, 30 )k
*
   10    CONTINUE
*
*        N1 = 1, N2 = 2: generate elementary reflector H so that:
*
*        ( scale, X11, X12 ) H = ( 0, 0, * )
*
         u( 1 ) = scale
         u( 2 ) = x( 1, 1 )
         u( 3 ) = x( 1, 2 )
         CALL dlarfg( 3, u( 3 ), u, 1, tau )
         u( 3 ) = one
         t11 = t( j1, j1 )
*
*        Perform swap provisionally on diagonal block in D.
*
         CALL dlarfx( 'L', 3, 3, u, tau, d, ldd, work )
         CALL dlarfx( 'R', 3, 3, u, tau, d, ldd, work )
*
*        Test whether to reject swap.
*
         IF( max( abs( d( 3, 1 ) ), abs( d( 3, 2 ) ), abs( d( 3,
     $       3 )-t11 ) ).GT.thresh )GO TO 50
*
*        Accept swap: apply transformation to the entire matrix T.
*
         CALL dlarfx( 'L', 3, n-j1+1, u, tau, t( j1, j1 ), ldt, work )
         CALL dlarfx( 'R', j2, 3, u, tau, t( 1, j1 ), ldt, work )
*
         t( j3, j1 ) = zero
         t( j3, j2 ) = zero
         t( j3, j3 ) = t11
*
         IF( wantq ) THEN
*
*           Accumulate transformation in the matrix Q.
*
            CALL dlarfx( 'R', n, 3, u, tau, q( 1, j1 ), ldq, work )
         END IF
         GO TO 40
*
   20    CONTINUE
*
*        N1 = 2, N2 = 1: generate elementary reflector H so that:
*
*        H (  -X11 ) = ( * )
*          (  -X21 ) = ( 0 )
*          ( scale ) = ( 0 )
*
         u( 1 ) = -x( 1, 1 )
         u( 2 ) = -x( 2, 1 )
         u( 3 ) = scale
         CALL dlarfg( 3, u( 1 ), u( 2 ), 1, tau )
         u( 1 ) = one
         t33 = t( j3, j3 )
*
*        Perform swap provisionally on diagonal block in D.
*
         CALL dlarfx( 'L', 3, 3, u, tau, d, ldd, work )
         CALL dlarfx( 'R', 3, 3, u, tau, d, ldd, work )
*
*        Test whether to reject swap.
*
         IF( max( abs( d( 2, 1 ) ), abs( d( 3, 1 ) ), abs( d( 1,
     $       1 )-t33 ) ).GT.thresh )GO TO 50
*
*        Accept swap: apply transformation to the entire matrix T.
*
         CALL dlarfx( 'R', j3, 3, u, tau, t( 1, j1 ), ldt, work )
         CALL dlarfx( 'L', 3, n-j1, u, tau, t( j1, j2 ), ldt, work )
*
         t( j1, j1 ) = t33
         t( j2, j1 ) = zero
         t( j3, j1 ) = zero
*
         IF( wantq ) THEN
*
*           Accumulate transformation in the matrix Q.
*
            CALL dlarfx( 'R', n, 3, u, tau, q( 1, j1 ), ldq, work )
         END IF
         GO TO 40
*
   30    CONTINUE
*
*        N1 = 2, N2 = 2: generate elementary reflectors H(1) and H(2) so
*        that:
*
*        H(2) H(1) (  -X11  -X12 ) = (  *  * )
*                  (  -X21  -X22 )   (  0  * )
*                  ( scale    0  )   (  0  0 )
*                  (    0  scale )   (  0  0 )
*
         u1( 1 ) = -x( 1, 1 )
         u1( 2 ) = -x( 2, 1 )
         u1( 3 ) = scale
         CALL dlarfg( 3, u1( 1 ), u1( 2 ), 1, tau1 )
         u1( 1 ) = one
*
         temp = -tau1*( x( 1, 2 )+u1( 2 )*x( 2, 2 ) )
         u2( 1 ) = -temp*u1( 2 ) - x( 2, 2 )
         u2( 2 ) = -temp*u1( 3 )
         u2( 3 ) = scale
         CALL dlarfg( 3, u2( 1 ), u2( 2 ), 1, tau2 )
         u2( 1 ) = one
*
*        Perform swap provisionally on diagonal block in D.
*
         CALL dlarfx( 'L', 3, 4, u1, tau1, d, ldd, work )
         CALL dlarfx( 'R', 4, 3, u1, tau1, d, ldd, work )
         CALL dlarfx( 'L', 3, 4, u2, tau2, d( 2, 1 ), ldd, work )
         CALL dlarfx( 'R', 4, 3, u2, tau2, d( 1, 2 ), ldd, work )
*
*        Test whether to reject swap.
*
         IF( max( abs( d( 3, 1 ) ), abs( d( 3, 2 ) ), abs( d( 4, 1 ) ),
     $       abs( d( 4, 2 ) ) ).GT.thresh )GO TO 50
*
*        Accept swap: apply transformation to the entire matrix T.
*
         CALL dlarfx( 'L', 3, n-j1+1, u1, tau1, t( j1, j1 ), ldt, work )
         CALL dlarfx( 'R', j4, 3, u1, tau1, t( 1, j1 ), ldt, work )
         CALL dlarfx( 'L', 3, n-j1+1, u2, tau2, t( j2, j1 ), ldt, work )
         CALL dlarfx( 'R', j4, 3, u2, tau2, t( 1, j2 ), ldt, work )
*
         t( j3, j1 ) = zero
         t( j3, j2 ) = zero
         t( j4, j1 ) = zero
         t( j4, j2 ) = zero
*
         IF( wantq ) THEN
*
*           Accumulate transformation in the matrix Q.
*
            CALL dlarfx( 'R', n, 3, u1, tau1, q( 1, j1 ), ldq, work )
            CALL dlarfx( 'R', n, 3, u2, tau2, q( 1, j2 ), ldq, work )
         END IF
*
   40    CONTINUE
*
         IF( n2.EQ.2 ) THEN
*
*           Standardize new 2-by-2 block T11
*
            CALL dlanv2( t( j1, j1 ), t( j1, j2 ), t( j2, j1 ),
     $                   t( j2, j2 ), wr1, wi1, wr2, wi2, cs, sn )
            CALL drot( n-j1-1, t( j1, j1+2 ), ldt, t( j2, j1+2 ), ldt,
     $                 cs, sn )
            CALL drot( j1-1, t( 1, j1 ), 1, t( 1, j2 ), 1, cs, sn )
            IF( wantq )
     $         CALL drot( n, q( 1, j1 ), 1, q( 1, j2 ), 1, cs, sn )
         END IF
*
         IF( n1.EQ.2 ) THEN
*
*           Standardize new 2-by-2 block T22
*
            j3 = j1 + n2
            j4 = j3 + 1
            CALL dlanv2( t( j3, j3 ), t( j3, j4 ), t( j4, j3 ),
     $                   t( j4, j4 ), wr1, wi1, wr2, wi2, cs, sn )
            IF( j3+2.LE.n )
     $         CALL drot( n-j3-1, t( j3, j3+2 ), ldt, t( j4, j3+2 ),
     $                    ldt, cs, sn )
            CALL drot( j3-1, t( 1, j3 ), 1, t( 1, j4 ), 1, cs, sn )
            IF( wantq )
     $         CALL drot( n, q( 1, j3 ), 1, q( 1, j4 ), 1, cs, sn )
         END IF
*
      END IF
      RETURN
*
*     Exit with INFO = 1 if swap was rejected.
*
   50 CONTINUE
      info = 1
      RETURN
*
*     End of DLAEXC
*

◆ dlag2()

subroutine dlag2	(	double precision, dimension( lda, * )	a,
		integer	lda,
		double precision, dimension( ldb, * )	b,
		integer	ldb,
		double precision	safmin,
		double precision	scale1,
		double precision	scale2,
		double precision	wr1,
		double precision	wr2,
		double precision	wi )

DLAG2 computes the eigenvalues of a 2-by-2 generalized eigenvalue problem, with scaling as necessary to avoid over-/underflow.

Download DLAG2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAG2 computes the eigenvalues of a 2 x 2 generalized eigenvalue
!> problem  A - w B, with scaling as necessary to avoid over-/underflow.
!>
!> The scaling factor "s" results in a modified eigenvalue equation
!>
!>     s A - w B
!>
!> where  s  is a non-negative scaling factor chosen so that  w,  w B,
!> and  s A  do not overflow and, if possible, do not underflow, either.
!>

Parameters

[in]	A	!> A is DOUBLE PRECISION array, dimension (LDA, 2) !> On entry, the 2 x 2 matrix A. It is assumed that its 1-norm !> is less than 1/SAFMIN. Entries less than !> sqrt(SAFMIN)*norm(A) are subject to being treated as zero. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= 2. !>
[in]	B	!> B is DOUBLE PRECISION array, dimension (LDB, 2) !> On entry, the 2 x 2 upper triangular matrix B. It is !> assumed that the one-norm of B is less than 1/SAFMIN. The !> diagonals should be at least sqrt(SAFMIN) times the largest !> element of B (in absolute value); if a diagonal is smaller !> than that, then +/- sqrt(SAFMIN) will be used instead of !> that diagonal. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= 2. !>
[in]	SAFMIN	!> SAFMIN is DOUBLE PRECISION !> The smallest positive number s.t. 1/SAFMIN does not !> overflow. (This should always be DLAMCH('S') -- it is an !> argument in order to avoid having to call DLAMCH frequently.) !>
[out]	SCALE1	!> SCALE1 is DOUBLE PRECISION !> A scaling factor used to avoid over-/underflow in the !> eigenvalue equation which defines the first eigenvalue. If !> the eigenvalues are complex, then the eigenvalues are !> ( WR1 +/- WI i ) / SCALE1 (which may lie outside the !> exponent range of the machine), SCALE1=SCALE2, and SCALE1 !> will always be positive. If the eigenvalues are real, then !> the first (real) eigenvalue is WR1 / SCALE1 , but this may !> overflow or underflow, and in fact, SCALE1 may be zero or !> less than the underflow threshold if the exact eigenvalue !> is sufficiently large. !>
[out]	SCALE2	!> SCALE2 is DOUBLE PRECISION !> A scaling factor used to avoid over-/underflow in the !> eigenvalue equation which defines the second eigenvalue. If !> the eigenvalues are complex, then SCALE2=SCALE1. If the !> eigenvalues are real, then the second (real) eigenvalue is !> WR2 / SCALE2 , but this may overflow or underflow, and in !> fact, SCALE2 may be zero or less than the underflow !> threshold if the exact eigenvalue is sufficiently large. !>
[out]	WR1	!> WR1 is DOUBLE PRECISION !> If the eigenvalue is real, then WR1 is SCALE1 times the !> eigenvalue closest to the (2,2) element of A B**(-1). If the !> eigenvalue is complex, then WR1=WR2 is SCALE1 times the real !> part of the eigenvalues. !>
[out]	WR2	!> WR2 is DOUBLE PRECISION !> If the eigenvalue is real, then WR2 is SCALE2 times the !> other eigenvalue. If the eigenvalue is complex, then !> WR1=WR2 is SCALE1 times the real part of the eigenvalues. !>
[out]	WI	!> WI is DOUBLE PRECISION !> If the eigenvalue is real, then WI is zero. If the !> eigenvalue is complex, then WI is SCALE1 times the imaginary !> part of the eigenvalues. WI will always be non-negative. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 154 of file dlag2.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLAG2: eigenvalues of the 2-by-2 pencil  A - w B  (B upper
*     triangular), returned as the scaled pairs (WR1,SCALE1) and
*     (WR2,SCALE2) together with the imaginary part WI.
*     Only A(1:2,1:2), B(1,1), B(1,2) and B(2,2) are read; neither A
*     nor B is written.
*
*     .. Scalar Arguments ..
      INTEGER            LDA, LDB
      DOUBLE PRECISION   SAFMIN, SCALE1, SCALE2, WI, WR1, WR2
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * ), B( LDB, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE, TWO
      parameter( zero = 0.0d+0, one = 1.0d+0, two = 2.0d+0 )
      DOUBLE PRECISION   HALF
      parameter( half = one / two )
*     FUZZY1 is a safety factor slightly above one, applied to the
*     (WABS*C2+C3) lower bound on WSIZE further down.
      DOUBLE PRECISION   FUZZY1
      parameter( fuzzy1 = one+1.0d-5 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   A11, A12, A21, A22, ABI22, ANORM, AS11, AS12,
     $                   AS22, ASCALE, B11, B12, B22, BINV11, BINV22,
     $                   BMIN, BNORM, BSCALE, BSIZE, C1, C2, C3, C4, C5,
     $                   DIFF, DISCR, PP, QQ, R, RTMAX, RTMIN, S1, S2,
     $                   SAFMAX, SHIFT, SS, SUM, WABS, WBIG, WDET,
     $                   WSCALE, WSIZE, WSMALL
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sign, sqrt
*     ..
*     .. Executable Statements ..
*
*     Thresholds derived from SAFMIN: its square root and the two
*     reciprocals.  They are used below to rescale the discriminant.
*
      rtmin = sqrt( safmin )
      rtmax = one / rtmin
      safmax = one / safmin
*
*     Scale A
*
*     ANORM is the larger absolute column sum of A, floored at SAFMIN
*     so that the reciprocal ASCALE never divides by zero.  A11..A22
*     hold the entries of A multiplied by ASCALE.
*
      anorm = max( abs( a( 1, 1 ) )+abs( a( 2, 1 ) ),
     $        abs( a( 1, 2 ) )+abs( a( 2, 2 ) ), safmin )
      ascale = one / anorm
      a11 = ascale*a( 1, 1 )
      a21 = ascale*a( 2, 1 )
      a12 = ascale*a( 1, 2 )
      a22 = ascale*a( 2, 2 )
*
*     Perturb B if necessary to insure non-singularity
*
*     A diagonal entry of B smaller in magnitude than BMIN is replaced
*     by BMIN carrying the sign of the original entry.
*
      b11 = b( 1, 1 )
      b12 = b( 1, 2 )
      b22 = b( 2, 2 )
      bmin = rtmin*max( abs( b11 ), abs( b12 ), abs( b22 ), rtmin )
      IF( abs( b11 ).LT.bmin )
     $   b11 = sign( bmin, b11 )
      IF( abs( b22 ).LT.bmin )
     $   b22 = sign( bmin, b22 )
*
*     Scale B
*
*     BNORM is the larger absolute column sum of the (perturbed) upper
*     triangular B; BSIZE is the larger diagonal magnitude.  B is
*     divided by BSIZE; BNORM keeps the unscaled value for C2 below.
*
      bnorm = max( abs( b11 ), abs( b12 )+abs( b22 ), safmin )
      bsize = max( abs( b11 ), abs( b22 ) )
      bscale = one / bsize
      b11 = b11*bscale
      b12 = b12*bscale
      b22 = b22*bscale
*
*     Compute larger eigenvalue by method described by C. van Loan
*
*     ( AS is A shifted by -SHIFT*B )
*
*     The shift is whichever of S1 = A11/B11 and S2 = A22/B22 is
*     smaller in magnitude (S1 on a tie).
*
      binv11 = one / b11
      binv22 = one / b22
      s1 = a11*binv11
      s2 = a22*binv22
      IF( abs( s1 ).LE.abs( s2 ) ) THEN
         as12 = a12 - s1*b12
         as22 = a22 - s1*b22
         ss = a21*( binv11*binv22 )
         abi22 = as22*binv22 - ss*b12
         pp = half*abi22
         shift = s1
      ELSE
         as12 = a12 - s2*b12
         as11 = a11 - s2*b11
         ss = a21*( binv11*binv22 )
         abi22 = -ss*b12
         pp = half*( as11*binv11+abi22 )
         shift = s2
      END IF
      qq = ss*as12
*
*     DISCR carries the sign of PP**2 + QQ and R = sqrt(|PP**2 + QQ|).
*     DISCR is formed scaled by SAFMIN when |PP|*RTMIN >= 1, scaled by
*     SAFMAX when PP**2 + |QQ| <= SAFMIN, and unscaled otherwise; the
*     RTMAX / RTMIN factor applied to R undoes that scaling.
*
      IF( abs( pp*rtmin ).GE.one ) THEN
         discr = ( rtmin*pp )**2 + qq*safmin
         r = sqrt( abs( discr ) )*rtmax
      ELSE
         IF( pp**2+abs( qq ).LE.safmin ) THEN
            discr = ( rtmax*pp )**2 + qq*safmax
            r = sqrt( abs( discr ) )*rtmin
         ELSE
            discr = pp**2 + qq
            r = sqrt( abs( discr ) )
         END IF
      END IF
*
*     Note: the test of R in the following IF is to cover the case when
*           DISCR is small and negative and is flushed to zero during
*           the calculation of R.  On machines which have a consistent
*           flush-to-zero threshold and handle numbers above that
*           threshold correctly, it would not be necessary.
*
      IF( discr.GE.zero .OR. r.EQ.zero ) THEN
*
*        Real eigenvalues.  R is added with the sign of PP, so WBIG
*        is formed without subtracting like-signed quantities.
*
         sum = pp + sign( r, pp )
         diff = pp - sign( r, pp )
         wbig = shift + sum
*
*        Compute smaller eigenvalue
*
*        When WBIG is more than twice WSMALL in magnitude, WSMALL is
*        recomputed as WDET / WBIG, where WDET is the determinant of
*        the scaled A times BINV11*BINV22 (presumably to avoid the
*        cancellation in SHIFT + DIFF -- confirm against reference).
*
         wsmall = shift + diff
         IF( half*abs( wbig ).GT.max( abs( wsmall ), safmin ) ) THEN
            wdet = ( a11*a22-a12*a21 )*( binv11*binv22 )
            wsmall = wdet / wbig
         END IF
*
*        Choose (real) eigenvalue closest to 2,2 element of A*B**(-1)
*        for WR1.
*
         IF( pp.GT.abi22 ) THEN
            wr1 = min( wbig, wsmall )
            wr2 = max( wbig, wsmall )
         ELSE
            wr1 = max( wbig, wsmall )
            wr2 = min( wbig, wsmall )
         END IF
         wi = zero
      ELSE
*
*        Complex eigenvalues
*
         wr1 = shift + pp
         wr2 = wr1
         wi = r
      END IF
*
*     Further scaling to avoid underflow and overflow in computing
*     SCALE1 and overflow in computing w*B.
*
*     This scale factor (WSCALE) is bounded from above using C1 and C2,
*     and from below using C3 and C4.
*        C1 implements the condition  s A  must never overflow.
*        C2 implements the condition  w B  must never overflow.
*        C3, with C2,
*           implement the condition that s A - w B must never overflow.
*        C4 implements the condition  s    should not underflow.
*        C5 implements the condition  max(s,|w|) should be at least 2.
*
      c1 = bsize*( safmin*max( one, ascale ) )
      c2 = safmin*max( one, bnorm )
      c3 = bsize*safmin
      IF( ascale.LE.one .AND. bsize.LE.one ) THEN
         c4 = min( one, ( ascale / safmin )*bsize )
      ELSE
         c4 = one
      END IF
      IF( ascale.LE.one .OR. bsize.LE.one ) THEN
         c5 = min( one, ascale*bsize )
      ELSE
         c5 = one
      END IF
*
*     Scale first eigenvalue
*
*     SCALE1 is ASCALE*BSIZE*WSCALE.  WSCALE multiplies the larger of
*     ASCALE, BSIZE first when WSIZE > 1 and the smaller first
*     otherwise (presumably to keep the intermediate product in
*     range -- confirm).  For a complex pair (WI nonzero) WR2 and
*     SCALE2 are set here as well.
*
      wabs = abs( wr1 ) + abs( wi )
      wsize = max( safmin, c1, fuzzy1*( wabs*c2+c3 ),
     $        min( c4, half*max( wabs, c5 ) ) )
      IF( wsize.NE.one ) THEN
         wscale = one / wsize
         IF( wsize.GT.one ) THEN
            scale1 = ( max( ascale, bsize )*wscale )*
     $               min( ascale, bsize )
         ELSE
            scale1 = ( min( ascale, bsize )*wscale )*
     $               max( ascale, bsize )
         END IF
         wr1 = wr1*wscale
         IF( wi.NE.zero ) THEN
            wi = wi*wscale
            wr2 = wr1
            scale2 = scale1
         END IF
      ELSE
         scale1 = ascale*bsize
         scale2 = scale1
      END IF
*
*     Scale second eigenvalue (if real)
*
*     Same computation as above with |WR2| in place of WABS; it
*     overwrites SCALE2 and rescales WR2.
*
      IF( wi.EQ.zero ) THEN
         wsize = max( safmin, c1, fuzzy1*( abs( wr2 )*c2+c3 ),
     $           min( c4, half*max( abs( wr2 ), c5 ) ) )
         IF( wsize.NE.one ) THEN
            wscale = one / wsize
            IF( wsize.GT.one ) THEN
               scale2 = ( max( ascale, bsize )*wscale )*
     $                  min( ascale, bsize )
            ELSE
               scale2 = ( min( ascale, bsize )*wscale )*
     $                  max( ascale, bsize )
            END IF
            wr2 = wr2*wscale
         ELSE
            scale2 = ascale*bsize
         END IF
      END IF
*
*     End of DLAG2
*
      RETURN

◆ dlag2s()

subroutine dlag2s	(	integer	m,
		integer	n,
		double precision, dimension( lda, * )	a,
		integer	lda,
		real, dimension( ldsa, * )	sa,
		integer	ldsa,
		integer	info )

DLAG2S converts a double precision matrix to a single precision matrix.

Download DLAG2S + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAG2S converts a DOUBLE PRECISION matrix, A, to a SINGLE
!> PRECISION matrix, SA.
!>
!> RMAX is the overflow for the SINGLE PRECISION arithmetic
!> DLAG2S checks that all the entries of A are between -RMAX and
!> RMAX. If not the conversion is aborted and a flag is raised.
!>
!> This is an auxiliary routine so there is no argument checking.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> On entry, the M-by-N coefficient matrix A. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[out]	SA	!> SA is REAL array, dimension (LDSA,N) !> On exit, if INFO=0, the M-by-N coefficient matrix SA; if !> INFO>0, the content of SA is unspecified. !>
[in]	LDSA	!> LDSA is INTEGER !> The leading dimension of the array SA. LDSA >= max(1,M). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> = 1: an entry of the matrix A exceeds the SINGLE !> PRECISION overflow threshold in magnitude; in this case, the content !> of SA on exit is unspecified. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 107 of file dlag2s.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLAG2S: copies the M-by-N DOUBLE PRECISION matrix A into
*     the REAL matrix SA, column by column.
*
*     INFO = 0  every entry lay in [-RMAX, RMAX] and was converted.
*     INFO = 1  an entry outside that range was found; the routine
*               returns at once and SA is only partially written.
*
*     .. Scalar Arguments ..
      INTEGER            INFO, LDA, LDSA, M, N
*     ..
*     .. Array Arguments ..
      REAL               SA( LDSA, * )
      DOUBLE PRECISION   A( LDA, * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            I, J
      DOUBLE PRECISION   RMAX
*     ..
*     .. External Functions ..
      REAL               SLAMCH
      EXTERNAL           slamch
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          real
*     ..
*     .. Executable Statements ..
*
*     RMAX is the single precision overflow threshold, held in double
*     precision so the comparisons below are done in the precision
*     of A.
*
      rmax = slamch( 'O' )
      DO 20 j = 1, n
         DO 10 i = 1, m
            IF( ( a( i, j ).LT.-rmax ) .OR. ( a( i, j ).GT.rmax ) ) THEN
               info = 1
               GO TO 30
            END IF
*
*           Narrow explicitly rather than rely on the implicit
*           conversion performed by the assignment.
*
            sa( i, j ) = real( a( i, j ) )
   10    CONTINUE
   20 CONTINUE
      info = 0
   30 CONTINUE
      RETURN
*
*     End of DLAG2S
*

◆ dlags2()

subroutine dlags2	(	logical	upper,
		double precision	a1,
		double precision	a2,
		double precision	a3,
		double precision	b1,
		double precision	b2,
		double precision	b3,
		double precision	csu,
		double precision	snu,
		double precision	csv,
		double precision	snv,
		double precision	csq,
		double precision	snq )

DLAGS2 computes 2-by-2 orthogonal matrices U, V, and Q, and applies them to matrices A and B such that the rows of the transformed A and B are parallel.

Download DLAGS2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAGS2 computes 2-by-2 orthogonal matrices U, V and Q, such
!> that if ( UPPER ) then
!>
!>           U**T *A*Q = U**T *( A1 A2 )*Q = ( x  0  )
!>                             ( 0  A3 )     ( x  x  )
!> and
!>           V**T*B*Q = V**T *( B1 B2 )*Q = ( x  0  )
!>                            ( 0  B3 )     ( x  x  )
!>
!> or if ( .NOT.UPPER ) then
!>
!>           U**T *A*Q = U**T *( A1 0  )*Q = ( x  x  )
!>                             ( A2 A3 )     ( 0  x  )
!> and
!>           V**T*B*Q = V**T*( B1 0  )*Q = ( x  x  )
!>                           ( B2 B3 )     ( 0  x  )
!>
!> The rows of the transformed A and B are parallel, where
!>
!>   U = (  CSU  SNU ), V = (  CSV SNV ), Q = (  CSQ   SNQ )
!>       ( -SNU  CSU )      ( -SNV CSV )      ( -SNQ   CSQ )
!>
!> Z**T denotes the transpose of Z.
!>
!>

Parameters

[in]	UPPER	!> UPPER is LOGICAL !> = .TRUE.: the input matrices A and B are upper triangular. !> = .FALSE.: the input matrices A and B are lower triangular. !>
[in]	A1	!> A1 is DOUBLE PRECISION !>
[in]	A2	!> A2 is DOUBLE PRECISION !>
[in]	A3	!> A3 is DOUBLE PRECISION !> On entry, A1, A2 and A3 are elements of the input 2-by-2 !> upper (lower) triangular matrix A. !>
[in]	B1	!> B1 is DOUBLE PRECISION !>
[in]	B2	!> B2 is DOUBLE PRECISION !>
[in]	B3	!> B3 is DOUBLE PRECISION !> On entry, B1, B2 and B3 are elements of the input 2-by-2 !> upper (lower) triangular matrix B. !>
[out]	CSU	!> CSU is DOUBLE PRECISION !>
[out]	SNU	!> SNU is DOUBLE PRECISION !> The desired orthogonal matrix U. !>
[out]	CSV	!> CSV is DOUBLE PRECISION !>
[out]	SNV	!> SNV is DOUBLE PRECISION !> The desired orthogonal matrix V. !>
[out]	CSQ	!> CSQ is DOUBLE PRECISION !>
[out]	SNQ	!> SNQ is DOUBLE PRECISION !> The desired orthogonal matrix Q. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 150 of file dlags2.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLAGS2: from the entries (A1,A2,A3) and (B1,B2,B3) of
*     two 2-by-2 triangular matrices, compute the cosine/sine pairs
*     (CSU,SNU), (CSV,SNV) and (CSQ,SNQ) of the rotations U, V and Q.
*     The six input scalars are only read.
*
*     .. Scalar Arguments ..
      LOGICAL            UPPER
      DOUBLE PRECISION   A1, A2, A3, B1, B2, B3, CSQ, CSU, CSV, SNQ,
     $                   SNU, SNV
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO
      parameter( zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   A, AUA11, AUA12, AUA21, AUA22, AVB11, AVB12,
     $                   AVB21, AVB22, B, C, CSL, CSR, D, R, S1, S2,
     $                   SNL, SNR, UA11, UA11R, UA12, UA21, UA22, UA22R,
     $                   VB11, VB11R, VB12, VB21, VB22, VB22R
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlartg, dlasv2
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs
*     ..
*     .. Executable Statements ..
*
*     In every branch below, S1 and S2 (set by DLASV2) and R (set by
*     DLARTG) are outputs that this routine does not use afterwards.
*
      IF( upper ) THEN
*
*        Input matrices A and B are upper triangular matrices
*
*        Form matrix C = A*adj(B) = ( a b )
*                                   ( 0 d )
*
         a = a1*b3
         d = a3*b1
         b = a2*b1 - a1*b2
*
*        The SVD of real 2-by-2 triangular C
*
*         ( CSL -SNL )*( A B )*(  CSR  SNR ) = ( R 0 )
*         ( SNL  CSL ) ( 0 D ) ( -SNR  CSR )   ( 0 T )
*
         CALL dlasv2( a, b, d, s1, s2, snr, csr, snl, csl )
*
*        Work with the first rows of U**T*A and V**T*B when either
*        rotation has |cosine| >= |sine|; otherwise use the second
*        rows and return the swapped rotation.
*
         IF( abs( csl ).GE.abs( snl ) .OR. abs( csr ).GE.abs( snr ) )
     $        THEN
*
*           Compute the (1,1) and (1,2) elements of U**T *A and V**T *B,
*           and (1,2) element of |U|**T *|A| and |V|**T *|B|.
*
            ua11r = csl*a1
            ua12 = csl*a2 + snl*a3
*
            vb11r = csr*b1
            vb12 = csr*b2 + snr*b3
*
            aua12 = abs( csl )*abs( a2 ) + abs( snl )*abs( a3 )
            avb12 = abs( csr )*abs( b2 ) + abs( snr )*abs( b3 )
*
*           zero (1,2) elements of U**T *A and V**T *B
*
*           Q is generated from the row of A when that row is nonzero
*           and its ratio AUA12 / (|UA11R|+|UA12|) does not exceed the
*           corresponding ratio for B; otherwise from the row of B.
*           The outer test keeps the A-row ratio from being 0/0.
*
            IF( ( abs( ua11r )+abs( ua12 ) ).NE.zero ) THEN
               IF( aua12 / ( abs( ua11r )+abs( ua12 ) ).LE.avb12 /
     $             ( abs( vb11r )+abs( vb12 ) ) ) THEN
                  CALL dlartg( -ua11r, ua12, csq, snq, r )
               ELSE
                  CALL dlartg( -vb11r, vb12, csq, snq, r )
               END IF
            ELSE
               CALL dlartg( -vb11r, vb12, csq, snq, r )
            END IF
*
            csu = csl
            snu = -snl
            csv = csr
            snv = -snr
*
         ELSE
*
*           Compute the (2,1) and (2,2) elements of U**T *A and V**T *B,
*           and (2,2) element of |U|**T *|A| and |V|**T *|B|.
*
            ua21 = -snl*a1
            ua22 = -snl*a2 + csl*a3
*
            vb21 = -snr*b1
            vb22 = -snr*b2 + csr*b3
*
            aua22 = abs( snl )*abs( a2 ) + abs( csl )*abs( a3 )
            avb22 = abs( snr )*abs( b2 ) + abs( csr )*abs( b3 )
*
*           zero (2,2) elements of U**T*A and V**T*B, and then swap.
*
*           Same selection rule as above, applied to the second rows.
*
            IF( ( abs( ua21 )+abs( ua22 ) ).NE.zero ) THEN
               IF( aua22 / ( abs( ua21 )+abs( ua22 ) ).LE.avb22 /
     $             ( abs( vb21 )+abs( vb22 ) ) ) THEN
                  CALL dlartg( -ua21, ua22, csq, snq, r )
               ELSE
                  CALL dlartg( -vb21, vb22, csq, snq, r )
               END IF
            ELSE
               CALL dlartg( -vb21, vb22, csq, snq, r )
            END IF
*
*           The swap: cosine and sine exchange roles in U and V.
*
            csu = snl
            snu = csl
            csv = snr
            snv = csr
*
         END IF
*
      ELSE
*
*        Input matrices A and B are lower triangular matrices
*
*        Form matrix C = A*adj(B) = ( a 0 )
*                                   ( c d )
*
         a = a1*b3
         d = a3*b1
         c = a2*b3 - a3*b2
*
*        The SVD of real 2-by-2 triangular C
*
*         ( CSL -SNL )*( A 0 )*(  CSR  SNR ) = ( R 0 )
*         ( SNL  CSL ) ( C D ) ( -SNR  CSR )   ( 0 T )
*
         CALL dlasv2( a, c, d, s1, s2, snr, csr, snl, csl )
*
*        In this lower triangular case U is built from (CSR,SNR) and
*        V from (CSL,SNL), the reverse of the upper triangular case.
*
         IF( abs( csr ).GE.abs( snr ) .OR. abs( csl ).GE.abs( snl ) )
     $        THEN
*
*           Compute the (2,1) and (2,2) elements of U**T *A and V**T *B,
*           and (2,1) element of |U|**T *|A| and |V|**T *|B|.
*
            ua21 = -snr*a1 + csr*a2
            ua22r = csr*a3
*
            vb21 = -snl*b1 + csl*b2
            vb22r = csl*b3
*
            aua21 = abs( snr )*abs( a1 ) + abs( csr )*abs( a2 )
            avb21 = abs( snl )*abs( b1 ) + abs( csl )*abs( b2 )
*
*           zero (2,1) elements of U**T *A and V**T *B.
*
*           Q comes from the row of A when it is nonzero and its ratio
*           is the smaller one, otherwise from the row of B.
*
            IF( ( abs( ua21 )+abs( ua22r ) ).NE.zero ) THEN
               IF( aua21 / ( abs( ua21 )+abs( ua22r ) ).LE.avb21 /
     $             ( abs( vb21 )+abs( vb22r ) ) ) THEN
                  CALL dlartg( ua22r, ua21, csq, snq, r )
               ELSE
                  CALL dlartg( vb22r, vb21, csq, snq, r )
               END IF
            ELSE
               CALL dlartg( vb22r, vb21, csq, snq, r )
            END IF
*
            csu = csr
            snu = -snr
            csv = csl
            snv = -snl
*
         ELSE
*
*           Compute the (1,1) and (1,2) elements of U**T *A and V**T *B,
*           and (1,1) element of |U|**T *|A| and |V|**T *|B|.
*
            ua11 = csr*a1 + snr*a2
            ua12 = snr*a3
*
            vb11 = csl*b1 + snl*b2
            vb12 = snl*b3
*
            aua11 = abs( csr )*abs( a1 ) + abs( snr )*abs( a2 )
            avb11 = abs( csl )*abs( b1 ) + abs( snl )*abs( b2 )
*
*           zero (1,1) elements of U**T*A and V**T*B, and then swap.
*
*           Same selection rule, applied to the first rows.
*
            IF( ( abs( ua11 )+abs( ua12 ) ).NE.zero ) THEN
               IF( aua11 / ( abs( ua11 )+abs( ua12 ) ).LE.avb11 /
     $             ( abs( vb11 )+abs( vb12 ) ) ) THEN
                  CALL dlartg( ua12, ua11, csq, snq, r )
               ELSE
                  CALL dlartg( vb12, vb11, csq, snq, r )
               END IF
            ELSE
               CALL dlartg( vb12, vb11, csq, snq, r )
            END IF
*
*           The swap: cosine and sine exchange roles in U and V.
*
            csu = snr
            snu = csr
            csv = snl
            snv = csl
*
         END IF
*
      END IF
*
      RETURN
*
*     End of DLAGS2
*

◆ dlagtm()

subroutine dlagtm	(	character	trans,
		integer	n,
		integer	nrhs,
		double precision	alpha,
		double precision, dimension( * )	dl,
		double precision, dimension( * )	d,
		double precision, dimension( * )	du,
		double precision, dimension( ldx, * )	x,
		integer	ldx,
		double precision	beta,
		double precision, dimension( ldb, * )	b,
		integer	ldb )

DLAGTM performs a matrix-matrix product of the form C = αAB+βC, where A is a tridiagonal matrix, B and C are rectangular matrices, and α and β are scalars, which may be 0, 1, or -1.

Download DLAGTM + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAGTM performs a matrix-matrix product of the form
!>
!>    B := alpha * A * X + beta * B
!>
!> where A is a tridiagonal matrix of order N, B and X are N by NRHS
!> matrices, and alpha and beta are real scalars, each of which may be
!> 0., 1., or -1.
!>

Parameters

[in]	TRANS	!> TRANS is CHARACTER*1 !> Specifies the operation applied to A. !> = 'N': No transpose, B := alpha * A * X + beta * B !> = 'T': Transpose, B := alpha * A'* X + beta * B !> = 'C': Conjugate transpose = Transpose !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	NRHS	!> NRHS is INTEGER !> The number of right hand sides, i.e., the number of columns !> of the matrices X and B. !>
[in]	ALPHA	!> ALPHA is DOUBLE PRECISION !> The scalar alpha. ALPHA must be 0., 1., or -1.; otherwise, !> it is assumed to be 0. !>
[in]	DL	!> DL is DOUBLE PRECISION array, dimension (N-1) !> The (n-1) sub-diagonal elements of A. !>
[in]	D	!> D is DOUBLE PRECISION array, dimension (N) !> The diagonal elements of A. !>
[in]	DU	!> DU is DOUBLE PRECISION array, dimension (N-1) !> The (n-1) super-diagonal elements of A. !>
[in]	X	!> X is DOUBLE PRECISION array, dimension (LDX,NRHS) !> The N by NRHS matrix X. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the array X. LDX >= max(N,1). !>
[in]	BETA	!> BETA is DOUBLE PRECISION !> The scalar beta. BETA must be 0., 1., or -1.; otherwise, !> it is assumed to be 1. !>
[in,out]	B	!> B is DOUBLE PRECISION array, dimension (LDB,NRHS) !> On entry, the N by NRHS matrix B. !> On exit, B is overwritten by the matrix expression !> B := alpha * A * X + beta * B. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(N,1). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 143 of file dlagtm.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLAGTM:  B := alpha*op( A )*X + beta*B  for a tridiagonal
*     A stored as DL (sub-diagonal), D (diagonal), DU (super-diagonal),
*     with alpha and beta each restricted to 0, +1 or -1.
*
*     .. Scalar Arguments ..
      CHARACTER          TRANS
      INTEGER            LDB, LDX, N, NRHS
      DOUBLE PRECISION   ALPHA, BETA
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   B( LDB, * ), D( * ), DL( * ), DU( * ),
     $                   X( LDX, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, ZERO
      parameter( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            ADDAX, NOTRAN
      INTEGER            JC, KR
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. Executable Statements ..
*
*     An empty system needs no work.
*
      IF( n.EQ.0 ) RETURN
*
*     Apply BETA to B.  Only BETA = 0 and BETA = -1 change anything;
*     any other value leaves B as it is.
*
      IF( beta.EQ.zero ) THEN
         DO jc = 1, nrhs
            DO kr = 1, n
               b( kr, jc ) = zero
            END DO
         END DO
      ELSE IF( beta.EQ.-one ) THEN
         DO jc = 1, nrhs
            DO kr = 1, n
               b( kr, jc ) = -b( kr, jc )
            END DO
         END DO
      END IF
*
*     An ALPHA other than +1 or -1 adds nothing to B.
*
      IF( alpha.NE.one .AND. alpha.NE.-one ) RETURN
*
*     NOTRAN selects A versus A**T; ADDAX selects adding versus
*     subtracting the product.
*
      notran = lsame( trans, 'N' )
      addax = alpha.EQ.one
*
*     In each case the first and last rows have only two terms and
*     are handled outside the interior loop; N = 1 has the diagonal
*     term alone.
*
      IF( notran ) THEN
         IF( addax ) THEN
*
*           B := B + A*X
*
            DO jc = 1, nrhs
               IF( n.NE.1 ) THEN
                  b( 1, jc ) = b( 1, jc ) + d( 1 )*x( 1, jc ) +
     $                         du( 1 )*x( 2, jc )
                  DO kr = 2, n - 1
                     b( kr, jc ) = b( kr, jc ) +
     $                             dl( kr-1 )*x( kr-1, jc ) +
     $                             d( kr )*x( kr, jc ) +
     $                             du( kr )*x( kr+1, jc )
                  END DO
                  b( n, jc ) = b( n, jc ) + dl( n-1 )*x( n-1, jc ) +
     $                         d( n )*x( n, jc )
               ELSE
                  b( 1, jc ) = b( 1, jc ) + d( 1 )*x( 1, jc )
               END IF
            END DO
         ELSE
*
*           B := B - A*X
*
            DO jc = 1, nrhs
               IF( n.NE.1 ) THEN
                  b( 1, jc ) = b( 1, jc ) - d( 1 )*x( 1, jc ) -
     $                         du( 1 )*x( 2, jc )
                  DO kr = 2, n - 1
                     b( kr, jc ) = b( kr, jc ) -
     $                             dl( kr-1 )*x( kr-1, jc ) -
     $                             d( kr )*x( kr, jc ) -
     $                             du( kr )*x( kr+1, jc )
                  END DO
                  b( n, jc ) = b( n, jc ) - dl( n-1 )*x( n-1, jc ) -
     $                         d( n )*x( n, jc )
               ELSE
                  b( 1, jc ) = b( 1, jc ) - d( 1 )*x( 1, jc )
               END IF
            END DO
         END IF
      ELSE
         IF( addax ) THEN
*
*           B := B + A**T*X
*
            DO jc = 1, nrhs
               IF( n.NE.1 ) THEN
                  b( 1, jc ) = b( 1, jc ) + d( 1 )*x( 1, jc ) +
     $                         dl( 1 )*x( 2, jc )
                  DO kr = 2, n - 1
                     b( kr, jc ) = b( kr, jc ) +
     $                             du( kr-1 )*x( kr-1, jc ) +
     $                             d( kr )*x( kr, jc ) +
     $                             dl( kr )*x( kr+1, jc )
                  END DO
                  b( n, jc ) = b( n, jc ) + du( n-1 )*x( n-1, jc ) +
     $                         d( n )*x( n, jc )
               ELSE
                  b( 1, jc ) = b( 1, jc ) + d( 1 )*x( 1, jc )
               END IF
            END DO
         ELSE
*
*           B := B - A**T*X
*
            DO jc = 1, nrhs
               IF( n.NE.1 ) THEN
                  b( 1, jc ) = b( 1, jc ) - d( 1 )*x( 1, jc ) -
     $                         dl( 1 )*x( 2, jc )
                  DO kr = 2, n - 1
                     b( kr, jc ) = b( kr, jc ) -
     $                             du( kr-1 )*x( kr-1, jc ) -
     $                             d( kr )*x( kr, jc ) -
     $                             dl( kr )*x( kr+1, jc )
                  END DO
                  b( n, jc ) = b( n, jc ) - du( n-1 )*x( n-1, jc ) -
     $                         d( n )*x( n, jc )
               ELSE
                  b( 1, jc ) = b( 1, jc ) - d( 1 )*x( 1, jc )
               END IF
            END DO
         END IF
      END IF
      RETURN
*
*     End of DLAGTM
*

◆ dlagv2()

subroutine dlagv2	(	double precision, dimension( lda, * )	a,
		integer	lda,
		double precision, dimension( ldb, * )	b,
		integer	ldb,
		double precision, dimension( 2 )	alphar,
		double precision, dimension( 2 )	alphai,
		double precision, dimension( 2 )	beta,
		double precision	csl,
		double precision	snl,
		double precision	csr,
		double precision	snr )

DLAGV2 computes the Generalized Schur factorization of a real 2-by-2 matrix pencil (A,B) where B is upper triangular.

Download DLAGV2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAGV2 computes the Generalized Schur factorization of a real 2-by-2
!> matrix pencil (A,B) where B is upper triangular. This routine
!> computes orthogonal (rotation) matrices given by CSL, SNL and CSR,
!> SNR such that
!>
!> 1) if the pencil (A,B) has two real eigenvalues (including the 0/0
!>    and 1/0 types), then
!>
!>    [ a11 a12 ] := [  CSL  SNL ] [ a11 a12 ] [  CSR -SNR ]
!>    [  0  a22 ]    [ -SNL  CSL ] [ a21 a22 ] [  SNR  CSR ]
!>
!>    [ b11 b12 ] := [  CSL  SNL ] [ b11 b12 ] [  CSR -SNR ]
!>    [  0  b22 ]    [ -SNL  CSL ] [  0  b22 ] [  SNR  CSR ],
!>
!> 2) if the pencil (A,B) has a pair of complex conjugate eigenvalues,
!>    then
!>
!>    [ a11 a12 ] := [  CSL  SNL ] [ a11 a12 ] [  CSR -SNR ]
!>    [ a21 a22 ]    [ -SNL  CSL ] [ a21 a22 ] [  SNR  CSR ]
!>
!>    [ b11  0  ] := [  CSL  SNL ] [ b11 b12 ] [  CSR -SNR ]
!>    [  0  b22 ]    [ -SNL  CSL ] [  0  b22 ] [  SNR  CSR ]
!>
!>    where b11 >= b22 > 0.
!>
!>

Parameters

[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA, 2) !> On entry, the 2 x 2 matrix A. !> On exit, A is overwritten by the ``A-part'' of the !> generalized Schur form. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= 2. !>
[in,out]	B	!> B is DOUBLE PRECISION array, dimension (LDB, 2) !> On entry, the upper triangular 2 x 2 matrix B. !> On exit, B is overwritten by the ``B-part'' of the !> generalized Schur form. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= 2. !>
[out]	ALPHAR	!> ALPHAR is DOUBLE PRECISION array, dimension (2) !>
[out]	ALPHAI	!> ALPHAI is DOUBLE PRECISION array, dimension (2) !>
[out]	BETA	!> BETA is DOUBLE PRECISION array, dimension (2) !> (ALPHAR(k)+i*ALPHAI(k))/BETA(k) are the eigenvalues of the !> pencil (A,B), k=1,2, i = sqrt(-1). Note that BETA(k) may !> be zero. !>
[out]	CSL	!> CSL is DOUBLE PRECISION !> The cosine of the left rotation matrix. !>
[out]	SNL	!> SNL is DOUBLE PRECISION !> The sine of the left rotation matrix. !>
[out]	CSR	!> CSR is DOUBLE PRECISION !> The cosine of the right rotation matrix. !>
[out]	SNR	!> SNR is DOUBLE PRECISION !> The sine of the right rotation matrix. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Mark Fahey, Department of Mathematics, Univ. of Kentucky, USA

Definition at line 155 of file dlagv2.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLAGV2: normalizes the 2-by-2 pencil (A,B), chooses one
*     of four cases (A already deflated, B(1,1) negligible, B(2,2)
*     negligible, or the general case handled through DLAG2), applies
*     the left rotation (CSL,SNL) and right rotation (CSR,SNR) to A
*     and B in place, undoes the normalization, and finally fills
*     ALPHAR, ALPHAI and BETA.
*
*     .. Scalar Arguments ..
      INTEGER            LDA, LDB
      DOUBLE PRECISION   CSL, CSR, SNL, SNR
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * ), ALPHAI( 2 ), ALPHAR( 2 ),
     $                   B( LDB, * ), BETA( 2 )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d+0, one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   ANORM, ASCALE, BNORM, BSCALE, H1, H2, H3, QQ,
     $                   R, RR, SAFMIN, SCALE1, SCALE2, T, ULP, WI, WR1,
     $                   WR2
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlag2, dlartg, dlasv2, drot
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH, DLAPY2
      EXTERNAL           dlamch, dlapy2
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max
*     ..
*     .. Executable Statements ..
*
*     Machine constants from DLAMCH.  SAFMIN is used as a floor for the
*     norms below (so the reciprocals are finite) and is passed on to
*     DLAG2; ULP is the threshold for treating an entry as negligible.
*
      safmin = dlamch( 'S' )
      ulp = dlamch( 'P' )
*
*     Scale A
*
*     ANORM is the larger of the two column absolute sums of A, but
*     never smaller than SAFMIN.  All four entries of A are scaled.
*
      anorm = max( abs( a( 1, 1 ) )+abs( a( 2, 1 ) ),
     $        abs( a( 1, 2 ) )+abs( a( 2, 2 ) ), safmin )
      ascale = one / anorm
      a( 1, 1 ) = ascale*a( 1, 1 )
      a( 1, 2 ) = ascale*a( 1, 2 )
      a( 2, 1 ) = ascale*a( 2, 1 )
      a( 2, 2 ) = ascale*a( 2, 2 )
*
*     Scale B
*
*     Only the upper triangle of B is read and scaled here; B(2,1) is
*     not referenced until it is explicitly set or rotated below.
*
      bnorm = max( abs( b( 1, 1 ) ), abs( b( 1, 2 ) )+abs( b( 2, 2 ) ),
     $        safmin )
      bscale = one / bnorm
      b( 1, 1 ) = bscale*b( 1, 1 )
      b( 1, 2 ) = bscale*b( 1, 2 )
      b( 2, 2 ) = bscale*b( 2, 2 )
*
*     Check if A can be deflated
*
*     Scaled A(2,1) is at most ULP: both rotations are the identity
*     and the subdiagonal entries are simply set to zero.
*
      IF( abs( a( 2, 1 ) ).LE.ulp ) THEN
         csl = one
         snl = zero
         csr = one
         snr = zero
         a( 2, 1 ) = zero
         b( 2, 1 ) = zero
         wi = zero
*
*     Check if B is singular
*
*     Scaled B(1,1) is at most ULP: a left rotation built from the
*     first column of A is applied to the rows of A and B; the right
*     rotation is the identity.  A(2,1), B(1,1), B(2,1) are then
*     set to exact zeros.
*
      ELSE IF( abs( b( 1, 1 ) ).LE.ulp ) THEN
         CALL dlartg( a( 1, 1 ), a( 2, 1 ), csl, snl, r )
         csr = one
         snr = zero
         CALL drot( 2, a( 1, 1 ), lda, a( 2, 1 ), lda, csl, snl )
         CALL drot( 2, b( 1, 1 ), ldb, b( 2, 1 ), ldb, csl, snl )
         a( 2, 1 ) = zero
         b( 1, 1 ) = zero
         b( 2, 1 ) = zero
         wi = zero
*
*     Scaled B(2,2) is at most ULP: a right rotation built from the
*     second row of A (with the sine negated) is applied to the
*     columns of A and B; the left rotation is the identity.
*     A(2,1), B(2,1), B(2,2) are then set to exact zeros.
*
      ELSE IF( abs( b( 2, 2 ) ).LE.ulp ) THEN
         CALL dlartg( a( 2, 2 ), a( 2, 1 ), csr, snr, t )
         snr = -snr
         CALL drot( 2, a( 1, 1 ), 1, a( 1, 2 ), 1, csr, snr )
         CALL drot( 2, b( 1, 1 ), 1, b( 1, 2 ), 1, csr, snr )
         csl = one
         snl = zero
         a( 2, 1 ) = zero
         b( 2, 1 ) = zero
         b( 2, 2 ) = zero
         wi = zero
*
      ELSE
*
*        B is nonsingular, first compute the eigenvalues of (A,B)
*
*        WI returned by DLAG2 selects between the real-eigenvalue and
*        complex-pair branches below and again when the outputs
*        ALPHAR/ALPHAI/BETA are formed.
*
         CALL dlag2( a, lda, b, ldb, safmin, scale1, scale2, wr1, wr2,
     $               wi )
*
         IF( wi.EQ.zero ) THEN
*
*           two real eigenvalues, compute s*A-w*B
*
*           H1, H2, H3 are the (1,1), (1,2), (2,2) entries of
*           SCALE1*A - WR1*B; its (2,1) entry is SCALE1*A(2,1).
*
            h1 = scale1*a( 1, 1 ) - wr1*b( 1, 1 )
            h2 = scale1*a( 1, 2 ) - wr1*b( 1, 2 )
            h3 = scale1*a( 2, 2 ) - wr1*b( 2, 2 )
*
*           RR and QQ are the lengths of the first and second rows of
*           that matrix; the longer row determines the right rotation.
*
            rr = dlapy2( h1, h2 )
            qq = dlapy2( scale1*a( 2, 1 ), h3 )
*
            IF( rr.GT.qq ) THEN
*
*              find right rotation matrix to zero 1,1 element of
*              (sA - wB)
*
               CALL dlartg( h2, h1, csr, snr, t )
*
            ELSE
*
*              find right rotation matrix to zero 2,1 element of
*              (sA - wB)
*
               CALL dlartg( h3, scale1*a( 2, 1 ), csr, snr, t )
*
            END IF
*
*           The sine from DLARTG is negated before the rotation is
*           applied to the columns of A and B.
*
            snr = -snr
            CALL drot( 2, a( 1, 1 ), 1, a( 1, 2 ), 1, csr, snr )
            CALL drot( 2, b( 1, 1 ), 1, b( 1, 2 ), 1, csr, snr )
*
*           compute inf norms of A and B
*
*           H1 and H2 are reused here for the row-sum norms of the
*           rotated A and B.
*
            h1 = max( abs( a( 1, 1 ) )+abs( a( 1, 2 ) ),
     $           abs( a( 2, 1 ) )+abs( a( 2, 2 ) ) )
            h2 = max( abs( b( 1, 1 ) )+abs( b( 1, 2 ) ),
     $           abs( b( 2, 1 ) )+abs( b( 2, 2 ) ) )
*
            IF( ( scale1*h1 ).GE.abs( wr1 )*h2 ) THEN
*
*              find left rotation matrix Q to zero out B(2,1)
*
               CALL dlartg( b( 1, 1 ), b( 2, 1 ), csl, snl, r )
*
            ELSE
*
*              find left rotation matrix Q to zero out A(2,1)
*
               CALL dlartg( a( 1, 1 ), a( 2, 1 ), csl, snl, r )
*
            END IF
*
            CALL drot( 2, a( 1, 1 ), lda, a( 2, 1 ), lda, csl, snl )
            CALL drot( 2, b( 1, 1 ), ldb, b( 2, 1 ), ldb, csl, snl )
*
*           Both subdiagonal entries are forced to exact zeros,
*           whichever of them the left rotation was built from.
*
            a( 2, 1 ) = zero
            b( 2, 1 ) = zero
*
         ELSE
*
*           a pair of complex conjugate eigenvalues
*           first compute the SVD of the matrix B
*
*           R and T receive the two leading outputs of DLASV2 and are
*           not used afterwards; only the rotation parameters are.
*
            CALL dlasv2( b( 1, 1 ), b( 1, 2 ), b( 2, 2 ), r, t, snr,
     $                   csr, snl, csl )
*
*           Form (A,B) := Q(A,B)Z**T where Q is left rotation matrix and
*           Z is right rotation matrix computed from DLASV2
*
            CALL drot( 2, a( 1, 1 ), lda, a( 2, 1 ), lda, csl, snl )
            CALL drot( 2, b( 1, 1 ), ldb, b( 2, 1 ), ldb, csl, snl )
            CALL drot( 2, a( 1, 1 ), 1, a( 1, 2 ), 1, csr, snr )
            CALL drot( 2, b( 1, 1 ), 1, b( 1, 2 ), 1, csr, snr )
*
*           The off-diagonal entries of B are set to exact zeros, so
*           B leaves this branch diagonal.
*
            b( 2, 1 ) = zero
            b( 1, 2 ) = zero
*
         END IF
*
      END IF
*
*     Unscaling
*
*     Multiply back by ANORM / BNORM to undo the normalization above.
*
      a( 1, 1 ) = anorm*a( 1, 1 )
      a( 2, 1 ) = anorm*a( 2, 1 )
      a( 1, 2 ) = anorm*a( 1, 2 )
      a( 2, 2 ) = anorm*a( 2, 2 )
      b( 1, 1 ) = bnorm*b( 1, 1 )
      b( 2, 1 ) = bnorm*b( 2, 1 )
      b( 1, 2 ) = bnorm*b( 1, 2 )
      b( 2, 2 ) = bnorm*b( 2, 2 )
*
*     Real case (WI = 0): the eigenvalue data are read off the
*     diagonals of the transformed A and B.  Complex case: the pair
*     comes from the DLAG2 outputs WR1, WI and SCALE1, rescaled by
*     ANORM/BNORM, with BETA set to one and conjugate imaginary parts.
*
      IF( wi.EQ.zero ) THEN
         alphar( 1 ) = a( 1, 1 )
         alphar( 2 ) = a( 2, 2 )
         alphai( 1 ) = zero
         alphai( 2 ) = zero
         beta( 1 ) = b( 1, 1 )
         beta( 2 ) = b( 2, 2 )
      ELSE
         alphar( 1 ) = anorm*wr1 / scale1 / bnorm
         alphai( 1 ) = anorm*wi / scale1 / bnorm
         alphar( 2 ) = alphar( 1 )
         alphai( 2 ) = -alphai( 1 )
         beta( 1 ) = one
         beta( 2 ) = one
      END IF
*
      RETURN
*
*     End of DLAGV2
*

◆ dlahqr()

subroutine dlahqr	(	logical	wantt,
		logical	wantz,
		integer	n,
		integer	ilo,
		integer	ihi,
		double precision, dimension( ldh, * )	h,
		integer	ldh,
		double precision, dimension( * )	wr,
		double precision, dimension( * )	wi,
		integer	iloz,
		integer	ihiz,
		double precision, dimension( ldz, * )	z,
		integer	ldz,
		integer	info )

DLAHQR computes the eigenvalues and Schur factorization of an upper Hessenberg matrix, using the double-shift/single-shift QR algorithm.

Download DLAHQR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!>    DLAHQR is an auxiliary routine called by DHSEQR to update the
!>    eigenvalues and Schur decomposition already computed by DHSEQR, by
!>    dealing with the Hessenberg submatrix in rows and columns ILO to
!>    IHI.
!>

Parameters

[in]	WANTT	!> WANTT is LOGICAL !> = .TRUE. : the full Schur form T is required; !> = .FALSE.: only eigenvalues are required. !>
[in]	WANTZ	!> WANTZ is LOGICAL !> = .TRUE. : the matrix of Schur vectors Z is required; !> = .FALSE.: Schur vectors are not required. !>
[in]	N	!> N is INTEGER !> The order of the matrix H. N >= 0. !>
[in]	ILO	!> ILO is INTEGER !>
[in]	IHI	!> IHI is INTEGER !> It is assumed that H is already upper quasi-triangular in !> rows and columns IHI+1:N, and that H(ILO,ILO-1) = 0 (unless !> ILO = 1). DLAHQR works primarily with the Hessenberg !> submatrix in rows and columns ILO to IHI, but applies !> transformations to all of H if WANTT is .TRUE.. !> 1 <= ILO <= max(1,IHI); IHI <= N. !>
[in,out]	H	!> H is DOUBLE PRECISION array, dimension (LDH,N) !> On entry, the upper Hessenberg matrix H. !> On exit, if INFO is zero and if WANTT is .TRUE., H is upper !> quasi-triangular in rows and columns ILO:IHI, with any !> 2-by-2 diagonal blocks in standard form. If INFO is zero !> and WANTT is .FALSE., the contents of H are unspecified on !> exit. The output state of H if INFO is nonzero is given !> below under the description of INFO. !>
[in]	LDH	!> LDH is INTEGER !> The leading dimension of the array H. LDH >= max(1,N). !>
[out]	WR	!> WR is DOUBLE PRECISION array, dimension (N) !>
[out]	WI	!> WI is DOUBLE PRECISION array, dimension (N) !> The real and imaginary parts, respectively, of the computed !> eigenvalues ILO to IHI are stored in the corresponding !> elements of WR and WI. If two eigenvalues are computed as a !> complex conjugate pair, they are stored in consecutive !> elements of WR and WI, say the i-th and (i+1)th, with !> WI(i) > 0 and WI(i+1) < 0. If WANTT is .TRUE., the !> eigenvalues are stored in the same order as on the diagonal !> of the Schur form returned in H, with WR(i) = H(i,i), and, if !> H(i:i+1,i:i+1) is a 2-by-2 diagonal block, !> WI(i) = sqrt(-H(i+1,i)*H(i,i+1)) and WI(i+1) = -WI(i). !>
[in]	ILOZ	!> ILOZ is INTEGER !>
[in]	IHIZ	!> IHIZ is INTEGER !> Specify the rows of Z to which transformations must be !> applied if WANTZ is .TRUE.. !> 1 <= ILOZ <= ILO; IHI <= IHIZ <= N. !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, dimension (LDZ,N) !> If WANTZ is .TRUE., on entry Z must contain the current !> matrix Z of transformations accumulated by DHSEQR, and on !> exit Z has been updated; transformations are applied only to !> the submatrix Z(ILOZ:IHIZ,ILO:IHI). !> If WANTZ is .FALSE., Z is not referenced. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. LDZ >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> > 0: If INFO = i, DLAHQR failed to compute all the !> eigenvalues ILO to IHI in a total of 30 iterations !> per eigenvalue; elements i+1:ihi of WR and WI !> contain those eigenvalues which have been !> successfully computed. !> !> If INFO > 0 and WANTT is .FALSE., then on exit, !> the remaining unconverged eigenvalues are the !> eigenvalues of the upper Hessenberg matrix rows !> and columns ILO through INFO of the final, output !> value of H. !> !> If INFO > 0 and WANTT is .TRUE., then on exit !> (*) (initial value of H)U = U(final value of H) !> where U is an orthogonal matrix. The final !> value of H is upper Hessenberg and triangular in !> rows and columns INFO+1 through IHI. !> !> If INFO > 0 and WANTZ is .TRUE., then on exit !> (final value of Z) = (initial value of Z)U !> where U is the orthogonal matrix in (*) !> (regardless of the value of WANTT.) !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>     02-96 Based on modifications by
!>     David Day, Sandia National Laboratory, USA
!>
!>     12-04 Further modifications by
!>     Ralph Byers, University of Kansas, USA
!>     This is a modified version of DLAHQR from LAPACK version 3.0.
!>     It is (1) more robust against overflow and underflow and
!>     (2) adopts the more conservative Ahues & Tisseur stopping
!>     criterion (LAWN 122, 1997).
!>

Definition at line 205 of file dlahqr.f.

      IMPLICIT NONE
*
*     Body of DLAHQR: repeatedly applies shifted QR steps to the
*     active Hessenberg block of H (rows and columns L..I inside
*     ILO..IHI), splitting off 1-by-1 or 2-by-2 blocks at the bottom
*     and storing their eigenvalues in WR and WI.  When WANTT is true
*     the transformations are applied to all of H; when WANTZ is true
*     they are accumulated in rows ILOZ..IHIZ of Z.  INFO is 0 on
*     normal completion, or the current bottom index I when the inner
*     iteration loop is exhausted without a split.
*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            IHI, IHIZ, ILO, ILOZ, INFO, LDH, LDZ, N
      LOGICAL            WANTT, WANTZ
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   H( LDH, * ), WI( * ), WR( * ), Z( LDZ, * )
*     ..
*
*  =========================================================
*
*     .. Parameters ..
*     DAT1 and DAT2 are the coefficients of the exceptional shifts;
*     KEXSH is the period (in iterations without deflation) at which
*     an exceptional shift is tried.
      DOUBLE PRECISION   ZERO, ONE, TWO
      parameter( zero = 0.0d0, one = 1.0d0, two = 2.0d0 )
      DOUBLE PRECISION   DAT1, DAT2
      parameter( dat1 = 3.0d0 / 4.0d0, dat2 = -0.4375d0 )
      INTEGER            KEXSH
      parameter( kexsh = 10 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   AA, AB, BA, BB, CS, DET, H11, H12, H21, H21S,
     $                   H22, RT1I, RT1R, RT2I, RT2R, RTDISC, S, SAFMAX,
     $                   SAFMIN, SMLNUM, SN, SUM, T1, T2, T3, TR, TST,
     $                   ULP, V2, V3
      INTEGER            I, I1, I2, ITS, ITMAX, J, K, L, M, NH, NR, NZ,
     $                   KDEFL 
*     ..
*     .. Local Arrays ..
      DOUBLE PRECISION   V( 3 )
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           dlamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dlabad, dlanv2, dlarfg, drot
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, dble, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
      info = 0
*
*     Quick return if possible
*
*     A 1-by-1 active block needs no iteration: its eigenvalue is
*     the diagonal entry itself.
*
      IF( n.EQ.0 )
     $   RETURN
      IF( ilo.EQ.ihi ) THEN
         wr( ilo ) = h( ilo, ilo )
         wi( ilo ) = zero
         RETURN
      END IF
*
*     ==== clear out the trash ====
*     Zero the entries two and three rows below the diagonal in
*     columns ILO..IHI-3, and the entry H(IHI,IHI-2), so the active
*     block is exactly upper Hessenberg before iterating.
      DO 10 j = ilo, ihi - 3
         h( j+2, j ) = zero
         h( j+3, j ) = zero
   10 CONTINUE
      IF( ilo.LE.ihi-2 )
     $   h( ihi, ihi-2 ) = zero
*
*     NH is the order of the active block, NZ the number of rows of Z
*     that are updated.
*
      nh = ihi - ilo + 1
      nz = ihiz - iloz + 1
*
*     Set machine-dependent constants for the stopping criterion.
*
      safmin = dlamch( 'SAFE MINIMUM' )
      safmax = one / safmin
      CALL dlabad( safmin, safmax )
      ulp = dlamch( 'PRECISION' )
      smlnum = safmin*( dble( nh ) / ulp )
*
*     I1 and I2 are the indices of the first row and last column of H
*     to which transformations must be applied. If eigenvalues only are
*     being computed, I1 and I2 are set inside the main loop.
*
      IF( wantt ) THEN
         i1 = 1
         i2 = n
      END IF
*
*     ITMAX is the total number of QR iterations allowed.
*
      itmax = 30 * max( 10, nh )
*
*     KDEFL counts the number of iterations since a deflation
*
      kdefl = 0
*
*     The main loop begins here. I is the loop index and decreases from
*     IHI to ILO in steps of 1 or 2. Each iteration of the loop works
*     with the active submatrix in rows and columns L to I.
*     Eigenvalues I+1 to IHI have already converged. Either L = ILO or
*     H(L,L-1) is negligible so that the matrix splits.
*
*     Label 20 is the top of the main loop; label 160 is the normal
*     exit, reached once I has dropped below ILO.
*
      i = ihi
   20 CONTINUE
      l = ilo
      IF( i.LT.ilo )
     $   GO TO 160
*
*     Perform QR iterations on rows and columns ILO to I until a
*     submatrix of order 1 or 2 splits off at the bottom because a
*     subdiagonal element has become negligible.
*
      DO 140 its = 0, itmax
*
*        Look for a single small subdiagonal element.
*
*        The scan runs upward from row I.  On a jump to label 40, K is
*        the row whose subdiagonal entry H(K,K-1) was found
*        negligible; if the loop finishes without a jump, K equals L.
*
         DO 30 k = i, l + 1, -1
            IF( abs( h( k, k-1 ) ).LE.smlnum )
     $         GO TO 40
            tst = abs( h( k-1, k-1 ) ) + abs( h( k, k ) )
            IF( tst.EQ.zero ) THEN
               IF( k-2.GE.ilo )
     $            tst = tst + abs( h( k-1, k-2 ) )
               IF( k+1.LE.ihi )
     $            tst = tst + abs( h( k+1, k ) )
            END IF
*           ==== The following is a conservative small subdiagonal
*           .    deflation  criterion due to Ahues & Tisseur (LAWN 122,
*           .    1997). It has better mathematical foundation and
*           .    improves accuracy in some cases.  ====
            IF( abs( h( k, k-1 ) ).LE.ulp*tst ) THEN
               ab = max( abs( h( k, k-1 ) ), abs( h( k-1, k ) ) )
               ba = min( abs( h( k, k-1 ) ), abs( h( k-1, k ) ) )
               aa = max( abs( h( k, k ) ),
     $              abs( h( k-1, k-1 )-h( k, k ) ) )
               bb = min( abs( h( k, k ) ),
     $              abs( h( k-1, k-1 )-h( k, k ) ) )
               s = aa + ab
               IF( ba*( ab / s ).LE.max( smlnum,
     $             ulp*( bb*( aa / s ) ) ) )GO TO 40
            END IF
   30    CONTINUE
   40    CONTINUE
         l = k
         IF( l.GT.ilo ) THEN
*
*           H(L,L-1) is negligible
*
            h( l, l-1 ) = zero
         END IF
*
*        Exit from loop if a submatrix of order 1 or 2 has split off.
*
         IF( l.GE.i-1 )
     $      GO TO 150
         kdefl = kdefl + 1
*
*        Now the active submatrix is in rows and columns L to I. If
*        eigenvalues only are being computed, only the active submatrix
*        need be transformed.
*
         IF( .NOT.wantt ) THEN
            i1 = l
            i2 = i
         END IF
*
*        Shift selection.  Every 2*KEXSH-th iteration without a
*        deflation uses an exceptional shift built from the bottom of
*        the active block; every other KEXSH-th iteration uses one
*        built from the top; otherwise the trailing 2-by-2 block of
*        the active submatrix supplies the shifts.
*
         IF( mod(kdefl,2*kexsh).EQ.0 ) THEN
*
*           Exceptional shift.
*
            s = abs( h( i, i-1 ) ) + abs( h( i-1, i-2 ) )
            h11 = dat1*s + h( i, i )
            h12 = dat2*s
            h21 = s
            h22 = h11
         ELSE IF( mod(kdefl,kexsh).EQ.0 ) THEN
*
*           Exceptional shift.
*
            s = abs( h( l+1, l ) ) + abs( h( l+2, l+1 ) )
            h11 = dat1*s + h( l, l )
            h12 = dat2*s
            h21 = s
            h22 = h11
         ELSE
*
*           Prepare to use Francis' double shift
*           (i.e. 2nd degree generalized Rayleigh quotient)
*
            h11 = h( i-1, i-1 )
            h21 = h( i, i-1 )
            h12 = h( i-1, i )
            h22 = h( i, i )
         END IF
*
*        Compute the two shifts (RT1R,RT1I) and (RT2R,RT2I) as the
*        eigenvalues of the 2-by-2 matrix [H11 H12; H21 H22], after
*        dividing it by S (the sum of absolute values of its entries).
*        An all-zero matrix gives zero shifts.
*
         s = abs( h11 ) + abs( h12 ) + abs( h21 ) + abs( h22 )
         IF( s.EQ.zero ) THEN
            rt1r = zero
            rt1i = zero
            rt2r = zero
            rt2i = zero
         ELSE
            h11 = h11 / s
            h21 = h21 / s
            h12 = h12 / s
            h22 = h22 / s
            tr = ( h11+h22 ) / two
            det = ( h11-tr )*( h22-tr ) - h12*h21
            rtdisc = sqrt( abs( det ) )
            IF( det.GE.zero ) THEN
*
*              ==== complex conjugate shifts ====
*
               rt1r = tr*s
               rt2r = rt1r
               rt1i = rtdisc*s
               rt2i = -rt1i
            ELSE
*
*              ==== real shifts (use only one of them)  ====
*
*              The root closer to the scaled H22 is kept and used for
*              both shifts.
*
               rt1r = tr + rtdisc
               rt2r = tr - rtdisc
               IF( abs( rt1r-h22 ).LE.abs( rt2r-h22 ) ) THEN
                  rt1r = rt1r*s
                  rt2r = rt1r
               ELSE
                  rt2r = rt2r*s
                  rt1r = rt2r
               END IF
               rt1i = zero
               rt2i = zero
            END IF
         END IF
*
*        Look for two consecutive small subdiagonal elements.
*
*        The scan always leaves through a jump to label 60 (at the
*        latest when M reaches L), with V holding the scaled starting
*        vector for row M.
*
         DO 50 m = i - 2, l, -1
*           Determine the effect of starting the double-shift QR
*           iteration at row M, and see if this would make H(M,M-1)
*           negligible.  (The following uses scaling to avoid
*           overflows and most underflows.)
*
            h21s = h( m+1, m )
            s = abs( h( m, m )-rt2r ) + abs( rt2i ) + abs( h21s )
            h21s = h( m+1, m ) / s
            v( 1 ) = h21s*h( m, m+1 ) + ( h( m, m )-rt1r )*
     $               ( ( h( m, m )-rt2r ) / s ) - rt1i*( rt2i / s )
            v( 2 ) = h21s*( h( m, m )+h( m+1, m+1 )-rt1r-rt2r )
            v( 3 ) = h21s*h( m+2, m+1 )
            s = abs( v( 1 ) ) + abs( v( 2 ) ) + abs( v( 3 ) )
            v( 1 ) = v( 1 ) / s
            v( 2 ) = v( 2 ) / s
            v( 3 ) = v( 3 ) / s
            IF( m.EQ.l )
     $         GO TO 60
            IF( abs( h( m, m-1 ) )*( abs( v( 2 ) )+abs( v( 3 ) ) ).LE.
     $          ulp*abs( v( 1 ) )*( abs( h( m-1, m-1 ) )+abs( h( m,
     $          m ) )+abs( h( m+1, m+1 ) ) ) )GO TO 60
   50    CONTINUE
   60    CONTINUE
*
*        Double-shift QR step
*
         DO 130 k = m, i - 1
*
*           The first iteration of this loop determines a reflection G
*           from the vector V and applies it from left and right to H,
*           thus creating a nonzero bulge below the subdiagonal.
*
*           Each subsequent iteration determines a reflection G to
*           restore the Hessenberg form in the (K-1)th column, and thus
*           chases the bulge one step toward the bottom of the active
*           submatrix. NR is the order of G.
*
            nr = min( 3, i-k+1 )
            IF( k.GT.m )
     $         CALL dcopy( nr, h( k, k-1 ), 1, v, 1 )
            CALL dlarfg( nr, v( 1 ), v( 2 ), 1, t1 )
            IF( k.GT.m ) THEN
               h( k, k-1 ) = v( 1 )
               h( k+1, k-1 ) = zero
               IF( k.LT.i-1 )
     $            h( k+2, k-1 ) = zero
            ELSE IF( m.GT.l ) THEN
*               ==== Use the following instead of
*               .    H( K, K-1 ) = -H( K, K-1 ) to
*               .    avoid a bug when v(2) and v(3)
*               .    underflow. ====
               h( k, k-1 ) = h( k, k-1 )*( one-t1 )
            END IF
*
*           T2 (and T3 below) are the products T1*V2 and T1*V3,
*           formed once here and reused in every update loop.
*
            v2 = v( 2 )
            t2 = t1*v2
            IF( nr.EQ.3 ) THEN
               v3 = v( 3 )
               t3 = t1*v3
*
*              Apply G from the left to transform the rows of the matrix
*              in columns K to I2.
*
               DO 70 j = k, i2
                  sum = h( k, j ) + v2*h( k+1, j ) + v3*h( k+2, j )
                  h( k, j ) = h( k, j ) - sum*t1
                  h( k+1, j ) = h( k+1, j ) - sum*t2
                  h( k+2, j ) = h( k+2, j ) - sum*t3
   70          CONTINUE
*
*              Apply G from the right to transform the columns of the
*              matrix in rows I1 to min(K+3,I).
*
               DO 80 j = i1, min( k+3, i )
                  sum = h( j, k ) + v2*h( j, k+1 ) + v3*h( j, k+2 )
                  h( j, k ) = h( j, k ) - sum*t1
                  h( j, k+1 ) = h( j, k+1 ) - sum*t2
                  h( j, k+2 ) = h( j, k+2 ) - sum*t3
   80          CONTINUE
*
               IF( wantz ) THEN
*
*                 Accumulate transformations in the matrix Z
*
                  DO 90 j = iloz, ihiz
                     sum = z( j, k ) + v2*z( j, k+1 ) + v3*z( j, k+2 )
                     z( j, k ) = z( j, k ) - sum*t1
                     z( j, k+1 ) = z( j, k+1 ) - sum*t2
                     z( j, k+2 ) = z( j, k+2 ) - sum*t3
   90             CONTINUE
               END IF
            ELSE IF( nr.EQ.2 ) THEN
*
*              Apply G from the left to transform the rows of the matrix
*              in columns K to I2.
*
               DO 100 j = k, i2
                  sum = h( k, j ) + v2*h( k+1, j )
                  h( k, j ) = h( k, j ) - sum*t1
                  h( k+1, j ) = h( k+1, j ) - sum*t2
  100          CONTINUE
*
*              Apply G from the right to transform the columns of the
*              matrix in rows I1 to min(K+3,I).
*
*              (NR = 2 only occurs for K = I-1, so the upper row bound
*              here is simply I.)
*
               DO 110 j = i1, i
                  sum = h( j, k ) + v2*h( j, k+1 )
                  h( j, k ) = h( j, k ) - sum*t1
                  h( j, k+1 ) = h( j, k+1 ) - sum*t2
  110          CONTINUE
*
               IF( wantz ) THEN
*
*                 Accumulate transformations in the matrix Z
*
                  DO 120 j = iloz, ihiz
                     sum = z( j, k ) + v2*z( j, k+1 )
                     z( j, k ) = z( j, k ) - sum*t1
                     z( j, k+1 ) = z( j, k+1 ) - sum*t2
  120             CONTINUE
               END IF
            END IF
  130    CONTINUE
*
  140 CONTINUE
*
*     Failure to converge in remaining number of iterations
*
*     INFO reports the bottom row I of the block that did not split.
*
      info = i
      RETURN
*
*     Label 150: a block of order 1 (L = I) or 2 (L = I-1) has split
*     off at the bottom of the active submatrix.
*
  150 CONTINUE
*
      IF( l.EQ.i ) THEN
*
*        H(I,I-1) is negligible: one eigenvalue has converged.
*
         wr( i ) = h( i, i )
         wi( i ) = zero
      ELSE IF( l.EQ.i-1 ) THEN
*
*        H(I-1,I-2) is negligible: a pair of eigenvalues have converged.
*
*        Transform the 2-by-2 submatrix to standard Schur form,
*        and compute and store the eigenvalues.
*
         CALL dlanv2( h( i-1, i-1 ), h( i-1, i ), h( i, i-1 ),
     $                h( i, i ), wr( i-1 ), wi( i-1 ), wr( i ), wi( i ),
     $                cs, sn )
*
         IF( wantt ) THEN
*
*           Apply the transformation to the rest of H.
*
*           First call: rows I-1 and I in columns I+1..I2.
*           Second call: columns I-1 and I in rows I1..I-2.
*
            IF( i2.GT.i )
     $         CALL drot( i2-i, h( i-1, i+1 ), ldh, h( i, i+1 ), ldh,
     $                    cs, sn )
            CALL drot( i-i1-1, h( i1, i-1 ), 1, h( i1, i ), 1, cs, sn )
         END IF
         IF( wantz ) THEN
*
*           Apply the transformation to Z.
*
            CALL drot( nz, z( iloz, i-1 ), 1, z( iloz, i ), 1, cs, sn )
         END IF
      END IF
*     reset deflation counter
      kdefl = 0
*
*     return to start of the main loop with new value of I.
*
      i = l - 1
      GO TO 20
*
  160 CONTINUE
      RETURN
*
*     End of DLAHQR
*

◆ dlahr2()

subroutine dlahr2	(	integer	n,
		integer	k,
		integer	nb,
		double precision, dimension( lda, * )	a,
		integer	lda,
		double precision, dimension( nb )	tau,
		double precision, dimension( ldt, nb )	t,
		integer	ldt,
		double precision, dimension( ldy, nb )	y,
		integer	ldy )

DLAHR2 reduces the specified number of first columns of a general rectangular matrix A so that elements below the specified subdiagonal are zero, and returns auxiliary matrices which are needed to apply the transformation to the unreduced part of A.

Download DLAHR2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAHR2 reduces the first NB columns of a real general n-by-(n-k+1)
!> matrix A so that elements below the k-th subdiagonal are zero. The
!> reduction is performed by an orthogonal similarity transformation
!> Q**T * A * Q. The routine returns the matrices V and T which determine
!> Q as a block reflector I - V*T*V**T, and also the matrix Y = A * V * T.
!>
!> This is an auxiliary routine called by DGEHRD.
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the matrix A. !>
[in]	K	!> K is INTEGER !> The offset for the reduction. Elements below the k-th !> subdiagonal in the first NB columns are reduced to zero. !> K < N. !>
[in]	NB	!> NB is INTEGER !> The number of columns to be reduced. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N-K+1) !> On entry, the n-by-(n-k+1) general matrix A. !> On exit, the elements on and above the k-th subdiagonal in !> the first NB columns are overwritten with the corresponding !> elements of the reduced matrix; the elements below the k-th !> subdiagonal, with the array TAU, represent the matrix Q as a !> product of elementary reflectors. The other columns of A are !> unchanged. See Further Details. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	TAU	!> TAU is DOUBLE PRECISION array, dimension (NB) !> The scalar factors of the elementary reflectors. See Further !> Details. !>
[out]	T	!> T is DOUBLE PRECISION array, dimension (LDT,NB) !> The upper triangular matrix T. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= NB. !>
[out]	Y	!> Y is DOUBLE PRECISION array, dimension (LDY,NB) !> The n-by-nb matrix Y. !>
[in]	LDY	!> LDY is INTEGER !> The leading dimension of the array Y. LDY >= N. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The matrix Q is represented as a product of nb elementary reflectors
!>
!>     Q = H(1) H(2) . . . H(nb).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - tau * v * v**T
!>
!>  where tau is a real scalar, and v is a real vector with
!>  v(1:i+k-1) = 0, v(i+k) = 1; v(i+k+1:n) is stored on exit in
!>  A(i+k+1:n,i), and tau in TAU(i).
!>
!>  The elements of the vectors v together form the (n-k+1)-by-nb matrix
!>  V which is needed, with T and Y, to apply the transformation to the
!>  unreduced part of the matrix, using an update of the form:
!>  A := (I - V*T*V**T) * (A - Y*V**T).
!>
!>  The contents of A on exit are illustrated by the following example
!>  with n = 7, k = 3 and nb = 2:
!>
!>     ( a   a   a   a   a )
!>     ( a   a   a   a   a )
!>     ( a   a   a   a   a )
!>     ( h   h   a   a   a )
!>     ( v1  h   a   a   a )
!>     ( v1  v2  a   a   a )
!>     ( v1  v2  a   a   a )
!>
!>  where a denotes an element of the original matrix A, h denotes a
!>  modified element of the upper Hessenberg matrix H, and vi denotes an
!>  element of the vector defining H(i).
!>
!>  This subroutine is a slight modification of LAPACK-3.0's DLAHRD
!>  incorporating improvements proposed by Quintana-Orti and Van de
!>  Geijn. Note that the entries of A(1:K,2:NB) differ from those
!>  returned by the original LAPACK-3.0's DLAHRD routine. (This
!>  subroutine is not backward compatible with LAPACK-3.0's DLAHRD.)
!>

References: Gregorio Quintana-Orti and Robert van de Geijn, "Improving the performance of reduction to Hessenberg form," ACM Transactions on Mathematical Software, 32(2):180-194, June 2006.

Definition at line 180 of file dlahr2.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of DLAHR2.  For I = 1, ..., NB the loop
*    (1) brings column I of A up to date with the reflectors that
*        have already been generated (skipped for I = 1),
*    (2) generates the elementary reflector H(I) that annihilates
*        A(K+I+1:N,I),
*    (3) appends one column to Y(K+1:N,:) and one column to T.
*  After the loop the top block Y(1:K,1:NB) is formed.
*
*  Arguments:
*    N, K, NB  order of A, reduction offset, number of columns
*    A, LDA    matrix (updated in place) and its leading dimension
*    TAU       receives the NB reflector scalars
*    T, LDT    receives the upper triangular factor T; the last
*              column T(1:I-1,NB) doubles as workspace in step (1)
*    Y, LDY    receives the matrix Y
*
*     .. Scalar Arguments ..
      INTEGER            K, LDA, LDT, LDY, N, NB
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION  A( LDA, * ), T( LDT, NB ), TAU( NB ),
     $                   Y( LDY, NB )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION  ZERO, ONE
      parameter( zero = 0.0d+0,
     $                     one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            I
      DOUBLE PRECISION  EI
*     ..
*     .. External Subroutines ..
      EXTERNAL           daxpy, dcopy, dgemm, dgemv, dlacpy,
     $                   dlarfg, dscal, dtrmm, dtrmv
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          min
*     ..
*     .. Executable Statements ..
*
*     Quick return if possible.
*
*     NB <= 0 is included: the loop below would not execute, so EI
*     would never be defined, and the store A( K+NB, NB ) = EI that
*     follows the loop would write that undefined value to a column
*     index NB < 1, i.e. outside A.
*
      IF( n.LE.1 .OR. nb.LE.0 )
     $   RETURN
*
      DO 10 i = 1, nb
         IF( i.GT.1 ) THEN
*
*           Update A(K+1:N,I)
*
*           Update I-th column of A - Y * V**T
*
            CALL dgemv( 'NO TRANSPOSE', n-k, i-1, -one, y(k+1,1), ldy,
     $                  a( k+i-1, 1 ), lda, one, a( k+1, i ), 1 )
*
*           Apply I - V * T**T * V**T to this column (call it b) from the
*           left, using the last column of T as workspace
*
*           Let  V = ( V1 )   and   b = ( b1 )   (first I-1 rows)
*                    ( V2 )             ( b2 )
*
*           where V1 is unit lower triangular
*
*           w := V1**T * b1
*
            CALL dcopy( i-1, a( k+1, i ), 1, t( 1, nb ), 1 )
            CALL dtrmv( 'Lower', 'Transpose', 'UNIT',
     $                  i-1, a( k+1, 1 ),
     $                  lda, t( 1, nb ), 1 )
*
*           w := w + V2**T * b2
*
            CALL dgemv( 'Transpose', n-k-i+1, i-1,
     $                  one, a( k+i, 1 ),
     $                  lda, a( k+i, i ), 1, one, t( 1, nb ), 1 )
*
*           w := T**T * w
*
            CALL dtrmv( 'Upper', 'Transpose', 'NON-UNIT',
     $                  i-1, t, ldt,
     $                  t( 1, nb ), 1 )
*
*           b2 := b2 - V2*w
*
            CALL dgemv( 'NO TRANSPOSE', n-k-i+1, i-1, -one,
     $                  a( k+i, 1 ),
     $                  lda, t( 1, nb ), 1, one, a( k+i, i ), 1 )
*
*           b1 := b1 - V1*w
*
            CALL dtrmv( 'Lower', 'NO TRANSPOSE',
     $                  'UNIT', i-1,
     $                  a( k+1, 1 ), lda, t( 1, nb ), 1 )
            CALL daxpy( i-1, -one, t( 1, nb ), 1, a( k+1, i ), 1 )
*
*           Put back the entry of the previous column that was
*           replaced by ONE when H(I-1) was generated.
*
            a( k+i-1, i-1 ) = ei
         END IF
*
*        Generate the elementary reflector H(I) to annihilate
*        A(K+I+1:N,I)
*
         CALL dlarfg( n-k-i+1, a( k+i, i ), a( min( k+i+1, n ), i ), 1,
     $                tau( i ) )
*
*        Save the entry left at A(K+I,I) in EI and overwrite it with
*        ONE, so that A(K+I:N,I) holds the reflector vector with its
*        unit leading element for the products below.
*
         ei = a( k+i, i )
         a( k+i, i ) = one
*
*        Compute  Y(K+1:N,I)
*
*        Y(K+1:N,I) := A(K+1:N,I+1:N-K+1) * v
*
         CALL dgemv( 'NO TRANSPOSE', n-k, n-k-i+1,
     $               one, a( k+1, i+1 ),
     $               lda, a( k+i, i ), 1, zero, y( k+1, i ), 1 )
*
*        T(1:I-1,I) := V2**T * v   (also reused for T below)
*
         CALL dgemv( 'Transpose', n-k-i+1, i-1,
     $               one, a( k+i, 1 ), lda,
     $               a( k+i, i ), 1, zero, t( 1, i ), 1 )
*
*        Y(K+1:N,I) := tau * ( Y(K+1:N,I) - Y(K+1:N,1:I-1)*T(1:I-1,I) )
*
         CALL dgemv( 'NO TRANSPOSE', n-k, i-1, -one,
     $               y( k+1, 1 ), ldy,
     $               t( 1, i ), 1, one, y( k+1, i ), 1 )
         CALL dscal( n-k, tau( i ), y( k+1, i ), 1 )
*
*        Compute T(1:I,I)
*
*        T(1:I-1,I) := -tau * T(1:I-1,1:I-1) * T(1:I-1,I),  T(I,I) := tau
*
         CALL dscal( i-1, -tau( i ), t( 1, i ), 1 )
         CALL dtrmv( 'Upper', 'No Transpose', 'NON-UNIT',
     $               i-1, t, ldt,
     $               t( 1, i ), 1 )
         t( i, i ) = tau( i )
*
   10 CONTINUE
*
*     Put back the entry of column NB that was replaced by ONE.
*
      a( k+nb, nb ) = ei
*
*     Compute Y(1:K,1:NB)
*
*     Y(1:K,1:NB) := A(1:K,2:NB+1) * V1, with V1 unit lower triangular
*
      CALL dlacpy( 'ALL', k, nb, a( 1, 2 ), lda, y, ldy )
      CALL dtrmm( 'RIGHT', 'Lower', 'NO TRANSPOSE',
     $            'UNIT', k, nb,
     $            one, a( k+1, 1 ), lda, y, ldy )
*
*     Add the contribution of the rows of V below V1, if there are any
*
      IF( n.GT.k+nb )
     $   CALL dgemm( 'NO TRANSPOSE', 'NO TRANSPOSE', k,
     $               nb, n-k-nb, one,
     $               a( 1, 2+nb ), lda, a( k+1+nb, 1 ), lda, one, y,
     $               ldy )
*
*     Y(1:K,1:NB) := Y(1:K,1:NB) * T
*
      CALL dtrmm( 'RIGHT', 'Upper', 'NO TRANSPOSE',
     $            'NON-UNIT', k, nb,
     $            one, t, ldt, y, ldy )
*
      RETURN
*
*     End of DLAHR2
*

◆ dlahrd()

subroutine dlahrd	(	integer	n,
		integer	k,
		integer	nb,
		double precision, dimension( lda, * )	a,
		integer	lda,
		double precision, dimension( nb )	tau,
		double precision, dimension( ldt, nb )	t,
		integer	ldt,
		double precision, dimension( ldy, nb )	y,
		integer	ldy )

DLAHRD reduces the first nb columns of a general rectangular matrix A so that elements below the k-th subdiagonal are zero, and returns auxiliary matrices which are needed to apply the transformation to the unreduced part of A.

Download DLAHRD + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> This routine is deprecated and has been replaced by routine DLAHR2.
!>
!> DLAHRD reduces the first NB columns of a real general n-by-(n-k+1)
!> matrix A so that elements below the k-th subdiagonal are zero. The
!> reduction is performed by an orthogonal similarity transformation
!> Q**T * A * Q. The routine returns the matrices V and T which determine
!> Q as a block reflector I - V*T*V**T, and also the matrix Y = A * V * T.
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the matrix A. !>
[in]	K	!> K is INTEGER !> The offset for the reduction. Elements below the k-th !> subdiagonal in the first NB columns are reduced to zero. !>
[in]	NB	!> NB is INTEGER !> The number of columns to be reduced. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N-K+1) !> On entry, the n-by-(n-k+1) general matrix A. !> On exit, the elements on and above the k-th subdiagonal in !> the first NB columns are overwritten with the corresponding !> elements of the reduced matrix; the elements below the k-th !> subdiagonal, with the array TAU, represent the matrix Q as a !> product of elementary reflectors. The other columns of A are !> unchanged. See Further Details. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	TAU	!> TAU is DOUBLE PRECISION array, dimension (NB) !> The scalar factors of the elementary reflectors. See Further !> Details. !>
[out]	T	!> T is DOUBLE PRECISION array, dimension (LDT,NB) !> The upper triangular matrix T. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= NB. !>
[out]	Y	!> Y is DOUBLE PRECISION array, dimension (LDY,NB) !> The n-by-nb matrix Y. !>
[in]	LDY	!> LDY is INTEGER !> The leading dimension of the array Y. LDY >= N. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The matrix Q is represented as a product of nb elementary reflectors
!>
!>     Q = H(1) H(2) . . . H(nb).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - tau * v * v**T
!>
!>  where tau is a real scalar, and v is a real vector with
!>  v(1:i+k-1) = 0, v(i+k) = 1; v(i+k+1:n) is stored on exit in
!>  A(i+k+1:n,i), and tau in TAU(i).
!>
!>  The elements of the vectors v together form the (n-k+1)-by-nb matrix
!>  V which is needed, with T and Y, to apply the transformation to the
!>  unreduced part of the matrix, using an update of the form:
!>  A := (I - V*T*V**T) * (A - Y*V**T).
!>
!>  The contents of A on exit are illustrated by the following example
!>  with n = 7, k = 3 and nb = 2:
!>
!>     ( a   h   a   a   a )
!>     ( a   h   a   a   a )
!>     ( a   h   a   a   a )
!>     ( h   h   a   a   a )
!>     ( v1  h   a   a   a )
!>     ( v1  v2  a   a   a )
!>     ( v1  v2  a   a   a )
!>
!>  where a denotes an element of the original matrix A, h denotes a
!>  modified element of the upper Hessenberg matrix H, and vi denotes an
!>  element of the vector defining H(i).
!>

Definition at line 166 of file dlahrd.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of DLAHRD.  For i = 1, ..., NB the loop
*    (1) brings the whole column A(1:n,i) up to date with the
*        reflectors that have already been generated (skipped for
*        i = 1),
*    (2) generates the elementary reflector H(i) that annihilates
*        A(k+i+1:n,i),
*    (3) appends one column to Y(1:n,:) and one column to T.
*
*  Arguments:
*    N, K, NB  order of A, reduction offset, number of columns
*    A, LDA    matrix (updated in place) and its leading dimension
*    TAU       receives the NB reflector scalars
*    T, LDT    receives the upper triangular factor T; the last
*              column T(1:i-1,NB) doubles as workspace in step (1)
*    Y, LDY    receives the n-by-nb matrix Y
*
*     .. Scalar Arguments ..
      INTEGER            K, LDA, LDT, LDY, N, NB
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * ), T( LDT, NB ), TAU( NB ),
     $                   Y( LDY, NB )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d+0, one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            I
      DOUBLE PRECISION   EI
*     ..
*     .. External Subroutines ..
      EXTERNAL           daxpy, dcopy, dgemv, dlarfg, dscal, dtrmv
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          min
*     ..
*     .. Executable Statements ..
*
*     Quick return if possible.
*
*     NB <= 0 is included: the loop below would not execute, so EI
*     would never be defined, and the store A( K+NB, NB ) = EI that
*     follows the loop would write that undefined value to a column
*     index NB < 1, i.e. outside A.
*
      IF( n.LE.1 .OR. nb.LE.0 )
     $   RETURN
*
      DO 10 i = 1, nb
         IF( i.GT.1 ) THEN
*
*           Update A(1:n,i)
*
*           Compute i-th column of A - Y * V**T
*
            CALL dgemv( 'No transpose', n, i-1, -one, y, ldy,
     $                  a( k+i-1, 1 ), lda, one, a( 1, i ), 1 )
*
*           Apply I - V * T**T * V**T to this column (call it b) from the
*           left, using the last column of T as workspace
*
*           Let  V = ( V1 )   and   b = ( b1 )   (first I-1 rows)
*                    ( V2 )             ( b2 )
*
*           where V1 is unit lower triangular
*
*           w := V1**T * b1
*
            CALL dcopy( i-1, a( k+1, i ), 1, t( 1, nb ), 1 )
            CALL dtrmv( 'Lower', 'Transpose', 'Unit', i-1, a( k+1, 1 ),
     $                  lda, t( 1, nb ), 1 )
*
*           w := w + V2**T *b2
*
            CALL dgemv( 'Transpose', n-k-i+1, i-1, one, a( k+i, 1 ),
     $                  lda, a( k+i, i ), 1, one, t( 1, nb ), 1 )
*
*           w := T**T *w
*
            CALL dtrmv( 'Upper', 'Transpose', 'Non-unit', i-1, t, ldt,
     $                  t( 1, nb ), 1 )
*
*           b2 := b2 - V2*w
*
            CALL dgemv( 'No transpose', n-k-i+1, i-1, -one, a( k+i, 1 ),
     $                  lda, t( 1, nb ), 1, one, a( k+i, i ), 1 )
*
*           b1 := b1 - V1*w
*
            CALL dtrmv( 'Lower', 'No transpose', 'Unit', i-1,
     $                  a( k+1, 1 ), lda, t( 1, nb ), 1 )
            CALL daxpy( i-1, -one, t( 1, nb ), 1, a( k+1, i ), 1 )
*
*           Put back the entry of the previous column that was
*           replaced by ONE when H(i-1) was generated.
*
            a( k+i-1, i-1 ) = ei
         END IF
*
*        Generate the elementary reflector H(i) to annihilate
*        A(k+i+1:n,i)
*
         CALL dlarfg( n-k-i+1, a( k+i, i ), a( min( k+i+1, n ), i ), 1,
     $                tau( i ) )
*
*        Save the entry left at A(k+i,i) in EI and overwrite it with
*        ONE, so that A(k+i:n,i) holds the reflector vector with its
*        unit leading element for the products below.
*
         ei = a( k+i, i )
         a( k+i, i ) = one
*
*        Compute  Y(1:n,i)
*
*        Y(1:n,i) := A(1:n,i+1:n-k+1) * v
*
         CALL dgemv( 'No transpose', n, n-k-i+1, one, a( 1, i+1 ), lda,
     $               a( k+i, i ), 1, zero, y( 1, i ), 1 )
*
*        T(1:i-1,i) := V2**T * v   (also reused for T below)
*
         CALL dgemv( 'Transpose', n-k-i+1, i-1, one, a( k+i, 1 ), lda,
     $               a( k+i, i ), 1, zero, t( 1, i ), 1 )
*
*        Y(1:n,i) := tau * ( Y(1:n,i) - Y(1:n,1:i-1) * T(1:i-1,i) )
*
         CALL dgemv( 'No transpose', n, i-1, -one, y, ldy, t( 1, i ), 1,
     $               one, y( 1, i ), 1 )
         CALL dscal( n, tau( i ), y( 1, i ), 1 )
*
*        Compute T(1:i,i)
*
*        T(1:i-1,i) := -tau * T(1:i-1,1:i-1) * T(1:i-1,i),  T(i,i) := tau
*
         CALL dscal( i-1, -tau( i ), t( 1, i ), 1 )
         CALL dtrmv( 'Upper', 'No transpose', 'Non-unit', i-1, t, ldt,
     $               t( 1, i ), 1 )
         t( i, i ) = tau( i )
*
   10 CONTINUE
*
*     Put back the entry of column NB that was replaced by ONE.
*
      a( k+nb, nb ) = ei
*
      RETURN
*
*     End of DLAHRD
*
◆ dlaic1()

subroutine dlaic1	(	integer	job,
		integer	j,
		double precision, dimension( j )	x,
		double precision	sest,
		double precision, dimension( j )	w,
		double precision	gamma,
		double precision	sestpr,
		double precision	s,
		double precision	c )

DLAIC1 applies one step of incremental condition estimation.

Download DLAIC1 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAIC1 applies one step of incremental condition estimation in
!> its simplest version:
!>
!> Let x, twonorm(x) = 1, be an approximate singular vector of a j-by-j
!> lower triangular matrix L, such that
!>          twonorm(L*x) = sest
!> Then DLAIC1 computes sestpr, s, c such that
!> the vector
!>                 [ s*x ]
!>          xhat = [  c  ]
!> is an approximate singular vector of
!>                 [ L       0  ]
!>          Lhat = [ w**T gamma ]
!> in the sense that
!>          twonorm(Lhat*xhat) = sestpr.
!>
!> Depending on JOB, an estimate for the largest or smallest singular
!> value is computed.
!>
!> Note that [s c]**T and sestpr**2 is an eigenpair of the system
!>
!>     diag(sest*sest, 0) + [alpha  gamma] * [ alpha ]
!>                                           [ gamma ]
!>
!> where  alpha =  x**T*w.
!>

Parameters

[in]	JOB	!> JOB is INTEGER !> = 1: an estimate for the largest singular value is computed. !> = 2: an estimate for the smallest singular value is computed. !>
[in]	J	!> J is INTEGER !> Length of X and W !>
[in]	X	!> X is DOUBLE PRECISION array, dimension (J) !> The j-vector x. !>
[in]	SEST	!> SEST is DOUBLE PRECISION !> Estimated singular value of j by j matrix L !>
[in]	W	!> W is DOUBLE PRECISION array, dimension (J) !> The j-vector w. !>
[in]	GAMMA	!> GAMMA is DOUBLE PRECISION !> The diagonal element gamma. !>
[out]	SESTPR	!> SESTPR is DOUBLE PRECISION !> Estimated singular value of (j+1) by (j+1) matrix Lhat. !>
[out]	S	!> S is DOUBLE PRECISION !> Sine needed in forming xhat. !>
[out]	C	!> C is DOUBLE PRECISION !> Cosine needed in forming xhat. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 133 of file dlaic1.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of DLAIC1: one step of incremental condition estimation.
*  From X, W, SEST and GAMMA it produces SESTPR, S and C.  JOB = 1
*  handles the largest singular value, JOB = 2 the smallest; for any
*  other JOB no output is assigned.  Every path leaves through the
*  single RETURN at the bottom.
*
*     .. Scalar Arguments ..
      INTEGER            J, JOB
      DOUBLE PRECISION   C, GAMMA, S, SEST, SESTPR
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   W( J ), X( J )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, HALF, ONE, TWO, FOUR
      parameter( zero = 0.0d0, half = 0.5d0, one = 1.0d0,
     $                   two = 2.0d0, four = 4.0d0 )
*     ..
*     .. Local Scalars ..
*     ALPABS, GAMABS, ESTABS : |alpha|, |gamma|, |sest|
*     Z1, Z2                 : alpha and gamma divided by |sest|
*     SN, CS                 : unnormalised sine / cosine
*     ROOT                   : root of the secular equation
*     U1, U2, WRK            : scratch
      DOUBLE PRECISION   ALPABS, ALPHA, B, CS, EPS, ESTABS, GAMABS,
     $                   NORMA, ROOT, SN, TEST, U1, U2, WRK, Z1, Z2
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, sign, sqrt
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DDOT, DLAMCH
      EXTERNAL           ddot, dlamch
*     ..
*     .. Executable Statements ..
*
*     alpha = x**T * w, plus the magnitudes used by all the tests
*
      eps = dlamch( 'Epsilon' )
      alpha = ddot( j, x, 1, w, 1 )
*
      alpabs = abs( alpha )
      gamabs = abs( gamma )
      estabs = abs( sest )
*
      IF( job.EQ.1 ) THEN
*
*        ---------------------------------------------------------
*        Largest singular value
*        ---------------------------------------------------------
*
         IF( sest.EQ.zero ) THEN
*
*           sest is exactly zero
*
            u1 = max( gamabs, alpabs )
            IF( u1.EQ.zero ) THEN
               s = zero
               c = one
               sestpr = zero
            ELSE
               s = alpha / u1
               c = gamma / u1
               wrk = sqrt( s*s+c*c )
               s = s / wrk
               c = c / wrk
               sestpr = u1*wrk
            END IF
*
         ELSE IF( gamabs.LE.eps*estabs ) THEN
*
*           gamma negligible relative to sest
*
            s = one
            c = zero
            wrk = max( estabs, alpabs )
            u1 = estabs / wrk
            u2 = alpabs / wrk
            sestpr = wrk*sqrt( u1*u1+u2*u2 )
*
         ELSE IF( alpabs.LE.eps*estabs ) THEN
*
*           alpha negligible relative to sest: take the larger of
*           |gamma| and |sest|
*
            IF( gamabs.LE.estabs ) THEN
               s = one
               c = zero
               sestpr = estabs
            ELSE
               s = zero
               c = one
               sestpr = gamabs
            END IF
*
         ELSE IF( estabs.LE.eps*alpabs .OR. estabs.LE.eps*gamabs ) THEN
*
*           sest negligible relative to alpha or gamma
*
            IF( gamabs.LE.alpabs ) THEN
               wrk = gamabs / alpabs
               s = sqrt( one+wrk*wrk )
               sestpr = alpabs*s
               c = ( gamma / alpabs ) / s
               s = sign( one, alpha ) / s
            ELSE
               wrk = alpabs / gamabs
               c = sqrt( one+wrk*wrk )
               sestpr = gamabs*c
               s = ( alpha / gamabs ) / c
               c = sign( one, gamma ) / c
            END IF
*
         ELSE
*
*           General case.  C is used as scratch until it receives
*           its final value below.
*
            z1 = alpha / estabs
            z2 = gamma / estabs
*
            b = ( one-z1*z1-z2*z2 )*half
            c = z1*z1
            IF( b.GT.zero ) THEN
               root = c / ( b+sqrt( b*b+c ) )
            ELSE
               root = sqrt( b*b+c ) - b
            END IF
*
            sn = -z1 / root
            cs = -z2 / ( one+root )
            wrk = sqrt( sn*sn+cs*cs )
            s = sn / wrk
            c = cs / wrk
            sestpr = sqrt( root+one )*estabs
         END IF
*
      ELSE IF( job.EQ.2 ) THEN
*
*        ---------------------------------------------------------
*        Smallest singular value
*        ---------------------------------------------------------
*
         IF( sest.EQ.zero ) THEN
*
*           sest is exactly zero
*
            sestpr = zero
            IF( max( gamabs, alpabs ).EQ.zero ) THEN
               sn = one
               cs = zero
            ELSE
               sn = -gamma
               cs = alpha
            END IF
            u1 = max( abs( sn ), abs( cs ) )
            s = sn / u1
            c = cs / u1
            wrk = sqrt( s*s+c*c )
            s = s / wrk
            c = c / wrk
*
         ELSE IF( gamabs.LE.eps*estabs ) THEN
*
*           gamma negligible relative to sest
*
            s = zero
            c = one
            sestpr = gamabs
*
         ELSE IF( alpabs.LE.eps*estabs ) THEN
*
*           alpha negligible relative to sest: take the smaller of
*           |gamma| and |sest|
*
            IF( gamabs.LE.estabs ) THEN
               s = zero
               c = one
               sestpr = gamabs
            ELSE
               s = one
               c = zero
               sestpr = estabs
            END IF
*
         ELSE IF( estabs.LE.eps*alpabs .OR. estabs.LE.eps*gamabs ) THEN
*
*           sest negligible relative to alpha or gamma
*
            IF( gamabs.LE.alpabs ) THEN
               wrk = gamabs / alpabs
               c = sqrt( one+wrk*wrk )
               sestpr = estabs*( wrk / c )
               s = -( gamma / alpabs ) / c
               c = sign( one, alpha ) / c
            ELSE
               wrk = alpabs / gamabs
               s = sqrt( one+wrk*wrk )
               sestpr = estabs / s
               c = ( alpha / gamabs ) / s
               s = -sign( one, gamma ) / s
            END IF
*
         ELSE
*
*           General case.  C is used as scratch until it receives
*           its final value below.
*
            z1 = alpha / estabs
            z2 = gamma / estabs
*
            norma = max( one+z1*z1+abs( z1*z2 ),
     $              abs( z1*z2 )+z2*z2 )
*
*           The sign of TEST selects which of the two formulas for
*           the root is used
*
            test = one + two*( z1-z2 )*( z1+z2 )
            IF( test.GE.zero ) THEN
*
*              Root near zero: evaluate it directly
*
               b = ( z1*z1+z2*z2+one )*half
               c = z2*z2
               root = c / ( b+sqrt( abs( b*b-c ) ) )
               sn = z1 / ( one-root )
               cs = -z2 / root
               sestpr = sqrt( root+four*eps*eps*norma )*estabs
            ELSE
*
*              Root near ONE: work with the shifted root
*
               b = ( z2*z2+z1*z1-one )*half
               c = z1*z1
               IF( b.GE.zero ) THEN
                  root = -c / ( b+sqrt( b*b+c ) )
               ELSE
                  root = b - sqrt( b*b+c )
               END IF
               sn = -z1 / root
               cs = -z2 / ( one+root )
               sestpr = sqrt( one+root+four*eps*eps*norma )*estabs
            END IF
*
*           Normalise ( SN, CS ) to unit length
*
            wrk = sqrt( sn*sn+cs*cs )
            s = sn / wrk
            c = cs / wrk
         END IF
      END IF
*
      RETURN
*
*     End of DLAIC1
*

◆ dlaln2()

subroutine dlaln2	(	logical	ltrans,
		integer	na,
		integer	nw,
		double precision	smin,
		double precision	ca,
		double precision, dimension( lda, * )	a,
		integer	lda,
		double precision	d1,
		double precision	d2,
		double precision, dimension( ldb, * )	b,
		integer	ldb,
		double precision	wr,
		double precision	wi,
		double precision, dimension( ldx, * )	x,
		integer	ldx,
		double precision	scale,
		double precision	xnorm,
		integer	info )

DLALN2 solves a 1-by-1 or 2-by-2 linear system of equations of the specified form.

Download DLALN2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLALN2 solves a system of the form  (ca A - w D ) X = s B
!> or (ca A**T - w D) X = s B   with possible scaling ("s") and
!> perturbation of A.  (A**T means A-transpose.)
!>
!> A is an NA x NA real matrix, ca is a real scalar, D is an NA x NA
!> real diagonal matrix, w is a real or complex value, and X and B are
!> NA x 1 matrices -- real if w is real, complex if w is complex.  NA
!> may be 1 or 2.
!>
!> If w is complex, X and B are represented as NA x 2 matrices,
!> the first column of each being the real part and the second
!> being the imaginary part.
!>
!> "s" is a scaling factor (<= 1), computed by DLALN2, which is
!> so chosen that X can be computed without overflow.  X is further
!> scaled if necessary to assure that norm(ca A - w D)*norm(X) is less
!> than overflow.
!>
!> If both singular values of (ca A - w D) are less than SMIN,
!> SMIN*identity will be used instead of (ca A - w D).  If only one
!> singular value is less than SMIN, one element of (ca A - w D) will be
!> perturbed enough to make the smallest singular value roughly SMIN.
!> If both singular values are at least SMIN, (ca A - w D) will not be
!> perturbed.  In any case, the perturbation will be at most some small
!> multiple of max( SMIN, ulp*norm(ca A - w D) ).  The singular values
!> are computed by infinity-norm approximations, and thus will only be
!> correct to a factor of 2 or so.
!>
!> Note: all input quantities are assumed to be smaller than overflow
!> by a reasonable factor.  (See BIGNUM.)
!>

Parameters

[in]	LTRANS	!> LTRANS is LOGICAL !> =.TRUE.: A-transpose will be used. !> =.FALSE.: A will be used (not transposed.) !>
[in]	NA	!> NA is INTEGER !> The size of the matrix A. It may (only) be 1 or 2. !>
[in]	NW	!> NW is INTEGER !> 1 if "w" is real, 2 if "w" is complex. It may only be 1 !> or 2. !>
[in]	SMIN	!> SMIN is DOUBLE PRECISION !> The desired lower bound on the singular values of A. This !> should be a safe distance away from underflow or overflow, !> say, between (underflow/machine precision) and (machine !> precision * overflow ). (See BIGNUM and ULP.) !>
[in]	CA	!> CA is DOUBLE PRECISION !> The coefficient c, which A is multiplied by. !>
[in]	A	!> A is DOUBLE PRECISION array, dimension (LDA,NA) !> The NA x NA matrix A. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of A. It must be at least NA. !>
[in]	D1	!> D1 is DOUBLE PRECISION !> The 1,1 element in the diagonal matrix D. !>
[in]	D2	!> D2 is DOUBLE PRECISION !> The 2,2 element in the diagonal matrix D. Not used if NA=1. !>
[in]	B	!> B is DOUBLE PRECISION array, dimension (LDB,NW) !> The NA x NW matrix B (right-hand side). If NW=2 ("w" is !> complex), column 1 contains the real part of B and column 2 !> contains the imaginary part. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of B. It must be at least NA. !>
[in]	WR	!> WR is DOUBLE PRECISION !> The real part of the scalar "w". !>
[in]	WI	!> WI is DOUBLE PRECISION !> The imaginary part of the scalar "w". Not used if NW=1. !>
[out]	X	!> X is DOUBLE PRECISION array, dimension (LDX,NW) !> The NA x NW matrix X (unknowns), as computed by DLALN2. !> If NW=2 ("w" is complex), on exit, column 1 will contain !> the real part of X and column 2 will contain the imaginary !> part. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of X. It must be at least NA. !>
[out]	SCALE	!> SCALE is DOUBLE PRECISION !> The scale factor that B must be multiplied by to insure !> that overflow does not occur when computing X. Thus, !> (ca A - w D) X will be SCALE*B, not B (ignoring !> perturbations of A.) It will be at most 1. !>
[out]	XNORM	!> XNORM is DOUBLE PRECISION !> The infinity-norm of X, when X is regarded as an NA x NW !> real matrix. !>
[out]	INFO	!> INFO is INTEGER !> An error flag. It will be set to zero if no error occurs, !> a negative number if an argument is in error, or a positive !> number if ca A - w D had to be perturbed. !> The possible values are: !> = 0: No error occurred, and (ca A - w D) did not have to be !> perturbed. !> = 1: (ca A - w D) had to be perturbed to make its smallest !> (or only) singular value greater than SMIN. !> NOTE: In the interests of speed, this routine does not !> check the inputs for errors. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 216 of file dlaln2.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      LOGICAL            LTRANS
      INTEGER            INFO, LDA, LDB, LDX, NA, NW
      DOUBLE PRECISION   CA, D1, D2, SCALE, SMIN, WI, WR, XNORM
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * ), B( LDB, * ), X( LDX, * )
*     ..
*
* =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d0, one = 1.0d0 )
      DOUBLE PRECISION   TWO
      parameter( two = 2.0d0 )
*     ..
*     .. Local Scalars ..
      INTEGER            ICMAX, J
      DOUBLE PRECISION   BBND, BI1, BI2, BIGNUM, BNORM, BR1, BR2, CI21,
     $                   CI22, CMAX, CNORM, CR21, CR22, CSI, CSR, LI21,
     $                   LR21, SMINI, SMLNUM, TEMP, U22ABS, UI11, UI11R,
     $                   UI12, UI12S, UI22, UR11, UR11R, UR12, UR12S,
     $                   UR22, XI1, XI2, XR1, XR2
*     ..
*     .. Local Arrays ..
      LOGICAL            RSWAP( 4 ), ZSWAP( 4 )
      INTEGER            IPIVOT( 4, 4 )
      DOUBLE PRECISION   CI( 2, 2 ), CIV( 4 ), CR( 2, 2 ), CRV( 4 )
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           dlamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           dladiv
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max
*     ..
*     .. Equivalences ..
      equivalence( ci( 1, 1 ), civ( 1 ) ),
     $                   ( cr( 1, 1 ), crv( 1 ) )
*     ..
*     .. Data statements ..
      DATA               zswap / .false., .false., .true., .true. /
      DATA               rswap / .false., .true., .false., .true. /
      DATA               ipivot / 1, 2, 3, 4, 2, 1, 4, 3, 3, 4, 1, 2, 4,
     $                   3, 2, 1 /
*     ..
*     .. Executable Statements ..
*
*     Compute BIGNUM
*
      smlnum = two*dlamch( 'Safe minimum' )
      bignum = one / smlnum
      smini = max( smin, smlnum )
*
*     Don't check for input errors
*
      info = 0
*
*     Standard Initializations
*
      scale = one
*
      IF( na.EQ.1 ) THEN
*
*        1 x 1  (i.e., scalar) system   C X = B
*
         IF( nw.EQ.1 ) THEN
*
*           Real 1x1 system.
*
*           C = ca A - w D
*
            csr = ca*a( 1, 1 ) - wr*d1
            cnorm = abs( csr )
*
*           If | C | < SMINI, use C = SMINI
*
            IF( cnorm.LT.smini ) THEN
               csr = smini
               cnorm = smini
               info = 1
            END IF
*
*           Check scaling for  X = B / C
*
            bnorm = abs( b( 1, 1 ) )
            IF( cnorm.LT.one .AND. bnorm.GT.one ) THEN
               IF( bnorm.GT.bignum*cnorm )
     $            scale = one / bnorm
            END IF
*
*           Compute X
*
            x( 1, 1 ) = ( b( 1, 1 )*scale ) / csr
            xnorm = abs( x( 1, 1 ) )
         ELSE
*
*           Complex 1x1 system (w is complex)
*
*           C = ca A - w D
*
            csr = ca*a( 1, 1 ) - wr*d1
            csi = -wi*d1
            cnorm = abs( csr ) + abs( csi )
*
*           If | C | < SMINI, use C = SMINI
*
            IF( cnorm.LT.smini ) THEN
               csr = smini
               csi = zero
               cnorm = smini
               info = 1
            END IF
*
*           Check scaling for  X = B / C
*
            bnorm = abs( b( 1, 1 ) ) + abs( b( 1, 2 ) )
            IF( cnorm.LT.one .AND. bnorm.GT.one ) THEN
               IF( bnorm.GT.bignum*cnorm )
     $            scale = one / bnorm
            END IF
*
*           Compute X
*
            CALL dladiv( scale*b( 1, 1 ), scale*b( 1, 2 ), csr, csi,
     $                   x( 1, 1 ), x( 1, 2 ) )
            xnorm = abs( x( 1, 1 ) ) + abs( x( 1, 2 ) )
         END IF
*
      ELSE
*
*        2x2 System
*
*        Compute the real part of  C = ca A - w D  (or  ca A**T - w D )
*
         cr( 1, 1 ) = ca*a( 1, 1 ) - wr*d1
         cr( 2, 2 ) = ca*a( 2, 2 ) - wr*d2
         IF( ltrans ) THEN
            cr( 1, 2 ) = ca*a( 2, 1 )
            cr( 2, 1 ) = ca*a( 1, 2 )
         ELSE
            cr( 2, 1 ) = ca*a( 2, 1 )
            cr( 1, 2 ) = ca*a( 1, 2 )
         END IF
*
         IF( nw.EQ.1 ) THEN
*
*           Real 2x2 system  (w is real)
*
*           Find the largest element in C
*
            cmax = zero
            icmax = 0
*
            DO 10 j = 1, 4
               IF( abs( crv( j ) ).GT.cmax ) THEN
                  cmax = abs( crv( j ) )
                  icmax = j
               END IF
   10       CONTINUE
*
*           If norm(C) < SMINI, use SMINI*identity.
*
            IF( cmax.LT.smini ) THEN
               bnorm = max( abs( b( 1, 1 ) ), abs( b( 2, 1 ) ) )
               IF( smini.LT.one .AND. bnorm.GT.one ) THEN
                  IF( bnorm.GT.bignum*smini )
     $               scale = one / bnorm
               END IF
               temp = scale / smini
               x( 1, 1 ) = temp*b( 1, 1 )
               x( 2, 1 ) = temp*b( 2, 1 )
               xnorm = temp*bnorm
               info = 1
               RETURN
            END IF
*
*           Gaussian elimination with complete pivoting.
*
            ur11 = crv( icmax )
            cr21 = crv( ipivot( 2, icmax ) )
            ur12 = crv( ipivot( 3, icmax ) )
            cr22 = crv( ipivot( 4, icmax ) )
            ur11r = one / ur11
            lr21 = ur11r*cr21
            ur22 = cr22 - ur12*lr21
*
*           If smaller pivot < SMINI, use SMINI
*
            IF( abs( ur22 ).LT.smini ) THEN
               ur22 = smini
               info = 1
            END IF
            IF( rswap( icmax ) ) THEN
               br1 = b( 2, 1 )
               br2 = b( 1, 1 )
            ELSE
               br1 = b( 1, 1 )
               br2 = b( 2, 1 )
            END IF
            br2 = br2 - lr21*br1
            bbnd = max( abs( br1*( ur22*ur11r ) ), abs( br2 ) )
            IF( bbnd.GT.one .AND. abs( ur22 ).LT.one ) THEN
               IF( bbnd.GE.bignum*abs( ur22 ) )
     $            scale = one / bbnd
            END IF
*
            xr2 = ( br2*scale ) / ur22
            xr1 = ( scale*br1 )*ur11r - xr2*( ur11r*ur12 )
            IF( zswap( icmax ) ) THEN
               x( 1, 1 ) = xr2
               x( 2, 1 ) = xr1
            ELSE
               x( 1, 1 ) = xr1
               x( 2, 1 ) = xr2
            END IF
            xnorm = max( abs( xr1 ), abs( xr2 ) )
*
*           Further scaling if  norm(A) norm(X) > overflow
*
            IF( xnorm.GT.one .AND. cmax.GT.one ) THEN
               IF( xnorm.GT.bignum / cmax ) THEN
                  temp = cmax / bignum
                  x( 1, 1 ) = temp*x( 1, 1 )
                  x( 2, 1 ) = temp*x( 2, 1 )
                  xnorm = temp*xnorm
                  scale = temp*scale
               END IF
            END IF
         ELSE
*
*           Complex 2x2 system  (w is complex)
*
*           Find the largest element in C
*
            ci( 1, 1 ) = -wi*d1
            ci( 2, 1 ) = zero
            ci( 1, 2 ) = zero
            ci( 2, 2 ) = -wi*d2
            cmax = zero
            icmax = 0
*
            DO 20 j = 1, 4
               IF( abs( crv( j ) )+abs( civ( j ) ).GT.cmax ) THEN
                  cmax = abs( crv( j ) ) + abs( civ( j ) )
                  icmax = j
               END IF
   20       CONTINUE
*
*           If norm(C) < SMINI, use SMINI*identity.
*
            IF( cmax.LT.smini ) THEN
               bnorm = max( abs( b( 1, 1 ) )+abs( b( 1, 2 ) ),
     $                 abs( b( 2, 1 ) )+abs( b( 2, 2 ) ) )
               IF( smini.LT.one .AND. bnorm.GT.one ) THEN
                  IF( bnorm.GT.bignum*smini )
     $               scale = one / bnorm
               END IF
               temp = scale / smini
               x( 1, 1 ) = temp*b( 1, 1 )
               x( 2, 1 ) = temp*b( 2, 1 )
               x( 1, 2 ) = temp*b( 1, 2 )
               x( 2, 2 ) = temp*b( 2, 2 )
               xnorm = temp*bnorm
               info = 1
               RETURN
            END IF
*
*           Gaussian elimination with complete pivoting.
*
            ur11 = crv( icmax )
            ui11 = civ( icmax )
            cr21 = crv( ipivot( 2, icmax ) )
            ci21 = civ( ipivot( 2, icmax ) )
            ur12 = crv( ipivot( 3, icmax ) )
            ui12 = civ( ipivot( 3, icmax ) )
            cr22 = crv( ipivot( 4, icmax ) )
            ci22 = civ( ipivot( 4, icmax ) )
            IF( icmax.EQ.1 .OR. icmax.EQ.4 ) THEN
*
*              Code when off-diagonals of pivoted C are real
*
               IF( abs( ur11 ).GT.abs( ui11 ) ) THEN
                  temp = ui11 / ur11
                  ur11r = one / ( ur11*( one+temp**2 ) )
                  ui11r = -temp*ur11r
               ELSE
                  temp = ur11 / ui11
                  ui11r = -one / ( ui11*( one+temp**2 ) )
                  ur11r = -temp*ui11r
               END IF
               lr21 = cr21*ur11r
               li21 = cr21*ui11r
               ur12s = ur12*ur11r
               ui12s = ur12*ui11r
               ur22 = cr22 - ur12*lr21
               ui22 = ci22 - ur12*li21
            ELSE
*
*              Code when diagonals of pivoted C are real
*
               ur11r = one / ur11
               ui11r = zero
               lr21 = cr21*ur11r
               li21 = ci21*ur11r
               ur12s = ur12*ur11r
               ui12s = ui12*ur11r
               ur22 = cr22 - ur12*lr21 + ui12*li21
               ui22 = -ur12*li21 - ui12*lr21
            END IF
            u22abs = abs( ur22 ) + abs( ui22 )
*
*           If smaller pivot < SMINI, use SMINI
*
            IF( u22abs.LT.smini ) THEN
               ur22 = smini
               ui22 = zero
               info = 1
            END IF
            IF( rswap( icmax ) ) THEN
               br2 = b( 1, 1 )
               br1 = b( 2, 1 )
               bi2 = b( 1, 2 )
               bi1 = b( 2, 2 )
            ELSE
               br1 = b( 1, 1 )
               br2 = b( 2, 1 )
               bi1 = b( 1, 2 )
               bi2 = b( 2, 2 )
            END IF
            br2 = br2 - lr21*br1 + li21*bi1
            bi2 = bi2 - li21*br1 - lr21*bi1
            bbnd = max( ( abs( br1 )+abs( bi1 ) )*
     $             ( u22abs*( abs( ur11r )+abs( ui11r ) ) ),
     $             abs( br2 )+abs( bi2 ) )
            IF( bbnd.GT.one .AND. u22abs.LT.one ) THEN
               IF( bbnd.GE.bignum*u22abs ) THEN
                  scale = one / bbnd
                  br1 = scale*br1
                  bi1 = scale*bi1
                  br2 = scale*br2
                  bi2 = scale*bi2
               END IF
            END IF
*
            CALL dladiv( br2, bi2, ur22, ui22, xr2, xi2 )
            xr1 = ur11r*br1 - ui11r*bi1 - ur12s*xr2 + ui12s*xi2
            xi1 = ui11r*br1 + ur11r*bi1 - ui12s*xr2 - ur12s*xi2
            IF( zswap( icmax ) ) THEN
               x( 1, 1 ) = xr2
               x( 2, 1 ) = xr1
               x( 1, 2 ) = xi2
               x( 2, 2 ) = xi1
            ELSE
               x( 1, 1 ) = xr1
               x( 2, 1 ) = xr2
               x( 1, 2 ) = xi1
               x( 2, 2 ) = xi2
            END IF
            xnorm = max( abs( xr1 )+abs( xi1 ), abs( xr2 )+abs( xi2 ) )
*
*           Further scaling if  norm(A) norm(X) > overflow
*
            IF( xnorm.GT.one .AND. cmax.GT.one ) THEN
               IF( xnorm.GT.bignum / cmax ) THEN
                  temp = cmax / bignum
                  x( 1, 1 ) = temp*x( 1, 1 )
                  x( 2, 1 ) = temp*x( 2, 1 )
                  x( 1, 2 ) = temp*x( 1, 2 )
                  x( 2, 2 ) = temp*x( 2, 2 )
                  xnorm = temp*xnorm
                  scale = temp*scale
               END IF
            END IF
         END IF
      END IF
*
      RETURN
*
*     End of DLALN2
*

◆ dlangt()

double precision function dlangt	(	character	norm,
		integer	n,
		double precision, dimension( * )	dl,
		double precision, dimension( * )	d,
		double precision, dimension( * )	du )

DLANGT returns the value of the 1-norm, Frobenius norm, infinity-norm, or the largest absolute value of any element of a general tridiagonal matrix.

Download DLANGT + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLANGT  returns the value of the one norm,  or the Frobenius norm, or
!> the  infinity norm,  or the  element of  largest absolute value  of a
!> real tridiagonal matrix A.
!>

Returns

DLANGT

!>
!>    DLANGT = ( max(abs(A(i,j))), NORM = 'M' or 'm'
!>             (
!>             ( norm1(A),         NORM = '1', 'O' or 'o'
!>             (
!>             ( normI(A),         NORM = 'I' or 'i'
!>             (
!>             ( normF(A),         NORM = 'F', 'f', 'E' or 'e'
!>
!> where  norm1  denotes the  one norm of a matrix (maximum column sum),
!> normI  denotes the  infinity norm  of a matrix  (maximum row sum) and
!> normF  denotes the  Frobenius norm of a matrix (square root of sum of
!> squares).  Note that  max(abs(A(i,j)))  is not a consistent matrix norm.
!>

Parameters

[in]	NORM	!> NORM is CHARACTER*1 !> Specifies the value to be returned in DLANGT as described !> above. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. When N = 0, DLANGT is !> set to zero. !>
[in]	DL	!> DL is DOUBLE PRECISION array, dimension (N-1) !> The (n-1) sub-diagonal elements of A. !>
[in]	D	!> D is DOUBLE PRECISION array, dimension (N) !> The diagonal elements of A. !>
[in]	DU	!> DU is DOUBLE PRECISION array, dimension (N-1) !> The (n-1) super-diagonal elements of A. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 105 of file dlangt.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLANGT: norm of a real tridiagonal matrix stored as the
*     three vectors DL (sub-diagonal), D (diagonal) and DU
*     (super-diagonal).  NORM selects the largest absolute entry
*     ('M'), the one norm ('O' or '1'), the infinity norm ('I') or
*     the Frobenius norm ('F' or 'E').
*
*     .. Scalar Arguments ..
      CHARACTER          NORM
      INTEGER            N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   D( * ), DL( * ), DU( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, ZERO
      parameter( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            K
      DOUBLE PRECISION   CAND, RES, SCL, SSQ
*     ..
*     .. External Functions ..
      LOGICAL            LSAME, DISNAN
      EXTERNAL           lsame, disnan
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlassq
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, sqrt
*     ..
*     .. Executable Statements ..
*
*     A matrix of non-positive order has norm zero for every NORM.
*
      IF( n.LE.0 ) THEN
         dlangt = zero
         RETURN
      END IF
*
      IF( lsame( norm, 'M' ) ) THEN
*
*        Largest absolute entry.  The scan starts from D(N), the one
*        element the loop over 1..N-1 does not visit.  The DISNAN
*        test makes a NaN entry replace the running maximum.
*
         res = abs( d( n ) )
         DO k = 1, n - 1
            cand = abs( dl( k ) )
            IF( res.LT.cand .OR. disnan( cand ) ) res = cand
            cand = abs( d( k ) )
            IF( res.LT.cand .OR. disnan( cand ) ) res = cand
            cand = abs( du( k ) )
            IF( res.LT.cand .OR. disnan( cand ) ) res = cand
         END DO
      ELSE IF( lsame( norm, 'O' ) .OR. norm.EQ.'1' ) THEN
*
*        One norm: largest column sum.  Column 1 and column N hold
*        only two entries each and are handled before the loop.
*
         IF( n.EQ.1 ) THEN
            res = abs( d( 1 ) )
         ELSE
            res = abs( d( 1 ) )+abs( dl( 1 ) )
            cand = abs( d( n ) )+abs( du( n-1 ) )
            IF( res.LT.cand .OR. disnan( cand ) ) res = cand
            DO k = 2, n - 1
               cand = abs( d( k ) )+abs( dl( k ) )+abs( du( k-1 ) )
               IF( res.LT.cand .OR. disnan( cand ) ) res = cand
            END DO
         END IF
      ELSE IF( lsame( norm, 'I' ) ) THEN
*
*        Infinity norm: largest row sum.  Row 1 and row N hold only
*        two entries each and are handled before the loop.
*
         IF( n.EQ.1 ) THEN
            res = abs( d( 1 ) )
         ELSE
            res = abs( d( 1 ) )+abs( du( 1 ) )
            cand = abs( d( n ) )+abs( dl( n-1 ) )
            IF( res.LT.cand .OR. disnan( cand ) ) res = cand
            DO k = 2, n - 1
               cand = abs( d( k ) )+abs( du( k ) )+abs( dl( k-1 ) )
               IF( res.LT.cand .OR. disnan( cand ) ) res = cand
            END DO
         END IF
      ELSE IF( ( lsame( norm, 'F' ) ) .OR. ( lsame( norm, 'E' ) ) ) THEN
*
*        Frobenius norm: DLASSQ accumulates the three vectors into
*        the pair ( SCL, SSQ ); the norm is SCL*sqrt( SSQ ).
*
         scl = zero
         ssq = one
         CALL dlassq( n, d, 1, scl, ssq )
         IF( n.GT.1 ) THEN
            CALL dlassq( n-1, dl, 1, scl, ssq )
            CALL dlassq( n-1, du, 1, scl, ssq )
         END IF
         res = scl*sqrt( ssq )
      END IF
*
      dlangt = res
      RETURN
*
*     End of DLANGT
*

◆ dlanhs()

double precision function dlanhs	(	character	norm,
		integer	n,
		double precision, dimension( lda, * )	a,
		integer	lda,
		double precision, dimension( * )	work )

DLANHS returns the value of the 1-norm, Frobenius norm, infinity-norm, or the largest absolute value of any element of an upper Hessenberg matrix.

Download DLANHS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLANHS  returns the value of the one norm,  or the Frobenius norm, or
!> the  infinity norm,  or the  element of  largest absolute value  of a
!> Hessenberg matrix A.
!>

Returns

DLANHS

!>
!>    DLANHS = ( max(abs(A(i,j))), NORM = 'M' or 'm'
!>             (
!>             ( norm1(A),         NORM = '1', 'O' or 'o'
!>             (
!>             ( normI(A),         NORM = 'I' or 'i'
!>             (
!>             ( normF(A),         NORM = 'F', 'f', 'E' or 'e'
!>
!> where  norm1  denotes the  one norm of a matrix (maximum column sum),
!> normI  denotes the  infinity norm  of a matrix  (maximum row sum) and
!> normF  denotes the  Frobenius norm of a matrix (square root of sum of
!> squares).  Note that  max(abs(A(i,j)))  is not a consistent matrix norm.
!>

Parameters

[in]	NORM	!> NORM is CHARACTER*1 !> Specifies the value to be returned in DLANHS as described !> above. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. When N = 0, DLANHS is !> set to zero. !>
[in]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> The n by n upper Hessenberg matrix A; the part of A below the !> first sub-diagonal is not referenced. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(N,1). !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (MAX(1,LWORK)), !> where LWORK >= N when NORM = 'I'; otherwise, WORK is not !> referenced. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 107 of file dlanhs.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLANHS: norm of an N-by-N upper Hessenberg matrix A.
*     In column J only rows 1..min( N, J+1 ) are read.  NORM selects
*     the largest absolute entry ('M'), the one norm ('O' or '1'),
*     the infinity norm ('I') or the Frobenius norm ('F' or 'E').
*
*     .. Scalar Arguments ..
      CHARACTER          NORM
      INTEGER            LDA, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * ), WORK( * )
*     ..
*
* =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, ZERO
      parameter( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            COL, LAST, ROW
      DOUBLE PRECISION   ACC, RES, SCL, SSQ
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlassq
*     ..
*     .. External Functions ..
      LOGICAL            LSAME, DISNAN
      EXTERNAL           lsame, disnan
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     The empty matrix has norm zero for every NORM.
*
      IF( n.EQ.0 ) THEN
         dlanhs = zero
         RETURN
      END IF
*
      IF( lsame( norm, 'M' ) ) THEN
*
*        Largest absolute entry.  The DISNAN test makes a NaN entry
*        replace the running maximum.
*
         res = zero
         DO col = 1, n
            last = min( n, col+1 )
            DO row = 1, last
               acc = abs( a( row, col ) )
               IF( res.LT.acc .OR. disnan( acc ) ) res = acc
            END DO
         END DO
      ELSE IF( ( lsame( norm, 'O' ) ) .OR. ( norm.EQ.'1' ) ) THEN
*
*        One norm: largest column sum.
*
         res = zero
         DO col = 1, n
            last = min( n, col+1 )
            acc = zero
            DO row = 1, last
               acc = acc + abs( a( row, col ) )
            END DO
            IF( res.LT.acc .OR. disnan( acc ) ) res = acc
         END DO
      ELSE IF( lsame( norm, 'I' ) ) THEN
*
*        Infinity norm: WORK( 1:N ) collects the row sums while A is
*        traversed column by column, then the largest one is taken.
*
         DO row = 1, n
            work( row ) = zero
         END DO
         DO col = 1, n
            last = min( n, col+1 )
            DO row = 1, last
               work( row ) = work( row ) + abs( a( row, col ) )
            END DO
         END DO
         res = zero
         DO row = 1, n
            acc = work( row )
            IF( res.LT.acc .OR. disnan( acc ) ) res = acc
         END DO
      ELSE IF( ( lsame( norm, 'F' ) ) .OR. ( lsame( norm, 'E' ) ) ) THEN
*
*        Frobenius norm: DLASSQ accumulates each column into the pair
*        ( SCL, SSQ ); the norm is SCL*sqrt( SSQ ).
*
         scl = zero
         ssq = one
         DO col = 1, n
            last = min( n, col+1 )
            CALL dlassq( last, a( 1, col ), 1, scl, ssq )
         END DO
         res = scl*sqrt( ssq )
      END IF
*
      dlanhs = res
      RETURN
*
*     End of DLANHS
*

◆ dlansb()

double precision function dlansb	(	character	norm,
		character	uplo,
		integer	n,
		integer	k,
		double precision, dimension( ldab, * )	ab,
		integer	ldab,
		double precision, dimension( * )	work )

DLANSB returns the value of the 1-norm, or the Frobenius norm, or the infinity norm, or the element of largest absolute value of a symmetric band matrix.

Download DLANSB + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLANSB  returns the value of the one norm,  or the Frobenius norm, or
!> the  infinity norm,  or the element of  largest absolute value  of an
!> n by n symmetric band matrix A,  with k super-diagonals.
!>

Returns

DLANSB

!>
!>    DLANSB = ( max(abs(A(i,j))), NORM = 'M' or 'm'
!>             (
!>             ( norm1(A),         NORM = '1', 'O' or 'o'
!>             (
!>             ( normI(A),         NORM = 'I' or 'i'
!>             (
!>             ( normF(A),         NORM = 'F', 'f', 'E' or 'e'
!>
!> where  norm1  denotes the  one norm of a matrix (maximum column sum),
!> normI  denotes the  infinity norm  of a matrix  (maximum row sum) and
!> normF  denotes the  Frobenius norm of a matrix (square root of sum of
!> squares).  Note that  max(abs(A(i,j)))  is not a consistent matrix norm.
!>

Parameters

[in]	NORM	!> NORM is CHARACTER*1 !> Specifies the value to be returned in DLANSB as described !> above. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the upper or lower triangular part of the !> band matrix A is supplied. !> = 'U': Upper triangular part is supplied !> = 'L': Lower triangular part is supplied !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. When N = 0, DLANSB is !> set to zero. !>
[in]	K	!> K is INTEGER !> The number of super-diagonals or sub-diagonals of the !> band matrix A. K >= 0. !>
[in]	AB	!> AB is DOUBLE PRECISION array, dimension (LDAB,N) !> The upper or lower triangle of the symmetric band matrix A, !> stored in the first K+1 rows of AB. The j-th column of A is !> stored in the j-th column of the array AB as follows: !> if UPLO = 'U', AB(k+1+i-j,j) = A(i,j) for max(1,j-k)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+k). !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= K+1. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (MAX(1,LWORK)), !> where LWORK >= N when NORM = 'I' or '1' or 'O'; otherwise, !> WORK is not referenced. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 127 of file dlansb.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLANSB: norm of an N-by-N symmetric band matrix with K
*     off-diagonals, of which one triangle is held in the first K+1
*     rows of AB.  NORM selects the largest absolute entry ('M'), the
*     one/infinity norm ('O', '1' or 'I'; equal by symmetry) or the
*     Frobenius norm ('F' or 'E').  Any UPLO other than 'U' is
*     treated as lower storage.
*
*     .. Scalar Arguments ..
      CHARACTER          NORM, UPLO
      INTEGER            K, LDAB, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   AB( LDAB, * ), WORK( * )
*     ..
*
* =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, ZERO
      parameter( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            COL, DROW, OFFS, ROW
      DOUBLE PRECISION   ACC, AIJ, RES, SCL, SSQ
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlassq
*     ..
*     .. External Functions ..
      LOGICAL            LSAME, DISNAN
      EXTERNAL           lsame, disnan
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     The empty matrix has norm zero for every NORM.
*
      IF( n.EQ.0 ) THEN
         dlansb = zero
         RETURN
      END IF
*
      upper = lsame( uplo, 'U' )
*
      IF( lsame( norm, 'M' ) ) THEN
*
*        Largest absolute entry over the stored band.  ROW is a row
*        index of AB here, not of the matrix.
*
         res = zero
         IF( upper ) THEN
            DO col = 1, n
               DO row = max( k+2-col, 1 ), k + 1
                  acc = abs( ab( row, col ) )
                  IF( res.LT.acc .OR. disnan( acc ) ) res = acc
               END DO
            END DO
         ELSE
            DO col = 1, n
               DO row = 1, min( n+1-col, k+1 )
                  acc = abs( ab( row, col ) )
                  IF( res.LT.acc .OR. disnan( acc ) ) res = acc
               END DO
            END DO
         END IF
      ELSE IF( ( lsame( norm, 'I' ) ) .OR. ( lsame( norm, 'O' ) ) .OR.
     $         ( norm.EQ.'1' ) ) THEN
*
*        One/infinity norm.  Every stored off-diagonal entry is added
*        both to the sum of its own column and, through WORK, to the
*        sum of the mirrored column.
*
         res = zero
         IF( upper ) THEN
*
*           WORK( COL ) is assigned at the end of step COL and only
*           entries WORK( 1:COL-1 ) are incremented before that, so
*           no initial zeroing pass is required.
*
            DO col = 1, n
               acc = zero
               offs = k + 1 - col
               DO row = max( 1, col-k ), col - 1
                  aij = abs( ab( offs+row, col ) )
                  acc = acc + aij
                  work( row ) = work( row ) + aij
               END DO
               work( col ) = acc + abs( ab( k+1, col ) )
            END DO
            DO row = 1, n
               acc = work( row )
               IF( res.LT.acc .OR. disnan( acc ) ) res = acc
            END DO
         ELSE
*
*           Lower storage: WORK( COL ) is complete once column COL is
*           reached, so the maximum is updated inside the same loop.
*
            DO row = 1, n
               work( row ) = zero
            END DO
            DO col = 1, n
               acc = work( col ) + abs( ab( 1, col ) )
               offs = 1 - col
               DO row = col + 1, min( n, col+k )
                  aij = abs( ab( offs+row, col ) )
                  acc = acc + aij
                  work( row ) = work( row ) + aij
               END DO
               IF( res.LT.acc .OR. disnan( acc ) ) res = acc
            END DO
         END IF
      ELSE IF( ( lsame( norm, 'F' ) ) .OR. ( lsame( norm, 'E' ) ) ) THEN
*
*        Frobenius norm.  The off-diagonal entries are accumulated
*        first and doubled (each occurs twice in the full matrix);
*        the diagonal, stored in row DROW of AB, is added last.
*
         scl = zero
         ssq = one
         drow = 1
         IF( k.GT.0 ) THEN
            IF( upper ) THEN
               DO col = 2, n
                  CALL dlassq( min( col-1, k ),
     $                         ab( max( k+2-col, 1 ), col ), 1, scl,
     $                         ssq )
               END DO
               drow = k + 1
            ELSE
               DO col = 1, n - 1
                  CALL dlassq( min( n-col, k ), ab( 2, col ), 1, scl,
     $                         ssq )
               END DO
            END IF
            ssq = 2*ssq
         END IF
         CALL dlassq( n, ab( drow, 1 ), ldab, scl, ssq )
         res = scl*sqrt( ssq )
      END IF
*
      dlansb = res
      RETURN
*
*     End of DLANSB
*

◆ dlansp()

double precision function dlansp	(	character	norm,
		character	uplo,
		integer	n,
		double precision, dimension( * )	ap,
		double precision, dimension( * )	work )

DLANSP returns the value of the 1-norm, or the Frobenius norm, or the infinity norm, or the element of largest absolute value of a symmetric matrix supplied in packed form.

Download DLANSP + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLANSP  returns the value of the one norm,  or the Frobenius norm, or
!> the  infinity norm,  or the  element of  largest absolute value  of a
!> real symmetric matrix A,  supplied in packed form.
!>

Returns

DLANSP

!>
!>    DLANSP = ( max(abs(A(i,j))), NORM = 'M' or 'm'
!>             (
!>             ( norm1(A),         NORM = '1', 'O' or 'o'
!>             (
!>             ( normI(A),         NORM = 'I' or 'i'
!>             (
!>             ( normF(A),         NORM = 'F', 'f', 'E' or 'e'
!>
!> where  norm1  denotes the  one norm of a matrix (maximum column sum),
!> normI  denotes the  infinity norm  of a matrix  (maximum row sum) and
!> normF  denotes the  Frobenius norm of a matrix (square root of sum of
!> squares).  Note that  max(abs(A(i,j)))  is not a consistent matrix norm.
!>

Parameters

[in]	NORM	!> NORM is CHARACTER*1 !> Specifies the value to be returned in DLANSP as described !> above. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the upper or lower triangular part of the !> symmetric matrix A is supplied. !> = 'U': Upper triangular part of A is supplied !> = 'L': Lower triangular part of A is supplied !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. When N = 0, DLANSP is !> set to zero. !>
[in]	AP	!> AP is DOUBLE PRECISION array, dimension (N(N+1)/2) !> The upper or lower triangle of the symmetric matrix A, packed !> columnwise in a linear array. The j-th column of A is stored !> in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (MAX(1,LWORK)), !> where LWORK >= N when NORM = 'I' or '1' or 'O'; otherwise, !> WORK is not referenced. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 113 of file dlansp.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLANSP: norm of a real symmetric matrix whose upper or
*     lower triangle is packed column by column in AP.
*
*     NORM (in)   selects the returned value: 'M' largest absolute
*                 entry, '1'/'O'/'I' one/infinity norm (equal by
*                 symmetry), 'F'/'E' Frobenius norm.
*     UPLO (in)   'U' when AP holds the upper triangle; any other
*                 value is handled as the lower triangle.
*     N    (in)   order of the matrix; the result is zero for N = 0.
*     AP   (in)   the packed triangle.
*     WORK (out)  scratch, entries 1..N are used, and only for the
*                 one/infinity norm.
*
*     NOTE: when NORM matches none of the letters above, no branch
*     assigns VALUE and the returned result is undefined.
*
*     .. Scalar Arguments ..
      CHARACTER          NORM, UPLO
      INTEGER            N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   AP( * ), WORK( * )
*     ..
*
* =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, ZERO
      parameter( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            I, J, K
      DOUBLE PRECISION   ABSA, SCALE, SUM, VALUE
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlassq
*     ..
*     .. External Functions ..
      LOGICAL            LSAME, DISNAN
      EXTERNAL           lsame, disnan
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, sqrt
*     ..
*     .. Executable Statements ..
*
*     UPLO never changes during the call, so it is decoded once here
*     instead of calling LSAME again in every branch and, for the
*     Frobenius norm, in every iteration of the diagonal loop.
*
      upper = lsame( uplo, 'U' )
*
      IF( n.EQ.0 ) THEN
         VALUE = zero
      ELSE IF( lsame( norm, 'M' ) ) THEN
*
*        Find max(abs(A(i,j))).
*
*        K is the position in AP of the first stored entry of
*        column J.  The DISNAN test makes a NaN entry replace the
*        running maximum.
*
         VALUE = zero
         IF( upper ) THEN
            k = 1
            DO 20 j = 1, n
               DO 10 i = k, k + j - 1
                  sum = abs( ap( i ) )
                  IF( VALUE .LT. sum .OR. disnan( sum ) ) VALUE = sum
   10          CONTINUE
               k = k + j
   20       CONTINUE
         ELSE
            k = 1
            DO 40 j = 1, n
               DO 30 i = k, k + n - j
                  sum = abs( ap( i ) )
                  IF( VALUE .LT. sum .OR. disnan( sum ) ) VALUE = sum
   30          CONTINUE
               k = k + n - j + 1
   40       CONTINUE
         END IF
      ELSE IF( ( lsame( norm, 'I' ) ) .OR. ( lsame( norm, 'O' ) ) .OR.
     $         ( norm.EQ.'1' ) ) THEN
*
*        Find normI(A) ( = norm1(A), since A is symmetric).
*
*        K runs through AP entry by entry.  Every off-diagonal entry
*        is added to the sum of its own column and, through WORK, to
*        the sum of the mirrored column.
*
         VALUE = zero
         k = 1
         IF( upper ) THEN
*
*           WORK( J ) is assigned at the end of step J and only
*           WORK( 1:J-1 ) is incremented before that, so no initial
*           zeroing pass is required.
*
            DO 60 j = 1, n
               sum = zero
               DO 50 i = 1, j - 1
                  absa = abs( ap( k ) )
                  sum = sum + absa
                  work( i ) = work( i ) + absa
                  k = k + 1
   50          CONTINUE
               work( j ) = sum + abs( ap( k ) )
               k = k + 1
   60       CONTINUE
            DO 70 i = 1, n
               sum = work( i )
               IF( VALUE .LT. sum .OR. disnan( sum ) ) VALUE = sum
   70       CONTINUE
         ELSE
*
*           Lower storage: WORK( J ) is complete once column J is
*           reached, so the maximum is updated inside the same loop.
*
            DO 80 i = 1, n
               work( i ) = zero
   80       CONTINUE
            DO 100 j = 1, n
               sum = work( j ) + abs( ap( k ) )
               k = k + 1
               DO 90 i = j + 1, n
                  absa = abs( ap( k ) )
                  sum = sum + absa
                  work( i ) = work( i ) + absa
                  k = k + 1
   90          CONTINUE
               IF( VALUE .LT. sum .OR. disnan( sum ) ) VALUE = sum
  100       CONTINUE
         END IF
      ELSE IF( ( lsame( norm, 'F' ) ) .OR. ( lsame( norm, 'E' ) ) ) THEN
*
*        Find normF(A).
*
*        Off-diagonal part first: K points at the first off-diagonal
*        entry of the column handed to DLASSQ.
*
         scale = zero
         sum = one
         k = 2
         IF( upper ) THEN
            DO 110 j = 2, n
               CALL dlassq( j-1, ap( k ), 1, scale, sum )
               k = k + j
  110       CONTINUE
         ELSE
            DO 120 j = 1, n - 1
               CALL dlassq( n-j, ap( k ), 1, scale, sum )
               k = k + n - j + 1
  120       CONTINUE
         END IF
*
*        Each off-diagonal entry occurs twice in the full matrix.
*
         sum = 2*sum
*
*        Diagonal part: K steps from one diagonal entry to the next.
*        The step is not constant in packed storage, so the scaled
*        update is written out; it keeps SCALE**2*SUM equal to the
*        running sum of squares with SCALE the largest magnitude met.
*
         k = 1
         DO 130 i = 1, n
            IF( ap( k ).NE.zero ) THEN
               absa = abs( ap( k ) )
               IF( scale.LT.absa ) THEN
                  sum = one + sum*( scale / absa )**2
                  scale = absa
               ELSE
                  sum = sum + ( absa / scale )**2
               END IF
            END IF
            IF( upper ) THEN
               k = k + i + 1
            ELSE
               k = k + n - i + 1
            END IF
  130    CONTINUE
         VALUE = scale*sqrt( sum )
      END IF
*
      dlansp = VALUE
      RETURN
*
*     End of DLANSP
*

◆ dlantb()

double precision function dlantb	(	character	norm,
		character	uplo,
		character	diag,
		integer	n,
		integer	k,
		double precision, dimension( ldab, * )	ab,
		integer	ldab,
		double precision, dimension( * )	work )

DLANTB returns the value of the 1-norm, or the Frobenius norm, or the infinity norm, or the element of largest absolute value of a triangular band matrix.

Download DLANTB + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLANTB  returns the value of the one norm,  or the Frobenius norm, or
!> the  infinity norm,  or the element of  largest absolute value  of an
!> n by n triangular band matrix A,  with ( k + 1 ) diagonals.
!>

Returns

DLANTB

!>
!>    DLANTB = ( max(abs(A(i,j))), NORM = 'M' or 'm'
!>             (
!>             ( norm1(A),         NORM = '1', 'O' or 'o'
!>             (
!>             ( normI(A),         NORM = 'I' or 'i'
!>             (
!>             ( normF(A),         NORM = 'F', 'f', 'E' or 'e'
!>
!> where  norm1  denotes the  one norm of a matrix (maximum column sum),
!> normI  denotes the  infinity norm  of a matrix  (maximum row sum) and
!> normF  denotes the  Frobenius norm of a matrix (square root of sum of
!> squares).  Note that  max(abs(A(i,j)))  is not a consistent matrix norm.
!>

Parameters

[in]	NORM	!> NORM is CHARACTER*1 !> Specifies the value to be returned in DLANTB as described !> above. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the matrix A is upper or lower triangular. !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> Specifies whether or not the matrix A is unit triangular. !> = 'N': Non-unit triangular !> = 'U': Unit triangular !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. When N = 0, DLANTB is !> set to zero. !>
[in]	K	!> K is INTEGER !> The number of super-diagonals of the matrix A if UPLO = 'U', !> or the number of sub-diagonals of the matrix A if UPLO = 'L'. !> K >= 0. !>
[in]	AB	!> AB is DOUBLE PRECISION array, dimension (LDAB,N) !> The upper or lower triangular band matrix A, stored in the !> first k+1 rows of AB. The j-th column of A is stored !> in the j-th column of the array AB as follows: !> if UPLO = 'U', AB(k+1+i-j,j) = A(i,j) for max(1,j-k)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+k). !> Note that when DIAG = 'U', the elements of the array AB !> corresponding to the diagonal elements of the matrix A are !> not referenced, but are assumed to be one. !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= K+1. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (MAX(1,LWORK)), !> where LWORK >= N when NORM = 'I'; otherwise, WORK is not !> referenced. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 138 of file dlantb.f.

*
*  -- LAPACK auxiliary routine --
*
*  Body of DLANTB: norm of an n-by-n triangular band matrix with
*  k+1 diagonals held in the band array AB.
*    NORM = 'M'       largest absolute value of any element
*    NORM = 'O','1'   one norm (largest column sum)
*    NORM = 'I'       infinity norm (largest row sum; uses WORK(1:n))
*    NORM = 'F','E'   Frobenius norm, accumulated through DLASSQ
*  With DIAG = 'U' the stored diagonal is skipped and every diagonal
*  entry counts as one.  Any UPLO other than 'U' selects the lower
*  triangle.  For any other NORM no result is assigned.
*
*     .. Scalar Arguments ..
      CHARACTER          diag, norm, uplo
      INTEGER            k, ldab, n
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   ab( ldab, * ), work( * )
*     ..
*
* =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   one, zero
      PARAMETER          ( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
*     nd    = 1 when the diagonal is implicit (unit), 0 otherwise
*     dinit = contribution of an implicit diagonal entry (one or zero)
      LOGICAL            udiag, upper
      INTEGER            i, j, l, nd
      DOUBLE PRECISION   acc, anorm, dinit, scl, ssq
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlassq
*     ..
*     .. External Functions ..
      LOGICAL            lsame, disnan
      EXTERNAL           lsame, disnan
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     An empty matrix has norm zero whatever NORM asks for.
*
      IF( n.EQ.0 ) THEN
         dlantb = zero
         RETURN
      END IF
*
*     Decode the triangle and diagonal options once.
*
      upper = lsame( uplo, 'U' )
      udiag = lsame( diag, 'U' )
      IF( udiag ) THEN
         nd = 1
         dinit = one
      ELSE
         nd = 0
         dinit = zero
      END IF
*
      IF( lsame( norm, 'M' ) ) THEN
*
*        max(abs(A(i,j))): start from the implicit diagonal value and
*        scan the stored band rows of every column.
*
         anorm = dinit
         IF( upper ) THEN
            DO j = 1, n
               DO i = max( k+2-j, 1 ), k + 1 - nd
                  acc = abs( ab( i, j ) )
                  IF( anorm.LT.acc .OR. disnan( acc ) ) anorm = acc
               END DO
            END DO
         ELSE
            DO j = 1, n
               DO i = 1 + nd, min( n+1-j, k+1 )
                  acc = abs( ab( i, j ) )
                  IF( anorm.LT.acc .OR. disnan( acc ) ) anorm = acc
               END DO
            END DO
         END IF
*
      ELSE IF( lsame( norm, 'O' ) .OR. norm.EQ.'1' ) THEN
*
*        norm1(A): largest column sum of absolute values.
*
         anorm = zero
         DO j = 1, n
            acc = dinit
            IF( upper ) THEN
               DO i = max( k+2-j, 1 ), k + 1 - nd
                  acc = acc + abs( ab( i, j ) )
               END DO
            ELSE
               DO i = 1 + nd, min( n+1-j, k+1 )
                  acc = acc + abs( ab( i, j ) )
               END DO
            END IF
            IF( anorm.LT.acc .OR. disnan( acc ) ) anorm = acc
         END DO
*
      ELSE IF( lsame( norm, 'I' ) ) THEN
*
*        normI(A): row sums are gathered in WORK, then maximised.
*        l maps the matrix row index i to the band row l+i.
*
         DO i = 1, n
            work( i ) = dinit
         END DO
         IF( upper ) THEN
            DO j = 1, n
               l = k + 1 - j
               DO i = max( 1, j-k ), j - nd
                  work( i ) = work( i ) + abs( ab( l+i, j ) )
               END DO
            END DO
         ELSE
            DO j = 1, n
               l = 1 - j
               DO i = j + nd, min( n, j+k )
                  work( i ) = work( i ) + abs( ab( l+i, j ) )
               END DO
            END DO
         END IF
         anorm = zero
         DO i = 1, n
            acc = work( i )
            IF( anorm.LT.acc .OR. disnan( acc ) ) anorm = acc
         END DO
*
      ELSE IF( lsame( norm, 'F' ) .OR. lsame( norm, 'E' ) ) THEN
*
*        normF(A): DLASSQ updates the pair (scl, ssq) column by
*        column.  A unit diagonal is pre-loaded as scl = 1, ssq = n,
*        and in that case a matrix with k = 0 has nothing to add.
*
         IF( udiag ) THEN
            scl = one
            ssq = n
         ELSE
            scl = zero
            ssq = one
         END IF
         IF( k.GT.0 .OR. .NOT.udiag ) THEN
            IF( upper ) THEN
               DO j = 1 + nd, n
                  CALL dlassq( min( j-nd, k+1-nd ),
     $                         ab( max( k+2-j, 1 ), j ), 1, scl, ssq )
               END DO
            ELSE
               DO j = 1, n - nd
                  CALL dlassq( min( n-j+1-nd, k+1-nd ), ab( 1+nd, j ),
     $                         1, scl, ssq )
               END DO
            END IF
         END IF
         anorm = scl*sqrt( ssq )
      END IF
*
      dlantb = anorm
      RETURN
*
*     End of DLANTB
*

◆ dlantp()

double precision function dlantp	(	character	norm,
		character	uplo,
		character	diag,
		integer	n,
		double precision, dimension( * )	ap,
		double precision, dimension( * )	work )

DLANTP returns the value of the 1-norm, or the Frobenius norm, or the infinity norm, or the element of largest absolute value of a triangular matrix supplied in packed form.

Download DLANTP + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLANTP  returns the value of the one norm,  or the Frobenius norm, or
!> the  infinity norm,  or the  element of  largest absolute value  of a
!> triangular matrix A, supplied in packed form.
!>

Returns

DLANTP

!>
!>    DLANTP = ( max(abs(A(i,j))), NORM = 'M' or 'm'
!>             (
!>             ( norm1(A),         NORM = '1', 'O' or 'o'
!>             (
!>             ( normI(A),         NORM = 'I' or 'i'
!>             (
!>             ( normF(A),         NORM = 'F', 'f', 'E' or 'e'
!>
!> where  norm1  denotes the  one norm of a matrix (maximum column sum),
!> normI  denotes the  infinity norm  of a matrix  (maximum row sum) and
!> normF  denotes the  Frobenius norm of a matrix (square root of sum of
!> squares).  Note that  max(abs(A(i,j)))  is not a consistent matrix norm.
!>

Parameters

[in]	NORM	!> NORM is CHARACTER*1 !> Specifies the value to be returned in DLANTP as described !> above. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the matrix A is upper or lower triangular. !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> Specifies whether or not the matrix A is unit triangular. !> = 'N': Non-unit triangular !> = 'U': Unit triangular !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. When N = 0, DLANTP is !> set to zero. !>
[in]	AP	!> AP is DOUBLE PRECISION array, dimension (N(N+1)/2) !> The upper or lower triangular matrix A, packed columnwise in !> a linear array. The j-th column of A is stored in the array !> AP as follows: !> if UPLO = 'U', AP(i + (j-1)j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !> Note that when DIAG = 'U', the elements of the array AP !> corresponding to the diagonal elements of the matrix A are !> not referenced, but are assumed to be one. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (MAX(1,LWORK)), !> where LWORK >= N when NORM = 'I'; otherwise, WORK is not !> referenced. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 123 of file dlantp.f.

*
*  -- LAPACK auxiliary routine --
*
*  Body of DLANTP: norm of an n-by-n triangular matrix whose columns
*  are packed one after another in the linear array AP.
*    NORM = 'M'       largest absolute value of any element
*    NORM = 'O','1'   one norm (largest column sum)
*    NORM = 'I'       infinity norm (largest row sum; uses WORK(1:n))
*    NORM = 'F','E'   Frobenius norm, accumulated through DLASSQ
*  With DIAG = 'U' the stored diagonal is skipped and every diagonal
*  entry counts as one.  Any UPLO other than 'U' selects the lower
*  triangle.  For any other NORM no result is assigned.
*
*     .. Scalar Arguments ..
      CHARACTER          diag, norm, uplo
      INTEGER            n
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   ap( * ), work( * )
*     ..
*
* =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   one, zero
      PARAMETER          ( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
*     k     = position in AP of the first stored entry of a column
*     nd    = 1 when the diagonal is implicit (unit), 0 otherwise
*     dinit = contribution of an implicit diagonal entry (one or zero)
      LOGICAL            udiag, upper
      INTEGER            i, ihi, ilo, j, k, nd
      DOUBLE PRECISION   acc, anorm, dinit, scl, ssq
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlassq
*     ..
*     .. External Functions ..
      LOGICAL            lsame, disnan
      EXTERNAL           lsame, disnan
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, sqrt
*     ..
*     .. Executable Statements ..
*
*     An empty matrix has norm zero whatever NORM asks for.
*
      IF( n.EQ.0 ) THEN
         dlantp = zero
         RETURN
      END IF
*
*     Decode the triangle and diagonal options once.
*
      upper = lsame( uplo, 'U' )
      udiag = lsame( diag, 'U' )
      IF( udiag ) THEN
         nd = 1
         dinit = one
      ELSE
         nd = 0
         dinit = zero
      END IF
*
      IF( lsame( norm, 'M' ) ) THEN
*
*        max(abs(A(i,j))): for each column work out the slice
*        ap(ilo:ihi) that holds its referenced entries, then move k
*        on to the next column.
*
         anorm = dinit
         k = 1
         DO j = 1, n
            IF( upper ) THEN
               ilo = k
               ihi = k + j - 1 - nd
               k = k + j
            ELSE
               ilo = k + nd
               ihi = k + n - j
               k = k + n - j + 1
            END IF
            DO i = ilo, ihi
               acc = abs( ap( i ) )
               IF( anorm.LT.acc .OR. disnan( acc ) ) anorm = acc
            END DO
         END DO
*
      ELSE IF( lsame( norm, 'O' ) .OR. norm.EQ.'1' ) THEN
*
*        norm1(A): largest column sum of absolute values.
*
         anorm = zero
         k = 1
         DO j = 1, n
            IF( upper ) THEN
               ilo = k
               ihi = k + j - 1 - nd
               k = k + j
            ELSE
               ilo = k + nd
               ihi = k + n - j
               k = k + n - j + 1
            END IF
            acc = dinit
            DO i = ilo, ihi
               acc = acc + abs( ap( i ) )
            END DO
            IF( anorm.LT.acc .OR. disnan( acc ) ) anorm = acc
         END DO
*
      ELSE IF( lsame( norm, 'I' ) ) THEN
*
*        normI(A): row sums are gathered in WORK while k walks
*        through AP; an implicit diagonal slot is stepped over.
*
         DO i = 1, n
            work( i ) = dinit
         END DO
         k = 1
         IF( upper ) THEN
            DO j = 1, n
               DO i = 1, j - nd
                  work( i ) = work( i ) + abs( ap( k ) )
                  k = k + 1
               END DO
               k = k + nd
            END DO
         ELSE
            DO j = 1, n
               k = k + nd
               DO i = j + nd, n
                  work( i ) = work( i ) + abs( ap( k ) )
                  k = k + 1
               END DO
            END DO
         END IF
         anorm = zero
         DO i = 1, n
            acc = work( i )
            IF( anorm.LT.acc .OR. disnan( acc ) ) anorm = acc
         END DO
*
      ELSE IF( lsame( norm, 'F' ) .OR. lsame( norm, 'E' ) ) THEN
*
*        normF(A): DLASSQ updates the pair (scl, ssq) column by
*        column.  A unit diagonal is pre-loaded as scl = 1, ssq = n.
*
         IF( udiag ) THEN
            scl = one
            ssq = n
         ELSE
            scl = zero
            ssq = one
         END IF
         k = 1 + nd
         IF( upper ) THEN
            DO j = 1 + nd, n
               CALL dlassq( j-nd, ap( k ), 1, scl, ssq )
               k = k + j
            END DO
         ELSE
            DO j = 1, n - nd
               CALL dlassq( n-j+1-nd, ap( k ), 1, scl, ssq )
               k = k + n - j + 1
            END DO
         END IF
         anorm = scl*sqrt( ssq )
      END IF
*
      dlantp = anorm
      RETURN
*
*     End of DLANTP
*

◆ dlantr()

double precision function dlantr	(	character	norm,
		character	uplo,
		character	diag,
		integer	m,
		integer	n,
		double precision, dimension( lda, * )	a,
		integer	lda,
		double precision, dimension( * )	work )

DLANTR returns the value of the 1-norm, or the Frobenius norm, or the infinity norm, or the element of largest absolute value of a trapezoidal or triangular matrix.

Download DLANTR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLANTR  returns the value of the one norm,  or the Frobenius norm, or
!> the  infinity norm,  or the  element of  largest absolute value  of a
!> trapezoidal or triangular matrix A.
!>

Returns

DLANTR

!>
!>    DLANTR = ( max(abs(A(i,j))), NORM = 'M' or 'm'
!>             (
!>             ( norm1(A),         NORM = '1', 'O' or 'o'
!>             (
!>             ( normI(A),         NORM = 'I' or 'i'
!>             (
!>             ( normF(A),         NORM = 'F', 'f', 'E' or 'e'
!>
!> where  norm1  denotes the  one norm of a matrix (maximum column sum),
!> normI  denotes the  infinity norm  of a matrix  (maximum row sum) and
!> normF  denotes the  Frobenius norm of a matrix (square root of sum of
!> squares).  Note that  max(abs(A(i,j)))  is not a consistent matrix norm.
!>

Parameters

[in]	NORM	!> NORM is CHARACTER*1 !> Specifies the value to be returned in DLANTR as described !> above. !>
[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the matrix A is upper or lower trapezoidal. !> = 'U': Upper trapezoidal !> = 'L': Lower trapezoidal !> Note that A is triangular instead of trapezoidal if M = N. !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> Specifies whether or not the matrix A has unit diagonal. !> = 'N': Non-unit diagonal !> = 'U': Unit diagonal !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0, and if !> UPLO = 'U', M <= N. When M = 0, DLANTR is set to zero. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0, and if !> UPLO = 'L', N <= M. When N = 0, DLANTR is set to zero. !>
[in]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> The trapezoidal matrix A (A is triangular if M = N). !> If UPLO = 'U', the leading m by n upper trapezoidal part of !> the array A contains the upper trapezoidal matrix, and the !> strictly lower triangular part of A is not referenced. !> If UPLO = 'L', the leading m by n lower trapezoidal part of !> the array A contains the lower trapezoidal matrix, and the !> strictly upper triangular part of A is not referenced. Note !> that when DIAG = 'U', the diagonal elements of A are not !> referenced and are assumed to be one. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(M,1). !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (MAX(1,LWORK)), !> where LWORK >= M when NORM = 'I'; otherwise, WORK is not !> referenced. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 139 of file dlantr.f.

*
*  -- LAPACK auxiliary routine --
*
*  Body of DLANTR: norm of an m-by-n trapezoidal (triangular when
*  m = n) matrix stored in the two-dimensional array A.
*    NORM = 'M'       largest absolute value of any element
*    NORM = 'O','1'   one norm (largest column sum)
*    NORM = 'I'       infinity norm (largest row sum; uses WORK(1:m))
*    NORM = 'F','E'   Frobenius norm, accumulated through DLASSQ
*  With DIAG = 'U' the stored diagonal is skipped and every diagonal
*  entry counts as one.  Any UPLO other than 'U' selects the lower
*  trapezoid.  For any other NORM no result is assigned.
*
*     .. Scalar Arguments ..
      CHARACTER          diag, norm, uplo
      INTEGER            lda, m, n
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   a( lda, * ), work( * )
*     ..
*
* =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   one, zero
      PARAMETER          ( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
*     nd    = 1 when the diagonal is implicit (unit), 0 otherwise
*     dinit = contribution of an implicit diagonal entry (one or zero)
      LOGICAL            udiag, upper
      INTEGER            i, ihi, ilo, j, nd
      DOUBLE PRECISION   acc, anorm, dinit, scl, ssq
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlassq
*     ..
*     .. External Functions ..
      LOGICAL            lsame, disnan
      EXTERNAL           lsame, disnan
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     A matrix with no rows or no columns has norm zero.
*
      IF( min( m, n ).EQ.0 ) THEN
         dlantr = zero
         RETURN
      END IF
*
*     Decode the triangle and diagonal options once.
*
      upper = lsame( uplo, 'U' )
      udiag = lsame( diag, 'U' )
      IF( udiag ) THEN
         nd = 1
         dinit = one
      ELSE
         nd = 0
         dinit = zero
      END IF
*
      IF( lsame( norm, 'M' ) ) THEN
*
*        max(abs(A(i,j))): rows ilo..ihi are the referenced part of
*        column j.
*
         anorm = dinit
         DO j = 1, n
            IF( upper ) THEN
               ilo = 1
               ihi = min( m, j-nd )
            ELSE
               ilo = j + nd
               ihi = m
            END IF
            DO i = ilo, ihi
               acc = abs( a( i, j ) )
               IF( anorm.LT.acc .OR. disnan( acc ) ) anorm = acc
            END DO
         END DO
*
      ELSE IF( lsame( norm, 'O' ) .OR. norm.EQ.'1' ) THEN
*
*        norm1(A): largest column sum.  In the upper case a column
*        beyond row m has no diagonal entry, so the implicit one is
*        only added while j <= m.
*
         anorm = zero
         DO j = 1, n
            IF( upper ) THEN
               ilo = 1
               IF( udiag .AND. j.LE.m ) THEN
                  acc = one
                  ihi = j - 1
               ELSE
                  acc = zero
                  ihi = min( m, j )
               END IF
            ELSE
               acc = dinit
               ilo = j + nd
               ihi = m
            END IF
            DO i = ilo, ihi
               acc = acc + abs( a( i, j ) )
            END DO
            IF( anorm.LT.acc .OR. disnan( acc ) ) anorm = acc
         END DO
*
      ELSE IF( lsame( norm, 'I' ) ) THEN
*
*        normI(A): row sums are gathered in WORK, then maximised.
*
         IF( upper ) THEN
            DO i = 1, m
               work( i ) = dinit
            END DO
            DO j = 1, n
               DO i = 1, min( m, j-nd )
                  work( i ) = work( i ) + abs( a( i, j ) )
               END DO
            END DO
         ELSE
            IF( udiag ) THEN
*
*              Only the first min(m,n) rows carry a diagonal entry.
*
               DO i = 1, min( m, n )
                  work( i ) = one
               END DO
               DO i = n + 1, m
                  work( i ) = zero
               END DO
            ELSE
               DO i = 1, m
                  work( i ) = zero
               END DO
            END IF
            DO j = 1, n
               DO i = j + nd, m
                  work( i ) = work( i ) + abs( a( i, j ) )
               END DO
            END DO
         END IF
         anorm = zero
         DO i = 1, m
            acc = work( i )
            IF( anorm.LT.acc .OR. disnan( acc ) ) anorm = acc
         END DO
*
      ELSE IF( lsame( norm, 'F' ) .OR. lsame( norm, 'E' ) ) THEN
*
*        normF(A): DLASSQ updates the pair (scl, ssq) column by
*        column.  A unit diagonal is pre-loaded as scl = 1,
*        ssq = min(m,n).
*
         IF( udiag ) THEN
            scl = one
            ssq = min( m, n )
         ELSE
            scl = zero
            ssq = one
         END IF
         IF( upper ) THEN
            DO j = 1 + nd, n
               CALL dlassq( min( m, j-nd ), a( 1, j ), 1, scl, ssq )
            END DO
         ELSE IF( udiag ) THEN
*
*           min( m, j+1 ) keeps the start row inside the column when
*           j = m and the count m-j is zero.
*
            DO j = 1, n
               CALL dlassq( m-j, a( min( m, j+1 ), j ), 1, scl, ssq )
            END DO
         ELSE
            DO j = 1, n
               CALL dlassq( m-j+1, a( j, j ), 1, scl, ssq )
            END DO
         END IF
         anorm = scl*sqrt( ssq )
      END IF
*
      dlantr = anorm
      RETURN
*
*     End of DLANTR
*

◆ dlanv2()

subroutine dlanv2	(	double precision	a,
		double precision	b,
		double precision	c,
		double precision	d,
		double precision	rt1r,
		double precision	rt1i,
		double precision	rt2r,
		double precision	rt2i,
		double precision	cs,
		double precision	sn )

DLANV2 computes the Schur factorization of a real 2-by-2 nonsymmetric matrix in standard form.

Download DLANV2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLANV2 computes the Schur factorization of a real 2-by-2 nonsymmetric
!> matrix in standard form:
!>
!>      [ A  B ] = [ CS -SN ] [ AA  BB ] [ CS  SN ]
!>      [ C  D ]   [ SN  CS ] [ CC  DD ] [-SN  CS ]
!>
!> where either
!> 1) CC = 0 so that AA and DD are real eigenvalues of the matrix, or
!> 2) AA = DD and BB*CC < 0, so that AA + or - sqrt(BB*CC) are complex
!> conjugate eigenvalues.
!>

Parameters

[in,out]	A	!> A is DOUBLE PRECISION !>
[in,out]	B	!> B is DOUBLE PRECISION !>
[in,out]	C	!> C is DOUBLE PRECISION !>
[in,out]	D	!> D is DOUBLE PRECISION !> On entry, A, B, C and D are the elements of the input matrix. !> On exit, they are overwritten by the elements of the !> standardised Schur form. !>
[out]	RT1R	!> RT1R is DOUBLE PRECISION !>
[out]	RT1I	!> RT1I is DOUBLE PRECISION !>
[out]	RT2R	!> RT2R is DOUBLE PRECISION !>
[out]	RT2I	!> RT2I is DOUBLE PRECISION !> The real and imaginary parts of the eigenvalues. If the !> eigenvalues are a complex conjugate pair, RT1I > 0. !>
[out]	CS	!> CS is DOUBLE PRECISION !>
[out]	SN	!> SN is DOUBLE PRECISION !> CS and SN are the parameters of the rotation matrix. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  Modified by V. Sima, Research Institute for Informatics, Bucharest,
!>  Romania, to reduce the risk of cancellation errors,
!>  when computing real eigenvalues, and to ensure, if possible, that
!>  abs(RT1R) >= abs(RT2R).
!>

Definition at line 126 of file dlanv2.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLANV2.  A plane rotation (CS,SN) is chosen and applied
*     as a similarity transformation to the 2-by-2 matrix
*     [ A B ; C D ], which is overwritten.  On exit either C = 0
*     (two real eigenvalues A and D) or A = D with B and C nonzero
*     and of opposite sign (complex conjugate pair).  The eigenvalues
*     are returned in (RT1R,RT1I) and (RT2R,RT2I).
*
*     .. Scalar Arguments ..
      DOUBLE PRECISION   A, B, C, CS, D, RT1I, RT1R, RT2I, RT2R, SN
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, HALF, ONE, TWO
      parameter( zero = 0.0d+0, half = 0.5d+0, one = 1.0d+0,
     $                     two = 2.0d0 )
*     MULTPL*EPS is the threshold on the scaled discriminant Z below
*     which the real/complex decision is postponed.
      DOUBLE PRECISION   MULTPL
      parameter( multpl = 4.0d+0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   AA, BB, BCMAX, BCMIS, CC, CS1, DD, EPS, P, SAB,
     $                   SAC, SCALE, SIGMA, SN1, TAU, TEMP, Z, SAFMIN, 
     $                   SAFMN2, SAFMX2
      INTEGER            COUNT
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH, DLAPY2
      EXTERNAL           dlamch, dlapy2
*     ..
*     .. Intrinsic Functions ..
*     NOTE(review): INT and LOG are used below but are not listed here;
*     they are still resolved as intrinsics by the compiler.
      INTRINSIC          abs, max, min, sign, sqrt
*     ..
*     .. Executable Statements ..
*
*     SAFMN2 is an integer power of the machine base, roughly
*     sqrt( SAFMIN / EPS ); SAFMX2 is its reciprocal.  Both are used
*     only to rescale SIGMA and TEMP in the complex/nearly-equal
*     branch below.
*
      safmin = dlamch( 'S' )
      eps = dlamch( 'P' )
      safmn2 = dlamch( 'B' )**int( log( safmin / eps ) /
     $            log( dlamch( 'B' ) ) / two )
      safmx2 = one / safmn2
      IF( c.EQ.zero ) THEN
*
*        Already upper triangular: identity rotation.
*
         cs = one
         sn = zero
*
      ELSE IF( b.EQ.zero ) THEN
*
*        Swap rows and columns
*
         cs = zero
         sn = one
         temp = d
         d = a
         a = temp
         b = -c
         c = zero
*
      ELSE IF( ( a-d ).EQ.zero .AND. sign( one, b ).NE.sign( one, c ) )
     $          THEN
*
*        Equal diagonal with B and C of opposite sign: the matrix is
*        left unchanged (identity rotation).
*
         cs = one
         sn = zero
*
      ELSE
*
*        General case.  With P = (A-D)/2, Z is ( P*P + B*C ) / SCALE,
*        formed from scaled factors rather than from the raw products
*        ( BCMAX*BCMIS equals B*C, sign included ).
*
         temp = a - d
         p = half*temp
         bcmax = max( abs( b ), abs( c ) )
         bcmis = min( abs( b ), abs( c ) )*sign( one, b )*sign( one, c )
         scale = max( abs( p ), bcmax )
         z = ( p / scale )*p + ( bcmax / scale )*bcmis
*
*        If Z is of the order of the machine accuracy, postpone the
*        decision on the nature of eigenvalues
*
         IF( z.GE.multpl*eps ) THEN
*
*           Real eigenvalues. Compute A and D.
*
*           Z becomes P + sign(P)*sqrt( P*P + B*C ); the sign choice
*           adds quantities of like sign.  D is then updated through
*           the quotient B*C / Z.
*
            z = p + sign( sqrt( scale )*sqrt( z ), p )
            a = d + z
            d = d - ( bcmax / z )*bcmis
*
*           Compute B and the rotation matrix
*
            tau = dlapy2( c, z )
            cs = z / tau
            sn = c / tau
            b = b - c
            c = zero
*
         ELSE
*
*           Complex eigenvalues, or real (almost) equal eigenvalues.
*           Make diagonal elements equal.
*
*           SIGMA and TEMP are rescaled together by SAFMN2 / SAFMX2
*           while max( |TEMP|, |SIGMA| ) lies outside
*           ( SAFMN2, SAFMX2 ).  COUNT stops the retries once it
*           exceeds 20, so the loop cannot run forever.
*
            count = 0
            sigma = b + c
   10       CONTINUE
            count = count + 1
            scale = max( abs(temp), abs(sigma) )
            IF( scale.GE.safmx2 ) THEN
               sigma = sigma * safmn2
               temp = temp * safmn2
               IF (count .LE. 20)
     $            GOTO 10
            END IF
            IF( scale.LE.safmn2 ) THEN
               sigma = sigma * safmx2
               temp = temp * safmx2
               IF (count .LE. 20)
     $            GOTO 10
            END IF
            p = half*temp
            tau = dlapy2( sigma, temp )
            cs = sqrt( half*( one+abs( sigma ) / tau ) )
            sn = -( p / ( tau*cs ) )*sign( one, sigma )
*
*           Compute [ AA  BB ] = [ A  B ] [ CS -SN ]
*                   [ CC  DD ]   [ C  D ] [ SN  CS ]
*
            aa = a*cs + b*sn
            bb = -a*sn + b*cs
            cc = c*cs + d*sn
            dd = -c*sn + d*cs
*
*           Compute [ A  B ] = [ CS  SN ] [ AA  BB ]
*                   [ C  D ]   [-SN  CS ] [ CC  DD ]
*
            a = aa*cs + cc*sn
            b = bb*cs + dd*sn
            c = -aa*sn + cc*cs
            d = -bb*sn + dd*cs
*
*           Force the two diagonal entries to their common mean.
*
            temp = half*( a+d )
            a = temp
            d = temp
*
            IF( c.NE.zero ) THEN
               IF( b.NE.zero ) THEN
                  IF( sign( one, b ).EQ.sign( one, c ) ) THEN
*
*                    Real eigenvalues: reduce to upper triangular form
*
*                    P = sign(C)*sqrt( |B|*|C| ) is formed as a product
*                    of square roots.  (CS1,SN1) is a second rotation,
*                    composed with (CS,SN) in the last three
*                    statements of this branch.
*
                     sab = sqrt( abs( b ) )
                     sac = sqrt( abs( c ) )
                     p = sign( sab*sac, c )
                     tau = one / sqrt( abs( b+c ) )
                     a = temp + p
                     d = temp - p
                     b = b - c
                     c = zero
                     cs1 = sab*tau
                     sn1 = sac*tau
                     temp = cs*cs1 - sn*sn1
                     sn = cs*sn1 + sn*cs1
                     cs = temp
                  END IF
               ELSE
*
*                 B = 0 with C nonzero: swap rows and columns, which
*                 turns (CS,SN) into (-SN,CS).
*
                  b = -c
                  c = zero
                  temp = cs
                  cs = -sn
                  sn = temp
               END IF
            END IF
         END IF
*
      END IF
*
*     Store eigenvalues in (RT1R,RT1I) and (RT2R,RT2I).
*
*     When C is nonzero the imaginary part is sqrt( |B| )*sqrt( |C| ),
*     taken positive for the first eigenvalue and negative for the
*     second.
*
      rt1r = a
      rt2r = d
      IF( c.EQ.zero ) THEN
         rt1i = zero
         rt2i = zero
      ELSE
         rt1i = sqrt( abs( b ) )*sqrt( abs( c ) )
         rt2i = -rt1i
      END IF
      RETURN
*
*     End of DLANV2
*

◆ dlapll()

subroutine dlapll	(	integer	n,
		double precision, dimension( * )	x,
		integer	incx,
		double precision, dimension( * )	y,
		integer	incy,
		double precision	ssmin )

DLAPLL measures the linear dependence of two vectors.

Download DLAPLL + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> Given two column vectors X and Y, let
!>
!>                      A = ( X Y ).
!>
!> The subroutine first computes the QR factorization of A = Q*R,
!> and then computes the SVD of the 2-by-2 upper triangular matrix R.
!> The smaller singular value of R is returned in SSMIN, which is used
!> as the measurement of the linear dependency of the vectors X and Y.
!>

Parameters

[in]	N	!> N is INTEGER !> The length of the vectors X and Y. !>
[in,out]	X	!> X is DOUBLE PRECISION array, !> dimension (1+(N-1)*INCX) !> On entry, X contains the N-vector X. !> On exit, X is overwritten. !>
[in]	INCX	!> INCX is INTEGER !> The increment between successive elements of X. INCX > 0. !>
[in,out]	Y	!> Y is DOUBLE PRECISION array, !> dimension (1+(N-1)*INCY) !> On entry, Y contains the N-vector Y. !> On exit, Y is overwritten. !>
[in]	INCY	!> INCY is INTEGER !> The increment between successive elements of Y. INCY > 0. !>
[out]	SSMIN	!> SSMIN is DOUBLE PRECISION !> The smallest singular value of the N-by-2 matrix A = ( X Y ). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 101 of file dlapll.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLAPLL.  X and Y are reduced in place to the 2-by-2
*     upper triangular factor of ( X Y ); DLAS2 then supplies its
*     singular values, the smaller of which is returned in SSMIN.
*     Both X and Y are overwritten.
*
*     .. Scalar Arguments ..
      INTEGER            INCX, INCY, N
      DOUBLE PRECISION   SSMIN
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   X( * ), Y( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      PARAMETER          ( ZERO = 0.0D+0, ONE = 1.0D+0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   COEF, HTAU, R11, R12, R22, SVMAX
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DDOT
      EXTERNAL           DDOT
*     ..
*     .. External Subroutines ..
      EXTERNAL           DAXPY, DLARFG, DLAS2
*     ..
*     .. Executable Statements ..
*
      IF( N.LE.1 ) THEN
*
*        Fewer than two rows: report zero and touch nothing else.
*
         SSMIN = ZERO
      ELSE
*
*        First reflector, built from X.  Its leading entry is kept
*        as R11 and then replaced by one so that X itself holds the
*        reflector vector.
*
         CALL DLARFG( N, X( 1 ), X( 1+INCX ), INCX, HTAU )
         R11 = X( 1 )
         X( 1 ) = ONE
*
*        Apply that reflector to Y:  Y := Y - HTAU*( X**T*Y )*X.
*
         COEF = -HTAU*DDOT( N, X, INCX, Y, INCY )
         CALL DAXPY( N, COEF, X, INCX, Y, INCY )
*
*        Second reflector, built from the trailing N-1 entries of Y.
*
         CALL DLARFG( N-1, Y( 1+INCY ), Y( 1+2*INCY ), INCY, HTAU )
*
         R12 = Y( 1 )
         R22 = Y( 1+INCY )
*
*        Singular values of the upper triangular [ R11 R12 ; 0 R22 ].
*
         CALL DLAS2( R11, R12, R22, SSMIN, SVMAX )
      END IF
*
      RETURN
*
*     End of DLAPLL
*

◆ dlapmr()

subroutine dlapmr	(	logical	forwrd,
		integer	m,
		integer	n,
		double precision, dimension( ldx, * )	x,
		integer	ldx,
		integer, dimension( * )	k )

DLAPMR rearranges rows of a matrix as specified by a permutation vector.

Download DLAPMR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAPMR rearranges the rows of the M by N matrix X as specified
!> by the permutation K(1),K(2),...,K(M) of the integers 1,...,M.
!> If FORWRD = .TRUE.,  forward permutation:
!>
!>      X(K(I),*) is moved to X(I,*) for I = 1,2,...,M.
!>
!> If FORWRD = .FALSE., backward permutation:
!>
!>      X(I,*) is moved to X(K(I),*) for I = 1,2,...,M.
!>

Parameters

[in]	FORWRD	!> FORWRD is LOGICAL !> = .TRUE., forward permutation !> = .FALSE., backward permutation !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix X. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix X. N >= 0. !>
[in,out]	X	!> X is DOUBLE PRECISION array, dimension (LDX,N) !> On entry, the M by N matrix X. !> On exit, X contains the permuted matrix X. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the array X, LDX >= MAX(1,M). !>
[in,out]	K	!> K is INTEGER array, dimension (M) !> On entry, K contains the permutation vector. K is used as !> internal workspace, but reset to its original value on !> output. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 103 of file dlapmr.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLAPMR.  The rows of X are permuted in place by walking
*     each cycle of the permutation K once and swapping rows along
*     the way.  The sign of K(.) serves as the "already placed" flag:
*     all entries are negated first, and each one is flipped back to
*     positive when its row has been handled.
*
*     .. Scalar Arguments ..
      LOGICAL            FORWRD
      INTEGER            LDX, M, N
*     ..
*     .. Array Arguments ..
      INTEGER            K( * )
      DOUBLE PRECISION   X( LDX, * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            COL, CUR, NXT, ROW
      DOUBLE PRECISION   HOLD
*     ..
*     .. Executable Statements ..
*
*     With fewer than two rows there is nothing to permute.
*
      IF( M.LE.1 ) RETURN
*
*     Mark every row as not yet placed.
*
      DO ROW = 1, M
         K( ROW ) = -K( ROW )
      END DO
*
      IF( FORWRD ) THEN
*
*        Forward permutation
*
         DO ROW = 1, M
            IF( K( ROW ).LE.0 ) THEN
*
*              ROW opens a cycle that has not been visited yet.
*
               CUR = ROW
               K( CUR ) = -K( CUR )
               NXT = K( CUR )
*
*              Follow the cycle until it returns to a placed row.
*
               DO WHILE( K( NXT ).LE.0 )
                  DO COL = 1, N
                     HOLD = X( CUR, COL )
                     X( CUR, COL ) = X( NXT, COL )
                     X( NXT, COL ) = HOLD
                  END DO
                  K( NXT ) = -K( NXT )
                  CUR = NXT
                  NXT = K( NXT )
               END DO
            END IF
         END DO
*
      ELSE
*
*        Backward permutation
*
         DO ROW = 1, M
            IF( K( ROW ).LE.0 ) THEN
*
*              ROW opens an unvisited cycle; row ROW is swapped with
*              each successive member until the cycle closes.
*
               K( ROW ) = -K( ROW )
               CUR = K( ROW )
               DO WHILE( CUR.NE.ROW )
                  DO COL = 1, N
                     HOLD = X( ROW, COL )
                     X( ROW, COL ) = X( CUR, COL )
                     X( CUR, COL ) = HOLD
                  END DO
                  K( CUR ) = -K( CUR )
                  CUR = K( CUR )
               END DO
            END IF
         END DO
*
      END IF
*
      RETURN
*
*     End of DLAPMR
*

◆ dlapmt()

subroutine dlapmt	(	logical	forwrd,
		integer	m,
		integer	n,
		double precision, dimension( ldx, * )	x,
		integer	ldx,
		integer, dimension( * )	k )

DLAPMT performs a forward or backward permutation of the columns of a matrix.

Download DLAPMT + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAPMT rearranges the columns of the M by N matrix X as specified
!> by the permutation K(1),K(2),...,K(N) of the integers 1,...,N.
!> If FORWRD = .TRUE.,  forward permutation:
!>
!>      X(*,K(J)) is moved to X(*,J) for J = 1,2,...,N.
!>
!> If FORWRD = .FALSE., backward permutation:
!>
!>      X(*,J) is moved to X(*,K(J)) for J = 1,2,...,N.
!>

Parameters

[in]	FORWRD	!> FORWRD is LOGICAL !> = .TRUE., forward permutation !> = .FALSE., backward permutation !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix X. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix X. N >= 0. !>
[in,out]	X	!> X is DOUBLE PRECISION array, dimension (LDX,N) !> On entry, the M by N matrix X. !> On exit, X contains the permuted matrix X. !>
[in]	LDX	!> LDX is INTEGER !> The leading dimension of the array X, LDX >= MAX(1,M). !>
[in,out]	K	!> K is INTEGER array, dimension (N) !> On entry, K contains the permutation vector. K is used as !> internal workspace, but reset to its original value on !> output. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 103 of file dlapmt.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLAPMT.  The columns of X are permuted in place by
*     walking each cycle of the permutation K once and swapping
*     columns along the way.  The sign of K(.) serves as the
*     "already placed" flag: all entries are negated first, and each
*     one is flipped back to positive when its column has been
*     handled.
*
*     .. Scalar Arguments ..
      LOGICAL            FORWRD
      INTEGER            LDX, M, N
*     ..
*     .. Array Arguments ..
      INTEGER            K( * )
      DOUBLE PRECISION   X( LDX, * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            COL, CUR, NXT, ROW
      DOUBLE PRECISION   HOLD
*     ..
*     .. Executable Statements ..
*
*     With fewer than two columns there is nothing to permute.
*
      IF( N.LE.1 ) RETURN
*
*     Mark every column as not yet placed.
*
      DO COL = 1, N
         K( COL ) = -K( COL )
      END DO
*
      IF( FORWRD ) THEN
*
*        Forward permutation
*
         DO COL = 1, N
            IF( K( COL ).LE.0 ) THEN
*
*              COL opens a cycle that has not been visited yet.
*
               CUR = COL
               K( CUR ) = -K( CUR )
               NXT = K( CUR )
*
*              Follow the cycle until it returns to a placed column.
*
               DO WHILE( K( NXT ).LE.0 )
                  DO ROW = 1, M
                     HOLD = X( ROW, CUR )
                     X( ROW, CUR ) = X( ROW, NXT )
                     X( ROW, NXT ) = HOLD
                  END DO
                  K( NXT ) = -K( NXT )
                  CUR = NXT
                  NXT = K( NXT )
               END DO
            END IF
         END DO
*
      ELSE
*
*        Backward permutation
*
         DO COL = 1, N
            IF( K( COL ).LE.0 ) THEN
*
*              COL opens an unvisited cycle; column COL is swapped
*              with each successive member until the cycle closes.
*
               K( COL ) = -K( COL )
               CUR = K( COL )
               DO WHILE( CUR.NE.COL )
                  DO ROW = 1, M
                     HOLD = X( ROW, COL )
                     X( ROW, COL ) = X( ROW, CUR )
                     X( ROW, CUR ) = HOLD
                  END DO
                  K( CUR ) = -K( CUR )
                  CUR = K( CUR )
               END DO
            END IF
         END DO
*
      END IF
*
      RETURN
*
*     End of DLAPMT
*

◆ dlaqp2()

subroutine dlaqp2	(	integer	m,
		integer	n,
		integer	offset,
		double precision, dimension( lda, * )	a,
		integer	lda,
		integer, dimension( * )	jpvt,
		double precision, dimension( * )	tau,
		double precision, dimension( * )	vn1,
		double precision, dimension( * )	vn2,
		double precision, dimension( * )	work )

DLAQP2 computes a QR factorization with column pivoting of the matrix block.

Download DLAQP2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAQP2 computes a QR factorization with column pivoting of
!> the block A(OFFSET+1:M,1:N).
!> The block A(1:OFFSET,1:N) is accordingly pivoted, but not factorized.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0. !>
[in]	OFFSET	!> OFFSET is INTEGER !> The number of rows of the matrix A that must be pivoted !> but not factorized. OFFSET >= 0. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> On entry, the M-by-N matrix A. !> On exit, the upper triangle of block A(OFFSET+1:M,1:N) is !> the triangular factor obtained; the elements in block !> A(OFFSET+1:M,1:N) below the diagonal, together with the !> array TAU, represent the orthogonal matrix Q as a product of !> elementary reflectors. Block A(1:OFFSET,1:N) has been !> accordingly pivoted, but not factorized. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[in,out]	JPVT	!> JPVT is INTEGER array, dimension (N) !> On entry, if JPVT(i) .ne. 0, the i-th column of A is permuted !> to the front of AP (a leading column); if JPVT(i) = 0, !> the i-th column of A is a free column. !> On exit, if JPVT(i) = k, then the i-th column of AP !> was the k-th column of A. !>
[out]	TAU	!> TAU is DOUBLE PRECISION array, dimension (min(M,N)) !> The scalar factors of the elementary reflectors. !>
[in,out]	VN1	!> VN1 is DOUBLE PRECISION array, dimension (N) !> The vector with the partial column norms. !>
[in,out]	VN2	!> VN2 is DOUBLE PRECISION array, dimension (N) !> The vector with the exact column norms. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (N) !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: G. Quintana-Orti, Depto. de Informatica, Universidad Jaime I, Spain X. Sun, Computer Science Dept., Duke University, USA
Partial column norm updating strategy modified on April 2011 Z. Drmac and Z. Bujanovic, Dept. of Mathematics, University of Zagreb, Croatia.

References:: LAPACK Working Note 176 [PDF]

Definition at line 147 of file dlaqp2.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLAQP2: unblocked QR factorization with column pivoting
*     of the block A(OFFSET+1:M,1:N).  Rows 1:OFFSET take part in the
*     column swaps only.  VN1 holds the running (partial) column
*     norms that drive the pivot choice; VN2 holds the norm value
*     from the last explicit recomputation.
*
*     .. Scalar Arguments ..
      INTEGER            LDA, M, N, OFFSET
*     ..
*     .. Array Arguments ..
      INTEGER            JPVT( * )
      DOUBLE PRECISION   A( LDA, * ), TAU( * ), VN1( * ), VN2( * ),
     $                   WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d+0, one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            I, ITEMP, J, MN, OFFPI, PVT
      DOUBLE PRECISION   AII, TEMP, TEMP2, TOL3Z
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlarf, dlarfg, dswap
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min, sqrt
*     ..
*     .. External Functions ..
      INTEGER            IDAMAX
      DOUBLE PRECISION   DLAMCH, DNRM2
      EXTERNAL           idamax, dlamch, dnrm2
*     ..
*     .. Executable Statements ..
*
*     MN is the number of reflectors to generate.  TOL3Z is the
*     threshold below which a downdated norm is recomputed from
*     scratch.
*
      mn = min( m-offset, n )
      tol3z = sqrt(dlamch('Epsilon'))
*
*     Compute factorization.
*
      DO 20 i = 1, mn
*
*        OFFPI is the row of A that carries the i-th diagonal entry.
*
         offpi = offset + i
*
*        Determine ith pivot column and swap if necessary.
*
*        The pivot is chosen from the partial norms VN1(I:N).
*
         pvt = ( i-1 ) + idamax( n-i+1, vn1( i ), 1 )
*
         IF( pvt.NE.i ) THEN
            CALL dswap( m, a( 1, pvt ), 1, a( 1, i ), 1 )
            itemp = jpvt( pvt )
            jpvt( pvt ) = jpvt( i )
            jpvt( i ) = itemp
*
*           Only position PVT receives norm values; entry I of
*           VN1/VN2 is not read by the update loop below, which
*           starts at column I+1.
*
            vn1( pvt ) = vn1( i )
            vn2( pvt ) = vn2( i )
         END IF
*
*        Generate elementary reflector H(i).
*
*        When OFFPI = M only one row remains, so a reflector of
*        order 1 is requested.
*
         IF( offpi.LT.m ) THEN
            CALL dlarfg( m-offpi+1, a( offpi, i ), a( offpi+1, i ), 1,
     $                   tau( i ) )
         ELSE
            CALL dlarfg( 1, a( m, i ), a( m, i ), 1, tau( i ) )
         END IF
*
         IF( i.LT.n ) THEN
*
*           Apply H(i)**T to A(offset+i:m,i+1:n) from the left.
*
*           The diagonal entry is saved in AII and temporarily set to
*           one so that column I can be passed to DLARF as the
*           reflector vector; it is restored afterwards.
*
            aii = a( offpi, i )
            a( offpi, i ) = one
            CALL dlarf( 'Left', m-offpi+1, n-i, a( offpi, i ), 1,
     $                  tau( i ), a( offpi, i+1 ), lda, work( 1 ) )
            a( offpi, i ) = aii
         END IF
*
*        Update partial column norms.
*
         DO 10 j = i + 1, n
            IF( vn1( j ).NE.zero ) THEN
*
*              NOTE: The following 4 lines follow from the analysis in
*              Lapack Working Note 176.
*
*              TEMP is the downdate factor 1 - ( |A(OFFPI,J)|/VN1(J) )**2,
*              clamped at zero.  TEMP2 compares the downdated norm with
*              the last explicitly computed one (VN2).
*
               temp = one - ( abs( a( offpi, j ) ) / vn1( j ) )**2
               temp = max( temp, zero )
               temp2 = temp*( vn1( j ) / vn2( j ) )**2
               IF( temp2 .LE. tol3z ) THEN
*
*                 The downdate is not trusted: recompute the norm of
*                 rows OFFPI+1:M explicitly, or set it to zero when no
*                 rows remain.
*
                  IF( offpi.LT.m ) THEN
                     vn1( j ) = dnrm2( m-offpi, a( offpi+1, j ), 1 )
                     vn2( j ) = vn1( j )
                  ELSE
                     vn1( j ) = zero
                     vn2( j ) = zero
                  END IF
               ELSE
                  vn1( j ) = vn1( j )*sqrt( temp )
               END IF
            END IF
   10    CONTINUE
*
   20 CONTINUE
*
      RETURN
*
*     End of DLAQP2
*

◆ dlaqps()

subroutine dlaqps	(	integer	m,
		integer	n,
		integer	offset,
		integer	nb,
		integer	kb,
		double precision, dimension( lda, * )	a,
		integer	lda,
		integer, dimension( * )	jpvt,
		double precision, dimension( * )	tau,
		double precision, dimension( * )	vn1,
		double precision, dimension( * )	vn2,
		double precision, dimension( * )	auxv,
		double precision, dimension( ldf, * )	f,
		integer	ldf )

DLAQPS computes a step of QR factorization with column pivoting of a real m-by-n matrix A by using BLAS level 3.

Download DLAQPS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAQPS computes a step of QR factorization with column pivoting
!> of a real M-by-N matrix A by using Blas-3.  It tries to factorize
!> NB columns from A starting from the row OFFSET+1, and updates all
!> of the matrix with Blas-3 xGEMM.
!>
!> In some cases, due to catastrophic cancellations, it cannot
!> factorize NB columns.  Hence, the actual number of factorized
!> columns is returned in KB.
!>
!> Block A(1:OFFSET,1:N) is accordingly pivoted, but not factorized.
!>

Parameters

[in]	M	!> M is INTEGER !> The number of rows of the matrix A. M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix A. N >= 0 !>
[in]	OFFSET	!> OFFSET is INTEGER !> The number of rows of A that have been factorized in !> previous steps. !>
[in]	NB	!> NB is INTEGER !> The number of columns to factorize. !>
[out]	KB	!> KB is INTEGER !> The number of columns actually factorized. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> On entry, the M-by-N matrix A. !> On exit, block A(OFFSET+1:M,1:KB) is the triangular !> factor obtained and block A(1:OFFSET,1:N) has been !> accordingly pivoted, but not factorized. !> The rest of the matrix, block A(OFFSET+1:M,KB+1:N) has !> been updated. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,M). !>
[in,out]	JPVT	!> JPVT is INTEGER array, dimension (N) !> JPVT(I) = K <==> Column K of the full matrix A has been !> permuted into position I in AP. !>
[out]	TAU	!> TAU is DOUBLE PRECISION array, dimension (KB) !> The scalar factors of the elementary reflectors. !>
[in,out]	VN1	!> VN1 is DOUBLE PRECISION array, dimension (N) !> The vector with the partial column norms. !>
[in,out]	VN2	!> VN2 is DOUBLE PRECISION array, dimension (N) !> The vector with the exact column norms. !>
[in,out]	AUXV	!> AUXV is DOUBLE PRECISION array, dimension (NB) !> Auxiliary vector. !>
[in,out]	F	!> F is DOUBLE PRECISION array, dimension (LDF,NB) !> Matrix F**T = L*Y**T*A. !>
[in]	LDF	!> LDF is INTEGER !> The leading dimension of the array F. LDF >= max(1,N). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: G. Quintana-Orti, Depto. de Informatica, Universidad Jaime I, Spain X. Sun, Computer Science Dept., Duke University, USA
Partial column norm updating strategy modified on April 2011 Z. Drmac and Z. Bujanovic, Dept. of Mathematics, University of Zagreb, Croatia.

References:: LAPACK Working Note 176 [PDF]

Definition at line 175 of file dlaqps.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Body of DLAQPS: one blocked step of QR with column pivoting.
*     Up to NB columns are factorized starting at row OFFSET+1; the
*     number actually done is returned in KB.  The loop stops early
*     as soon as a column's downdated norm is no longer trusted
*     (LSTICC becomes nonzero).  The trailing block is then updated
*     with one DGEMM and the flagged norms are recomputed.
*
*     .. Scalar Arguments ..
      INTEGER            KB, LDA, LDF, M, N, NB, OFFSET
*     ..
*     .. Array Arguments ..
      INTEGER            JPVT( * )
      DOUBLE PRECISION   A( LDA, * ), AUXV( * ), F( LDF, * ), TAU( * ),
     $                   VN1( * ), VN2( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d+0, one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            ITEMP, J, K, LASTRK, LSTICC, PVT, RK
      DOUBLE PRECISION   AKK, TEMP, TEMP2, TOL3Z
*     ..
*     .. External Subroutines ..
      EXTERNAL           dgemm, dgemv, dlarfg, dswap
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, dble, max, min, nint, sqrt
*     ..
*     .. External Functions ..
      INTEGER            IDAMAX
      DOUBLE PRECISION   DLAMCH, DNRM2
      EXTERNAL           idamax, dlamch, dnrm2
*     ..
*     .. Executable Statements ..
*
*     LASTRK: partial norms are downdated only while RK < LASTRK.
*     LSTICC: head of a linked list of columns whose norm must be
*             recomputed; 0 means the list is empty.  The links are
*             stored, as floating-point values, in VN2.
*     TOL3Z:  threshold for distrusting a downdated norm.
*
      lastrk = min( m, n+offset )
      lsticc = 0
      k = 0
      tol3z = sqrt(dlamch('Epsilon'))
*
*     Beginning of while loop.
*
   10 CONTINUE
      IF( ( k.LT.nb ) .AND. ( lsticc.EQ.0 ) ) THEN
         k = k + 1
         rk = offset + k
*
*        Determine kth pivot column and swap if necessary
*
*        The rows of F built so far are swapped along with the
*        columns of A so that F stays aligned with the pivoting.
*
         pvt = ( k-1 ) + idamax( n-k+1, vn1( k ), 1 )
         IF( pvt.NE.k ) THEN
            CALL dswap( m, a( 1, pvt ), 1, a( 1, k ), 1 )
            CALL dswap( k-1, f( pvt, 1 ), ldf, f( k, 1 ), ldf )
            itemp = jpvt( pvt )
            jpvt( pvt ) = jpvt( k )
            jpvt( k ) = itemp
            vn1( pvt ) = vn1( k )
            vn2( pvt ) = vn2( k )
         END IF
*
*        Apply previous Householder reflectors to column K:
*        A(RK:M,K) := A(RK:M,K) - A(RK:M,1:K-1)*F(K,1:K-1)**T.
*
         IF( k.GT.1 ) THEN
            CALL dgemv( 'No transpose', m-rk+1, k-1, -one, a( rk, 1 ),
     $                  lda, f( k, 1 ), ldf, one, a( rk, k ), 1 )
         END IF
*
*        Generate elementary reflector H(k).
*
*        When RK = M only one row remains, so a reflector of order 1
*        is requested.
*
         IF( rk.LT.m ) THEN
            CALL dlarfg( m-rk+1, a( rk, k ), a( rk+1, k ), 1, tau( k ) )
         ELSE
            CALL dlarfg( 1, a( rk, k ), a( rk, k ), 1, tau( k ) )
         END IF
*
*        Save the diagonal entry and replace it by one so that
*        A(RK:M,K) can be used as the reflector vector below; it is
*        restored at the end of this iteration.
*
         akk = a( rk, k )
         a( rk, k ) = one
*
*        Compute Kth column of F:
*
*        Compute  F(K+1:N,K) := tau(K)*A(RK:M,K+1:N)**T*A(RK:M,K).
*
         IF( k.LT.n ) THEN
            CALL dgemv( 'Transpose', m-rk+1, n-k, tau( k ),
     $                  a( rk, k+1 ), lda, a( rk, k ), 1, zero,
     $                  f( k+1, k ), 1 )
         END IF
*
*        Padding F(1:K,K) with zeros.
*
         DO 20 j = 1, k
            f( j, k ) = zero
   20    CONTINUE
*
*        Incremental updating of F:
*        F(1:N,K) := F(1:N,K) - tau(K)*F(1:N,1:K-1)*A(RK:M,1:K-1)**T
*                    *A(RK:M,K).
*
*        AUXV(1:K-1) holds the intermediate vector
*        -tau(K)*A(RK:M,1:K-1)**T*A(RK:M,K).
*
         IF( k.GT.1 ) THEN
            CALL dgemv( 'Transpose', m-rk+1, k-1, -tau( k ), a( rk, 1 ),
     $                  lda, a( rk, k ), 1, zero, auxv( 1 ), 1 )
*
            CALL dgemv( 'No transpose', n, k-1, one, f( 1, 1 ), ldf,
     $                  auxv( 1 ), 1, one, f( 1, k ), 1 )
         END IF
*
*        Update the current row of A:
*        A(RK,K+1:N) := A(RK,K+1:N) - A(RK,1:K)*F(K+1:N,1:K)**T.
*
         IF( k.LT.n ) THEN
            CALL dgemv( 'No transpose', n-k, k, -one, f( k+1, 1 ), ldf,
     $                  a( rk, 1 ), lda, one, a( rk, k+1 ), lda )
         END IF
*
*        Update partial column norms.
*
         IF( rk.LT.lastrk ) THEN
            DO 30 j = k + 1, n
               IF( vn1( j ).NE.zero ) THEN
*
*                 NOTE: The following 4 lines follow from the analysis in
*                 Lapack Working Note 176.
*
                  temp = abs( a( rk, j ) ) / vn1( j )
                  temp = max( zero, ( one+temp )*( one-temp ) )
                  temp2 = temp*( vn1( j ) / vn2( j ) )**2
                  IF( temp2 .LE. tol3z ) THEN
*
*                    Downdate not trusted: push column J onto the
*                    linked list.  VN2(J) stores the previous list
*                    head, and J becomes the new head.
*
                     vn2( j ) = dble( lsticc )
                     lsticc = j
                  ELSE
                     vn1( j ) = vn1( j )*sqrt( temp )
                  END IF
               END IF
   30       CONTINUE
         END IF
*
         a( rk, k ) = akk
*
*        End of while loop.
*
         GO TO 10
      END IF
      kb = k
      rk = offset + kb
*
*     Apply the block reflector to the rest of the matrix:
*     A(OFFSET+KB+1:M,KB+1:N) := A(OFFSET+KB+1:M,KB+1:N) -
*                         A(OFFSET+KB+1:M,1:KB)*F(KB+1:N,1:KB)**T.
*
      IF( kb.LT.min( n, m-offset ) ) THEN
         CALL dgemm( 'No transpose', 'Transpose', m-rk, n-kb, kb, -one,
     $               a( rk+1, 1 ), lda, f( kb+1, 1 ), ldf, one,
     $               a( rk+1, kb+1 ), lda )
      END IF
*
*     Recomputation of difficult columns.
*
*     Walk the linked list: read the next link out of VN2 before
*     overwriting VN1 and VN2 with the freshly computed norm of rows
*     RK+1:M of the column.
*
   40 CONTINUE
      IF( lsticc.GT.0 ) THEN
         itemp = nint( vn2( lsticc ) )
         vn1( lsticc ) = dnrm2( m-rk, a( rk+1, lsticc ), 1 )
*
*        NOTE: The computation of VN1( LSTICC ) relies on the fact that
*        DNRM2 does not fail on vectors with norm below the value of
*        SQRT(DLAMCH('S'))
*
         vn2( lsticc ) = vn1( lsticc )
         lsticc = itemp
         GO TO 40
      END IF
*
      RETURN
*
*     End of DLAQPS
*

◆ dlaqr0()

subroutine dlaqr0	(	logical	wantt,
		logical	wantz,
		integer	n,
		integer	ilo,
		integer	ihi,
		double precision, dimension( ldh, * )	h,
		integer	ldh,
		double precision, dimension( * )	wr,
		double precision, dimension( * )	wi,
		integer	iloz,
		integer	ihiz,
		double precision, dimension( ldz, * )	z,
		integer	ldz,
		double precision, dimension( * )	work,
		integer	lwork,
		integer	info )

DLAQR0 computes the eigenvalues of a Hessenberg matrix, and optionally the matrices from the Schur decomposition.

Download DLAQR0 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!>    DLAQR0 computes the eigenvalues of a Hessenberg matrix H
!>    and, optionally, the matrices T and Z from the Schur decomposition
!>    H = Z T Z**T, where T is an upper quasi-triangular matrix (the
!>    Schur form), and Z is the orthogonal matrix of Schur vectors.
!>
!>    Optionally Z may be postmultiplied into an input orthogonal
!>    matrix Q so that this routine can give the Schur factorization
!>    of a matrix A which has been reduced to the Hessenberg form H
!>    by the orthogonal matrix Q:  A = Q*H*Q**T = (QZ)*T*(QZ)**T.
!>

Parameters

[in]	WANTT	!> WANTT is LOGICAL !> = .TRUE. : the full Schur form T is required; !> = .FALSE.: only eigenvalues are required. !>
[in]	WANTZ	!> WANTZ is LOGICAL !> = .TRUE. : the matrix of Schur vectors Z is required; !> = .FALSE.: Schur vectors are not required. !>
[in]	N	!> N is INTEGER !> The order of the matrix H. N >= 0. !>
[in]	ILO	!> ILO is INTEGER !>
[in]	IHI	!> IHI is INTEGER !> It is assumed that H is already upper triangular in rows !> and columns 1:ILO-1 and IHI+1:N and, if ILO > 1, !> H(ILO,ILO-1) is zero. ILO and IHI are normally set by a !> previous call to DGEBAL, and then passed to DGEHRD when the !> matrix output by DGEBAL is reduced to Hessenberg form. !> Otherwise, ILO and IHI should be set to 1 and N, !> respectively. If N > 0, then 1 <= ILO <= IHI <= N. !> If N = 0, then ILO = 1 and IHI = 0. !>
[in,out]	H	!> H is DOUBLE PRECISION array, dimension (LDH,N) !> On entry, the upper Hessenberg matrix H. !> On exit, if INFO = 0 and WANTT is .TRUE., then H contains !> the upper quasi-triangular matrix T from the Schur !> decomposition (the Schur form); 2-by-2 diagonal blocks !> (corresponding to complex conjugate pairs of eigenvalues) !> are returned in standard form, with H(i,i) = H(i+1,i+1) !> and H(i+1,i)*H(i,i+1) < 0. If INFO = 0 and WANTT is !> .FALSE., then the contents of H are unspecified on exit. !> (The output value of H when INFO > 0 is given under the !> description of INFO below.) !> !> This subroutine may explicitly set H(i,j) = 0 for i > j and !> j = 1, 2, ... ILO-1 or j = IHI+1, IHI+2, ... N. !>
[in]	LDH	!> LDH is INTEGER !> The leading dimension of the array H. LDH >= max(1,N). !>
[out]	WR	!> WR is DOUBLE PRECISION array, dimension (IHI) !>
[out]	WI	!> WI is DOUBLE PRECISION array, dimension (IHI) !> The real and imaginary parts, respectively, of the computed !> eigenvalues of H(ILO:IHI,ILO:IHI) are stored in WR(ILO:IHI) !> and WI(ILO:IHI). If two eigenvalues are computed as a !> complex conjugate pair, they are stored in consecutive !> elements of WR and WI, say the i-th and (i+1)th, with !> WI(i) > 0 and WI(i+1) < 0. If WANTT is .TRUE., then !> the eigenvalues are stored in the same order as on the !> diagonal of the Schur form returned in H, with !> WR(i) = H(i,i) and, if H(i:i+1,i:i+1) is a 2-by-2 diagonal !> block, WI(i) = sqrt(-H(i+1,i)*H(i,i+1)) and !> WI(i+1) = -WI(i). !>
[in]	ILOZ	!> ILOZ is INTEGER !>
[in]	IHIZ	!> IHIZ is INTEGER !> Specify the rows of Z to which transformations must be !> applied if WANTZ is .TRUE.. !> 1 <= ILOZ <= ILO; IHI <= IHIZ <= N. !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, dimension (LDZ,IHI) !> If WANTZ is .FALSE., then Z is not referenced. !> If WANTZ is .TRUE., then Z(ILO:IHI,ILOZ:IHIZ) is !> replaced by Z(ILO:IHI,ILOZ:IHIZ)*U where U is the !> orthogonal Schur factor of H(ILO:IHI,ILO:IHI). !> (The output value of Z when INFO > 0 is given under !> the description of INFO below.) !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. if WANTZ is .TRUE. !> then LDZ >= MAX(1,IHIZ). Otherwise, LDZ >= 1. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension LWORK !> On exit, if LWORK = -1, WORK(1) returns an estimate of !> the optimal value for LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,N) !> is sufficient, but LWORK typically as large as 6*N may !> be required for optimal performance. A workspace query !> to determine the optimal workspace size is recommended. !> !> If LWORK = -1, then DLAQR0 does a workspace query. !> In this case, DLAQR0 checks the input parameters and !> estimates the optimal workspace size for the given !> values of N, ILO and IHI. The estimate is returned !> in WORK(1). No error message related to LWORK is !> issued by XERBLA. Neither H nor Z are accessed. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> > 0: if INFO = i, DLAQR0 failed to compute all of !> the eigenvalues. Elements 1:ilo-1 and i+1:n of WR !> and WI contain those eigenvalues which have been !> successfully computed. (Failures are rare.) !> !> If INFO > 0 and WANTT is .FALSE., then on exit, !> the remaining unconverged eigenvalues are the eigen- !> values of the upper Hessenberg matrix rows and !> columns ILO through INFO of the final, output !> value of H. !> !> If INFO > 0 and WANTT is .TRUE., then on exit !> !> (*) (initial value of H)*U = U*(final value of H) !> !> where U is an orthogonal matrix. The final !> value of H is upper Hessenberg and quasi-triangular !> in rows and columns INFO+1 through IHI. !> !> If INFO > 0 and WANTZ is .TRUE., then on exit !> !> (final value of Z(ILO:IHI,ILOZ:IHIZ)) !> = (initial value of Z(ILO:IHI,ILOZ:IHIZ))*U !> !> where U is the orthogonal matrix in (*) (regard- !> less of the value of WANTT.) !> !> If INFO > 0 and WANTZ is .FALSE., then Z is not !> accessed. !>

Contributors:: Karen Braman and Ralph Byers, Department of Mathematics, University of Kansas, USA

References:

 K. Braman, R. Byers and R. Mathias, The Multi-Shift QR
 Algorithm Part I: Maintaining Well Focused Shifts, and Level 3
 Performance, SIAM Journal of Matrix Analysis, volume 23, pages
 929--947, 2002.

K. Braman, R. Byers and R. Mathias, The Multi-Shift QR Algorithm Part II: Aggressive Early Deflation, SIAM Journal of Matrix Analysis, volume 23, pages 948–973, 2002.

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 254 of file dlaqr0.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Overview of this body:
*       - N = 0 returns immediately with WORK(1) = ONE.
*       - N <= NTINY is handed to DLAHQR (skipped for LWORK = -1).
*       - Otherwise the main loop alternates aggressive early
*         deflation (DLAQR3) with small-bulge multi-shift QR sweeps
*         (DLAQR5) on the active block H(KTOP:KBOT,KTOP:KBOT) until
*         KBOT falls below ILO or ITMAX iterations have been used.
*       - INFO is 0 on normal completion and KBOT when the iteration
*         limit is exceeded; WORK(1) returns LWKOPT on exit.
*
*     .. Scalar Arguments ..
      INTEGER            IHI, IHIZ, ILO, ILOZ, INFO, LDH, LDZ, LWORK, N
      LOGICAL            WANTT, WANTZ
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   H( LDH, * ), WI( * ), WORK( * ), WR( * ),
     $                   Z( LDZ, * )
*     ..
*
*  ================================================================
*
*     .. Parameters ..
*
*     ==== Matrices of order NTINY or smaller must be processed by
*     .    DLAHQR because of insufficient subdiagonal scratch space.
*     .    (This is a hard limit.) ====
      INTEGER            NTINY
      parameter( ntiny = 15 )
*
*     ==== Exceptional deflation windows:  try to cure rare
*     .    slow convergence by varying the size of the
*     .    deflation window after KEXNW iterations. ====
      INTEGER            KEXNW
      parameter( kexnw = 5 )
*
*     ==== Exceptional shifts: try to cure rare slow convergence
*     .    with ad-hoc exceptional shifts every KEXSH iterations.
*     .    ====
      INTEGER            KEXSH
      parameter( kexsh = 6 )
*
*     ==== The constants WILK1 and WILK2 are used to form the
*     .    exceptional shifts. ====
      DOUBLE PRECISION   WILK1, WILK2
      parameter( wilk1 = 0.75d0, wilk2 = -0.4375d0 )
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d0, one = 1.0d0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   AA, BB, CC, CS, DD, SN, SS, SWAP
      INTEGER            I, INF, IT, ITMAX, K, KACC22, KBOT, KDU, KS,
     $                   KT, KTOP, KU, KV, KWH, KWTOP, KWV, LD, LS,
     $                   LWKOPT, NDEC, NDFL, NH, NHO, NIBBLE, NMIN, NS,
     $                   NSMAX, NSR, NVE, NW, NWMAX, NWR, NWUPBD
      LOGICAL            SORTED
      CHARACTER          JBCMPZ*2
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Local Arrays ..
*     ==== ZDUM stands in for Z in the shift-computation calls to
*     .    DLAQR4/DLAHQR below, which pass WANTZ = .FALSE.. ====
      DOUBLE PRECISION   ZDUM( 1, 1 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlacpy, dlahqr, dlanv2, dlaqr3, dlaqr4, dlaqr5
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, dble, int, max, min, mod
*     ..
*     .. Executable Statements ..
      info = 0
*
*     ==== Quick return for N = 0: nothing to do. ====
*
      IF( n.EQ.0 ) THEN
         work( 1 ) = one
         RETURN
      END IF
*
      IF( n.LE.ntiny ) THEN
*
*        ==== Tiny matrices must use DLAHQR. ====
*
*        ==== DLAHQR takes no workspace argument, so the optimal
*        .    LWORK reported for this path is 1.  On a workspace
*        .    query (LWORK = -1) the call is skipped. ====
*
         lwkopt = 1
         IF( lwork.NE.-1 )
     $      CALL dlahqr( wantt, wantz, n, ilo, ihi, h, ldh, wr, wi,
     $                   iloz, ihiz, z, ldz, info )
      ELSE
*
*        ==== Use small bulge multi-shift QR with aggressive early
*        .    deflation on larger-than-tiny matrices. ====
*
*        ==== Hope for the best. ====
*
         info = 0
*
*        ==== Set up job flags for ILAENV. ====
*
         IF( wantt ) THEN
            jbcmpz( 1: 1 ) = 'S'
         ELSE
            jbcmpz( 1: 1 ) = 'E'
         END IF
         IF( wantz ) THEN
            jbcmpz( 2: 2 ) = 'V'
         ELSE
            jbcmpz( 2: 2 ) = 'N'
         END IF
*
*        ==== NWR = recommended deflation window size.  At this
*        .    point,  N .GT. NTINY = 15, so there is enough
*        .    subdiagonal workspace for NWR.GE.2 as required.
*        .    (In fact, there is enough subdiagonal space for
*        .    NWR.GE.4.) ====
*
         nwr = ilaenv( 13, 'DLAQR0', jbcmpz, n, ilo, ihi, lwork )
         nwr = max( 2, nwr )
         nwr = min( ihi-ilo+1, ( n-1 ) / 3, nwr )
*
*        ==== NSR = recommended number of simultaneous shifts.
*        .    At this point N .GT. NTINY = 15, so there is
*        .    enough subdiagonal workspace for NSR to be even
*        .    and greater than or equal to two as required. ====
*
         nsr = ilaenv( 15, 'DLAQR0', jbcmpz, n, ilo, ihi, lwork )
         nsr = min( nsr, ( n-3 ) / 6, ihi-ilo )
         nsr = max( 2, nsr-mod( nsr, 2 ) )
*
*        ==== Estimate optimal workspace ====
*
*        ==== Workspace query call to DLAQR3 ====
*
*        ==== LWORK = -1 is passed, and the estimate is read back
*        .    from WORK(1) below.  H is passed in the scratch-array
*        .    slots only as a placeholder for this query. ====
*
         CALL dlaqr3( wantt, wantz, n, ilo, ihi, nwr+1, h, ldh, iloz,
     $                ihiz, z, ldz, ls, ld, wr, wi, h, ldh, n, h, ldh,
     $                n, h, ldh, work, -1 )
*
*        ==== Optimal workspace = MAX(DLAQR5, DLAQR3) ====
*
         lwkopt = max( 3*nsr / 2, int( work( 1 ) ) )
*
*        ==== Quick return in case of workspace query. ====
*
         IF( lwork.EQ.-1 ) THEN
            work( 1 ) = dble( lwkopt )
            RETURN
         END IF
*
*        ==== DLAHQR/DLAQR0 crossover point ====
*
         nmin = ilaenv( 12, 'DLAQR0', jbcmpz, n, ilo, ihi, lwork )
         nmin = max( ntiny, nmin )
*
*        ==== Nibble crossover point ====
*
         nibble = ilaenv( 14, 'DLAQR0', jbcmpz, n, ilo, ihi, lwork )
         nibble = max( 0, nibble )
*
*        ==== Accumulate reflections during ttswp?  Use block
*        .    2-by-2 structure during matrix-matrix multiply? ====
*
*        ==== The value returned by ILAENV is clamped to 0..2. ====
*
         kacc22 = ilaenv( 16, 'DLAQR0', jbcmpz, n, ilo, ihi, lwork )
         kacc22 = max( 0, kacc22 )
         kacc22 = min( 2, kacc22 )
*
*        ==== NWMAX = the largest possible deflation window for
*        .    which there is sufficient workspace. ====
*
         nwmax = min( ( n-1 ) / 3, lwork / 2 )
         nw = nwmax
*
*        ==== NSMAX = the largest number of simultaneous shifts
*        .    for which there is sufficient workspace. ====
*
         nsmax = min( ( n-3 ) / 6, 2*lwork / 3 )
         nsmax = nsmax - mod( nsmax, 2 )
*
*        ==== NDFL: an iteration count restarted at deflation. ====
*
         ndfl = 1
*
*        ==== ITMAX = iteration limit ====
*
         itmax = max( 30, 2*kexsh )*max( 10, ( ihi-ilo+1 ) )
*
*        ==== Last row and column in the active block ====
*
         kbot = ihi
*
*        ==== Main Loop ====
*
         DO 80 it = 1, itmax
*
*           ==== Done when KBOT falls below ILO ====
*
            IF( kbot.LT.ilo )
     $         GO TO 90
*
*           ==== Locate active block ====
*
*           ==== Scan upward from KBOT for the first exactly zero
*           .    subdiagonal entry; KTOP is the row just below it,
*           .    or ILO when none is found. ====
*
            DO 10 k = kbot, ilo + 1, -1
               IF( h( k, k-1 ).EQ.zero )
     $            GO TO 20
   10       CONTINUE
            k = ilo
   20       CONTINUE
            ktop = k
*
*           ==== Select deflation window size:
*           .    Typical Case:
*           .      If possible and advisable, nibble the entire
*           .      active block.  If not, use size MIN(NWR,NWMAX)
*           .      or MIN(NWR+1,NWMAX) depending upon which has
*           .      the smaller corresponding subdiagonal entry
*           .      (a heuristic).
*           .
*           .    Exceptional Case:
*           .      If there have been no deflations in KEXNW or
*           .      more iterations, then vary the deflation window
*           .      size.   At first, because larger windows are,
*           .      in general, more powerful than smaller ones,
*           .      rapidly increase the window to the maximum possible.
*           .      Then, gradually reduce the window size. ====
*
            nh = kbot - ktop + 1
            nwupbd = min( nh, nwmax )
            IF( ndfl.LT.kexnw ) THEN
               nw = min( nwupbd, nwr )
            ELSE
               nw = min( nwupbd, 2*nw )
            END IF
            IF( nw.LT.nwmax ) THEN
               IF( nw.GE.nh-1 ) THEN
                  nw = nh
               ELSE
                  kwtop = kbot - nw + 1
                  IF( abs( h( kwtop, kwtop-1 ) ).GT.
     $                abs( h( kwtop-1, kwtop-2 ) ) )nw = nw + 1
               END IF
            END IF
*
*           ==== NDEC is assigned -1 on every pass with
*           .    NDFL.LT.KEXNW.  Since NDFL starts at 1, that
*           .    happens on the first pass, so NDEC is defined
*           .    before the ELSE IF branch ever reads it. ====
*
            IF( ndfl.LT.kexnw ) THEN
               ndec = -1
            ELSE IF( ndec.GE.0 .OR. nw.GE.nwupbd ) THEN
               ndec = ndec + 1
               IF( nw-ndec.LT.2 )
     $            ndec = 0
               nw = nw - ndec
            END IF
*
*           ==== Aggressive early deflation:
*           .    split workspace under the subdiagonal into
*           .      - an nw-by-nw work array V in the lower
*           .        left-hand-corner,
*           .      - an NW-by-at-least-NW-but-more-is-better
*           .        (NW-by-NHO) horizontal work array along
*           .        the bottom edge,
*           .      - an at-least-NW-but-more-is-better (NVE-by-NW)
*           .        vertical work array along the left-hand-edge.
*           .        ====
*
            kv = n - nw + 1
            kt = nw + 1
            nho = ( n-nw-1 ) - kt + 1
            kwv = nw + 2
            nve = ( n-nw ) - kwv + 1
*
*           ==== Aggressive early deflation ====
*
*           ==== LS and LD are returned by DLAQR3; below, LD is
*           .    subtracted from KBOT and LS locates the shifts. ====
*
            CALL dlaqr3( wantt, wantz, n, ktop, kbot, nw, h, ldh, iloz,
     $                   ihiz, z, ldz, ls, ld, wr, wi, h( kv, 1 ), ldh,
     $                   nho, h( kv, kt ), ldh, nve, h( kwv, 1 ), ldh,
     $                   work, lwork )
*
*           ==== Adjust KBOT accounting for new deflations. ====
*
            kbot = kbot - ld
*
*           ==== KS points to the shifts. ====
*
            ks = kbot - ls + 1
*
*           ==== Skip an expensive QR sweep if there is a (partly
*           .    heuristic) reason to expect that many eigenvalues
*           .    will deflate without it.  Here, the QR sweep is
*           .    skipped if many eigenvalues have just been deflated
*           .    or if the remaining active block is small. ====
*
            IF( ( ld.EQ.0 ) .OR. ( ( 100*ld.LE.nw*nibble ) .AND. ( kbot-
     $          ktop+1.GT.min( nmin, nwmax ) ) ) ) THEN
*
*              ==== NS = nominal number of simultaneous shifts.
*              .    This may be lowered (slightly) if DLAQR3
*              .    did not provide that many shifts. ====
*
               ns = min( nsmax, nsr, max( 2, kbot-ktop ) )
               ns = ns - mod( ns, 2 )
*
*              ==== If there have been no deflations
*              .    in a multiple of KEXSH iterations,
*              .    then try exceptional shifts.
*              .    Otherwise use shifts provided by
*              .    DLAQR3 above or from the eigenvalues
*              .    of a trailing principal submatrix. ====
*
               IF( mod( ndfl, kexsh ).EQ.0 ) THEN
                  ks = kbot - ns + 1
                  DO 30 i = kbot, max( ks+1, ktop+2 ), -2
                     ss = abs( h( i, i-1 ) ) + abs( h( i-1, i-2 ) )
                     aa = wilk1*ss + h( i, i )
                     bb = ss
                     cc = wilk2*ss
                     dd = aa
                     CALL dlanv2( aa, bb, cc, dd, wr( i-1 ), wi( i-1 ),
     $                            wr( i ), wi( i ), cs, sn )
   30             CONTINUE
                  IF( ks.EQ.ktop ) THEN
                     wr( ks+1 ) = h( ks+1, ks+1 )
                     wi( ks+1 ) = zero
                     wr( ks ) = wr( ks+1 )
                     wi( ks ) = wi( ks+1 )
                  END IF
               ELSE
*
*                 ==== Got NS/2 or fewer shifts? Use DLAQR4 or
*                 .    DLAHQR on a trailing principal submatrix to
*                 .    get more. (Since NS.LE.NSMAX.LE.(N-3)/6,
*                 .    there is enough space below the subdiagonal
*                 .    to fit an NS-by-NS scratch array.) ====
*
                  IF( kbot-ks+1.LE.ns / 2 ) THEN
                     ks = kbot - ns + 1
                     kt = n - ns + 1
                     CALL dlacpy( 'A', ns, ns, h( ks, ks ), ldh,
     $                            h( kt, 1 ), ldh )
                     IF( ns.GT.nmin ) THEN
                        CALL dlaqr4( .false., .false., ns, 1, ns,
     $                               h( kt, 1 ), ldh, wr( ks ),
     $                               wi( ks ), 1, 1, zdum, 1, work,
     $                               lwork, inf )
                     ELSE
                        CALL dlahqr( .false., .false., ns, 1, ns,
     $                               h( kt, 1 ), ldh, wr( ks ),
     $                               wi( ks ), 1, 1, zdum, 1, inf )
                     END IF
*
*                    ==== NOTE(review): INF is the INFO value from
*                    .    the call above; advancing KS by it
*                    .    presumably skips the entries that did
*                    .    not converge -- confirm against the
*                    .    DLAHQR/DLAQR4 INFO documentation. ====
*
                     ks = ks + inf
*
*                    ==== In case of a rare QR failure use
*                    .    eigenvalues of the trailing 2-by-2
*                    .    principal submatrix.  ====
*
                     IF( ks.GE.kbot ) THEN
                        aa = h( kbot-1, kbot-1 )
                        cc = h( kbot, kbot-1 )
                        bb = h( kbot-1, kbot )
                        dd = h( kbot, kbot )
                        CALL dlanv2( aa, bb, cc, dd, wr( kbot-1 ),
     $                               wi( kbot-1 ), wr( kbot ),
     $                               wi( kbot ), cs, sn )
                        ks = kbot - 1
                     END IF
                  END IF
*
                  IF( kbot-ks+1.GT.ns ) THEN
*
*                    ==== Sort the shifts (Helps a little)
*                    .    Bubble sort keeps complex conjugate
*                    .    pairs together. ====
*
*                    ==== Entries are ordered by decreasing
*                    .    ABS(WR)+ABS(WI); the outer loop exits
*                    .    early once a pass makes no swap. ====
*
                     sorted = .false.
                     DO 50 k = kbot, ks + 1, -1
                        IF( sorted )
     $                     GO TO 60
                        sorted = .true.
                        DO 40 i = ks, k - 1
                           IF( abs( wr( i ) )+abs( wi( i ) ).LT.
     $                         abs( wr( i+1 ) )+abs( wi( i+1 ) ) ) THEN
                              sorted = .false.
*
                              swap = wr( i )
                              wr( i ) = wr( i+1 )
                              wr( i+1 ) = swap
*
                              swap = wi( i )
                              wi( i ) = wi( i+1 )
                              wi( i+1 ) = swap
                           END IF
   40                   CONTINUE
   50                CONTINUE
   60                CONTINUE
                  END IF
*
*                 ==== Shuffle shifts into pairs of real shifts
*                 .    and pairs of complex conjugate shifts
*                 .    assuming complex conjugate shifts are
*                 .    already adjacent to one another. (Yes,
*                 .    they are.)  ====
*
                  DO 70 i = kbot, ks + 2, -2
                     IF( wi( i ).NE.-wi( i-1 ) ) THEN
*
                        swap = wr( i )
                        wr( i ) = wr( i-1 )
                        wr( i-1 ) = wr( i-2 )
                        wr( i-2 ) = swap
*
                        swap = wi( i )
                        wi( i ) = wi( i-1 )
                        wi( i-1 ) = wi( i-2 )
                        wi( i-2 ) = swap
                     END IF
   70             CONTINUE
               END IF
*
*              ==== If there are only two shifts and both are
*              .    real, then use only one.  ====
*
*              ==== The one kept is whichever is closer to
*              .    H(KBOT,KBOT); it is stored in both slots. ====
*
               IF( kbot-ks+1.EQ.2 ) THEN
                  IF( wi( kbot ).EQ.zero ) THEN
                     IF( abs( wr( kbot )-h( kbot, kbot ) ).LT.
     $                   abs( wr( kbot-1 )-h( kbot, kbot ) ) ) THEN
                        wr( kbot-1 ) = wr( kbot )
                     ELSE
                        wr( kbot ) = wr( kbot-1 )
                     END IF
                  END IF
               END IF
*
*              ==== Use up to NS of the smallest magnitude
*              .    shifts.  If there aren't NS shifts available,
*              .    then use them all, possibly dropping one to
*              .    make the number of shifts even. ====
*
               ns = min( ns, kbot-ks+1 )
               ns = ns - mod( ns, 2 )
               ks = kbot - ns + 1
*
*              ==== Small-bulge multi-shift QR sweep:
*              .    split workspace under the subdiagonal into
*              .    - a KDU-by-KDU work array U in the lower
*              .      left-hand-corner,
*              .    - a KDU-by-at-least-KDU-but-more-is-better
*              .      (KDU-by-NHO) horizontal work array WH along
*              .      the bottom edge,
*              .    - and an at-least-KDU-but-more-is-better-by-KDU
*              .      (NVE-by-KDU) vertical work array WV along
*              .      the left-hand-edge. ====
*
               kdu = 2*ns
               ku = n - kdu + 1
               kwh = kdu + 1
               nho = ( n-kdu+1-4 ) - ( kdu+1 ) + 1
               kwv = kdu + 4
               nve = n - kdu - kwv + 1
*
*              ==== Small-bulge multi-shift QR sweep ====
*
               CALL dlaqr5( wantt, wantz, kacc22, n, ktop, kbot, ns,
     $                      wr( ks ), wi( ks ), h, ldh, iloz, ihiz, z,
     $                      ldz, work, 3, h( ku, 1 ), ldh, nve,
     $                      h( kwv, 1 ), ldh, nho, h( ku, kwh ), ldh )
            END IF
*
*           ==== Note progress (or the lack of it). ====
*
            IF( ld.GT.0 ) THEN
               ndfl = 1
            ELSE
               ndfl = ndfl + 1
            END IF
*
*           ==== End of main loop ====
   80    CONTINUE
*
*        ==== Iteration limit exceeded.  Set INFO to show where
*        .    the problem occurred and exit. ====
*
*        ==== Normal completion jumps straight to label 90 and
*        .    so bypasses this assignment, leaving INFO = 0. ====
*
         info = kbot
   90    CONTINUE
      END IF
*
*     ==== Return the optimal value of LWORK. ====
*
      work( 1 ) = dble( lwkopt )
*
*     ==== End of DLAQR0 ====
*

◆ dlaqr1()

subroutine dlaqr1	(	integer	n,
		double precision, dimension( ldh, * )	h,
		integer	ldh,
		double precision	sr1,
		double precision	si1,
		double precision	sr2,
		double precision	si2,
		double precision, dimension( * )	v )

DLAQR1 sets a scalar multiple of the first column of the product of 2-by-2 or 3-by-3 matrix H and specified shifts.

Download DLAQR1 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!>      Given a 2-by-2 or 3-by-3 matrix H, DLAQR1 sets v to a
!>      scalar multiple of the first column of the product
!>
!>      (*)  K = (H - (sr1 + i*si1)*I)*(H - (sr2 + i*si2)*I)
!>
!>      scaling to avoid overflows and most underflows. It
!>      is assumed that either
!>
!>              1) sr1 = sr2 and si1 = -si2
!>          or
!>              2) si1 = si2 = 0.
!>
!>      This is useful for starting double implicit shift bulges
!>      in the QR algorithm.
!>

Parameters

[in]	N	!> N is INTEGER !> Order of the matrix H. N must be either 2 or 3. !>
[in]	H	!> H is DOUBLE PRECISION array, dimension (LDH,N) !> The 2-by-2 or 3-by-3 matrix H in (*). !>
[in]	LDH	!> LDH is INTEGER !> The leading dimension of H as declared in !> the calling procedure. LDH >= N !>
[in]	SR1	!> SR1 is DOUBLE PRECISION !>
[in]	SI1	!> SI1 is DOUBLE PRECISION !>
[in]	SR2	!> SR2 is DOUBLE PRECISION !>
[in]	SI2	!> SI2 is DOUBLE PRECISION !> The shifts in (*). !>
[out]	V	!> V is DOUBLE PRECISION array, dimension (N) !> A scalar multiple of the first column of the !> matrix K in (*). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Karen Braman and Ralph Byers, Department of Mathematics, University of Kansas, USA

Definition at line 120 of file dlaqr1.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Forms in V a scaled copy of the first column of
*        ( H - (SR1 + i*SI1)*I ) * ( H - (SR2 + i*SI2)*I )
*     for a 2-by-2 or 3-by-3 matrix H.  Every term is divided by
*     the scale factor SCL exactly once; when SCL is zero, V is
*     set to zero.  For any other order N, V is left untouched.
*
*     .. Scalar Arguments ..
      INTEGER            LDH, N
      DOUBLE PRECISION   SR1, SI1, SR2, SI2
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   V( * ), H( LDH, * )
*     ..
*
*  ================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO
      parameter( zero = 0.0d0 )
*     ..
*     .. Local Scalars ..
*     SCL  = sum of absolute values used as the scale factor
*     SUB2 = H(2,1) / SCL,  SUB3 = H(3,1) / SCL
      DOUBLE PRECISION   SCL, SUB2, SUB3
      INTEGER            J
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs
*     ..
*     .. Executable Statements ..
*
*     Only orders 2 and 3 are supported.
*
      IF( n.LT.2 .OR. n.GT.3 ) RETURN
*
*     Scale factor: the terms shared by both orders first, then
*     the extra subdiagonal entry of the 3-by-3 case.
*
      scl = abs( h( 1, 1 )-sr2 ) + abs( si2 ) + abs( h( 2, 1 ) )
      IF( n.EQ.3 ) scl = scl + abs( h( 3, 1 ) )
*
*     A zero scale factor yields a zero vector.
*
      IF( scl.EQ.zero ) THEN
         DO 10 j = 1, n
            v( j ) = zero
   10    CONTINUE
         RETURN
      END IF
*
      sub2 = h( 2, 1 ) / scl
      IF( n.EQ.2 ) THEN
*
*        2-by-2 case
*
         v( 1 ) = sub2*h( 1, 2 ) + ( h( 1, 1 )-sr1 )*
     $            ( ( h( 1, 1 )-sr2 ) / scl ) - si1*( si2 / scl )
         v( 2 ) = sub2*( h( 1, 1 )+h( 2, 2 )-sr1-sr2 )
      ELSE
*
*        3-by-3 case
*
         sub3 = h( 3, 1 ) / scl
         v( 1 ) = ( h( 1, 1 )-sr1 )*( ( h( 1, 1 )-sr2 ) / scl ) -
     $            si1*( si2 / scl ) + h( 1, 2 )*sub2 +
     $            h( 1, 3 )*sub3
         v( 2 ) = sub2*( h( 1, 1 )+h( 2, 2 )-sr1-sr2 ) +
     $            h( 2, 3 )*sub3
         v( 3 ) = sub3*( h( 1, 1 )+h( 3, 3 )-sr1-sr2 ) +
     $            sub2*h( 3, 2 )
      END IF

◆ dlaqr2()

subroutine dlaqr2	(	logical	wantt,
		logical	wantz,
		integer	n,
		integer	ktop,
		integer	kbot,
		integer	nw,
		double precision, dimension( ldh, * )	h,
		integer	ldh,
		integer	iloz,
		integer	ihiz,
		double precision, dimension( ldz, * )	z,
		integer	ldz,
		integer	ns,
		integer	nd,
		double precision, dimension( * )	sr,
		double precision, dimension( * )	si,
		double precision, dimension( ldv, * )	v,
		integer	ldv,
		integer	nh,
		double precision, dimension( ldt, * )	t,
		integer	ldt,
		integer	nv,
		double precision, dimension( ldwv, * )	wv,
		integer	ldwv,
		double precision, dimension( * )	work,
		integer	lwork )

DLAQR2 performs the orthogonal similarity transformation of a Hessenberg matrix to detect and deflate fully converged eigenvalues from a trailing principal submatrix (aggressive early deflation).

Download DLAQR2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!>    DLAQR2 is identical to DLAQR3 except that it avoids
!>    recursion by calling DLAHQR instead of DLAQR4.
!>
!>    Aggressive early deflation:
!>
!>    This subroutine accepts as input an upper Hessenberg matrix
!>    H and performs an orthogonal similarity transformation
!>    designed to detect and deflate fully converged eigenvalues from
!>    a trailing principal submatrix.  On output H has been over-
!>    written by a new Hessenberg matrix that is a perturbation of
!>    an orthogonal similarity transformation of H.  It is to be
!>    hoped that the final version of H has many zero subdiagonal
!>    entries.
!>

Parameters

[in]	WANTT	!> WANTT is LOGICAL !> If .TRUE., then the Hessenberg matrix H is fully updated !> so that the quasi-triangular Schur factor may be !> computed (in cooperation with the calling subroutine). !> If .FALSE., then only enough of H is updated to preserve !> the eigenvalues. !>
[in]	WANTZ	!> WANTZ is LOGICAL !> If .TRUE., then the orthogonal matrix Z is updated !> so that the orthogonal Schur factor may be computed !> (in cooperation with the calling subroutine). !> If .FALSE., then Z is not referenced. !>
[in]	N	!> N is INTEGER !> The order of the matrix H and (if WANTZ is .TRUE.) the !> order of the orthogonal matrix Z. !>
[in]	KTOP	!> KTOP is INTEGER !> It is assumed that either KTOP = 1 or H(KTOP,KTOP-1)=0. !> KBOT and KTOP together determine an isolated block !> along the diagonal of the Hessenberg matrix. !>
[in]	KBOT	!> KBOT is INTEGER !> It is assumed without a check that either !> KBOT = N or H(KBOT+1,KBOT)=0. KBOT and KTOP together !> determine an isolated block along the diagonal of the !> Hessenberg matrix. !>
[in]	NW	!> NW is INTEGER !> Deflation window size. 1 <= NW <= (KBOT-KTOP+1). !>
[in,out]	H	!> H is DOUBLE PRECISION array, dimension (LDH,N) !> On input the initial N-by-N section of H stores the !> Hessenberg matrix undergoing aggressive early deflation. !> On output H has been transformed by an orthogonal !> similarity transformation, perturbed, and then returned !> to Hessenberg form that (it is to be hoped) has some !> zero subdiagonal entries. !>
[in]	LDH	!> LDH is INTEGER !> Leading dimension of H just as declared in the calling !> subroutine. N <= LDH !>
[in]	ILOZ	!> ILOZ is INTEGER !>
[in]	IHIZ	!> IHIZ is INTEGER !> Specify the rows of Z to which transformations must be !> applied if WANTZ is .TRUE.. 1 <= ILOZ <= IHIZ <= N. !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, dimension (LDZ,N) !> IF WANTZ is .TRUE., then on output, the orthogonal !> similarity transformation mentioned above has been !> accumulated into Z(ILOZ:IHIZ,ILOZ:IHIZ) from the right. !> If WANTZ is .FALSE., then Z is unreferenced. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of Z just as declared in the !> calling subroutine. 1 <= LDZ. !>
[out]	NS	!> NS is INTEGER !> The number of unconverged (ie approximate) eigenvalues !> returned in SR and SI that may be used as shifts by the !> calling subroutine. !>
[out]	ND	!> ND is INTEGER !> The number of converged eigenvalues uncovered by this !> subroutine. !>
[out]	SR	!> SR is DOUBLE PRECISION array, dimension (KBOT) !>
[out]	SI	!> SI is DOUBLE PRECISION array, dimension (KBOT) !> On output, the real and imaginary parts of approximate !> eigenvalues that may be used for shifts are stored in !> SR(KBOT-ND-NS+1) through SR(KBOT-ND) and !> SI(KBOT-ND-NS+1) through SI(KBOT-ND), respectively. !> The real and imaginary parts of converged eigenvalues !> are stored in SR(KBOT-ND+1) through SR(KBOT) and !> SI(KBOT-ND+1) through SI(KBOT), respectively. !>
[out]	V	!> V is DOUBLE PRECISION array, dimension (LDV,NW) !> An NW-by-NW work array. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of V just as declared in the !> calling subroutine. NW <= LDV !>
[in]	NH	!> NH is INTEGER !> The number of columns of T. NH >= NW. !>
[out]	T	!> T is DOUBLE PRECISION array, dimension (LDT,NW) !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of T just as declared in the !> calling subroutine. NW <= LDT !>
[in]	NV	!> NV is INTEGER !> The number of rows of work array WV available for !> workspace. NV >= NW. !>
[out]	WV	!> WV is DOUBLE PRECISION array, dimension (LDWV,NW) !>
[in]	LDWV	!> LDWV is INTEGER !> The leading dimension of WV just as declared in the !> calling subroutine. NW <= LDWV !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (LWORK) !> On exit, WORK(1) is set to an estimate of the optimal value !> of LWORK for the given values of N, NW, KTOP and KBOT. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the work array WORK. LWORK = 2*NW !> suffices, but greater efficiency may result from larger !> values of LWORK. !> !> If LWORK = -1, then a workspace query is assumed; DLAQR2 !> only estimates the optimal workspace size for the given !> values of N, NW, KTOP and KBOT. The estimate is returned !> in WORK(1). No error message related to LWORK is issued !> by XERBLA. Neither H nor Z are accessed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Karen Braman and Ralph Byers, Department of Mathematics, University of Kansas, USA

Definition at line 275 of file dlaqr2.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            IHIZ, ILOZ, KBOT, KTOP, LDH, LDT, LDV, LDWV,
     $                   LDZ, LWORK, N, ND, NH, NS, NV, NW
      LOGICAL            WANTT, WANTZ
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   H( LDH, * ), SI( * ), SR( * ), T( LDT, * ),
     $                   V( LDV, * ), WORK( * ), WV( LDWV, * ),
     $                   Z( LDZ, * )
*     ..
*
*  ================================================================
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d0, one = 1.0d0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   AA, BB, BETA, CC, CS, DD, EVI, EVK, FOO, S,
     $                   SAFMAX, SAFMIN, SMLNUM, SN, TAU, ULP
      INTEGER            I, IFST, ILST, INFO, INFQR, J, JW, K, KCOL,
     $                   KEND, KLN, KROW, KWTOP, LTOP, LWK1, LWK2,
     $                   LWKOPT
      LOGICAL            BULGE, SORTED
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           dlamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dgehrd, dgemm, dlabad, dlacpy, dlahqr,
     $                   dlanv2, dlarf, dlarfg, dlaset, dormhr, dtrexc
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, dble, int, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     ==== Estimate optimal workspace. ====
*
      jw = min( nw, kbot-ktop+1 )
      IF( jw.LE.2 ) THEN
         lwkopt = 1
      ELSE
*
*        ==== Workspace query call to DGEHRD ====
*
         CALL dgehrd( jw, 1, jw-1, t, ldt, work, work, -1, info )
         lwk1 = int( work( 1 ) )
*
*        ==== Workspace query call to DORMHR ====
*
         CALL dormhr( 'R', 'N', jw, jw, 1, jw-1, t, ldt, work, v, ldv,
     $                work, -1, info )
         lwk2 = int( work( 1 ) )
*
*        ==== Optimal workspace ====
*
         lwkopt = jw + max( lwk1, lwk2 )
      END IF
*
*     ==== Quick return in case of workspace query. ====
*
      IF( lwork.EQ.-1 ) THEN
         work( 1 ) = dble( lwkopt )
         RETURN
      END IF
*
*     ==== Nothing to do ...
*     ... for an empty active block ... ====
      ns = 0
      nd = 0
      work( 1 ) = one
      IF( ktop.GT.kbot )
     $   RETURN
*     ... nor for an empty deflation window. ====
      IF( nw.LT.1 )
     $   RETURN
*
*     ==== Machine constants ====
*
      safmin = dlamch( 'SAFE MINIMUM' )
      safmax = one / safmin
      CALL dlabad( safmin, safmax )
      ulp = dlamch( 'PRECISION' )
      smlnum = safmin*( dble( n ) / ulp )
*
*     ==== Setup deflation window ====
*
      jw = min( nw, kbot-ktop+1 )
      kwtop = kbot - jw + 1
      IF( kwtop.EQ.ktop ) THEN
         s = zero
      ELSE
         s = h( kwtop, kwtop-1 )
      END IF
*
      IF( kbot.EQ.kwtop ) THEN
*
*        ==== 1-by-1 deflation window: not much to do ====
*
         sr( kwtop ) = h( kwtop, kwtop )
         si( kwtop ) = zero
         ns = 1
         nd = 0
         IF( abs( s ).LE.max( smlnum, ulp*abs( h( kwtop, kwtop ) ) ) )
     $        THEN
            ns = 0
            nd = 1
            IF( kwtop.GT.ktop )
     $         h( kwtop, kwtop-1 ) = zero
         END IF
         work( 1 ) = one
         RETURN
      END IF
*
*     ==== Convert to spike-triangular form.  (In case of a
*     .    rare QR failure, this routine continues to do
*     .    aggressive early deflation using that part of
*     .    the deflation window that converged using INFQR
*     .    here and there to keep track.) ====
*
      CALL dlacpy( 'U', jw, jw, h( kwtop, kwtop ), ldh, t, ldt )
      CALL dcopy( jw-1, h( kwtop+1, kwtop ), ldh+1, t( 2, 1 ), ldt+1 )
*
      CALL dlaset( 'A', jw, jw, zero, one, v, ldv )
      CALL dlahqr( .true., .true., jw, 1, jw, t, ldt, sr( kwtop ),
     $             si( kwtop ), 1, jw, v, ldv, infqr )
*
*     ==== DTREXC needs a clean margin near the diagonal ====
*
      DO 10 j = 1, jw - 3
         t( j+2, j ) = zero
         t( j+3, j ) = zero
   10 CONTINUE
      IF( jw.GT.2 )
     $   t( jw, jw-2 ) = zero
*
*     ==== Deflation detection loop ====
*
      ns = jw
      ilst = infqr + 1
   20 CONTINUE
      IF( ilst.LE.ns ) THEN
         IF( ns.EQ.1 ) THEN
            bulge = .false.
         ELSE
            bulge = t( ns, ns-1 ).NE.zero
         END IF
*
*        ==== Small spike tip test for deflation ====
*
         IF( .NOT.bulge ) THEN
*
*           ==== Real eigenvalue ====
*
            foo = abs( t( ns, ns ) )
            IF( foo.EQ.zero )
     $         foo = abs( s )
            IF( abs( s*v( 1, ns ) ).LE.max( smlnum, ulp*foo ) ) THEN
*
*              ==== Deflatable ====
*
               ns = ns - 1
            ELSE
*
*              ==== Undeflatable.   Move it up out of the way.
*              .    (DTREXC can not fail in this case.) ====
*
               ifst = ns
               CALL dtrexc( 'V', jw, t, ldt, v, ldv, ifst, ilst, work,
     $                      info )
               ilst = ilst + 1
            END IF
         ELSE
*
*           ==== Complex conjugate pair ====
*
            foo = abs( t( ns, ns ) ) + sqrt( abs( t( ns, ns-1 ) ) )*
     $            sqrt( abs( t( ns-1, ns ) ) )
            IF( foo.EQ.zero )
     $         foo = abs( s )
            IF( max( abs( s*v( 1, ns ) ), abs( s*v( 1, ns-1 ) ) ).LE.
     $          max( smlnum, ulp*foo ) ) THEN
*
*              ==== Deflatable ====
*
               ns = ns - 2
            ELSE
*
*              ==== Undeflatable. Move them up out of the way.
*              .    Fortunately, DTREXC does the right thing with
*              .    ILST in case of a rare exchange failure. ====
*
               ifst = ns
               CALL dtrexc( 'V', jw, t, ldt, v, ldv, ifst, ilst, work,
     $                      info )
               ilst = ilst + 2
            END IF
         END IF
*
*        ==== End deflation detection loop ====
*
         GO TO 20
      END IF
*
*        ==== Return to Hessenberg form ====
*
      IF( ns.EQ.0 )
     $   s = zero
*
      IF( ns.LT.jw ) THEN
*
*        ==== sorting diagonal blocks of T improves accuracy for
*        .    graded matrices.  Bubble sort deals well with
*        .    exchange failures. ====
*
         sorted = .false.
         i = ns + 1
   30    CONTINUE
         IF( sorted )
     $      GO TO 50
         sorted = .true.
*
         kend = i - 1
         i = infqr + 1
         IF( i.EQ.ns ) THEN
            k = i + 1
         ELSE IF( t( i+1, i ).EQ.zero ) THEN
            k = i + 1
         ELSE
            k = i + 2
         END IF
   40    CONTINUE
         IF( k.LE.kend ) THEN
            IF( k.EQ.i+1 ) THEN
               evi = abs( t( i, i ) )
            ELSE
               evi = abs( t( i, i ) ) + sqrt( abs( t( i+1, i ) ) )*
     $               sqrt( abs( t( i, i+1 ) ) )
            END IF
*
            IF( k.EQ.kend ) THEN
               evk = abs( t( k, k ) )
            ELSE IF( t( k+1, k ).EQ.zero ) THEN
               evk = abs( t( k, k ) )
            ELSE
               evk = abs( t( k, k ) ) + sqrt( abs( t( k+1, k ) ) )*
     $               sqrt( abs( t( k, k+1 ) ) )
            END IF
*
            IF( evi.GE.evk ) THEN
               i = k
            ELSE
               sorted = .false.
               ifst = i
               ilst = k
               CALL dtrexc( 'V', jw, t, ldt, v, ldv, ifst, ilst, work,
     $                      info )
               IF( info.EQ.0 ) THEN
                  i = ilst
               ELSE
                  i = k
               END IF
            END IF
            IF( i.EQ.kend ) THEN
               k = i + 1
            ELSE IF( t( i+1, i ).EQ.zero ) THEN
               k = i + 1
            ELSE
               k = i + 2
            END IF
            GO TO 40
         END IF
         GO TO 30
   50    CONTINUE
      END IF
*
*     ==== Restore shift/eigenvalue array from T ====
*
      i = jw
   60 CONTINUE
      IF( i.GE.infqr+1 ) THEN
         IF( i.EQ.infqr+1 ) THEN
            sr( kwtop+i-1 ) = t( i, i )
            si( kwtop+i-1 ) = zero
            i = i - 1
         ELSE IF( t( i, i-1 ).EQ.zero ) THEN
            sr( kwtop+i-1 ) = t( i, i )
            si( kwtop+i-1 ) = zero
            i = i - 1
         ELSE
            aa = t( i-1, i-1 )
            cc = t( i, i-1 )
            bb = t( i-1, i )
            dd = t( i, i )
            CALL dlanv2( aa, bb, cc, dd, sr( kwtop+i-2 ),
     $                   si( kwtop+i-2 ), sr( kwtop+i-1 ),
     $                   si( kwtop+i-1 ), cs, sn )
            i = i - 2
         END IF
         GO TO 60
      END IF
*
      IF( ns.LT.jw .OR. s.EQ.zero ) THEN
         IF( ns.GT.1 .AND. s.NE.zero ) THEN
*
*           ==== Reflect spike back into lower triangle ====
*
            CALL dcopy( ns, v, ldv, work, 1 )
            beta = work( 1 )
            CALL dlarfg( ns, beta, work( 2 ), 1, tau )
            work( 1 ) = one
*
            CALL dlaset( 'L', jw-2, jw-2, zero, zero, t( 3, 1 ), ldt )
*
            CALL dlarf( 'L', ns, jw, work, 1, tau, t, ldt,
     $                  work( jw+1 ) )
            CALL dlarf( 'R', ns, ns, work, 1, tau, t, ldt,
     $                  work( jw+1 ) )
            CALL dlarf( 'R', jw, ns, work, 1, tau, v, ldv,
     $                  work( jw+1 ) )
*
            CALL dgehrd( jw, 1, ns, t, ldt, work, work( jw+1 ),
     $                   lwork-jw, info )
         END IF
*
*        ==== Copy updated reduced window into place ====
*
         IF( kwtop.GT.1 )
     $      h( kwtop, kwtop-1 ) = s*v( 1, 1 )
         CALL dlacpy( 'U', jw, jw, t, ldt, h( kwtop, kwtop ), ldh )
         CALL dcopy( jw-1, t( 2, 1 ), ldt+1, h( kwtop+1, kwtop ),
     $               ldh+1 )
*
*        ==== Accumulate orthogonal matrix in order update
*        .    H and Z, if requested.  ====
*
         IF( ns.GT.1 .AND. s.NE.zero )
     $      CALL dormhr( 'R', 'N', jw, ns, 1, ns, t, ldt, work, v, ldv,
     $                   work( jw+1 ), lwork-jw, info )
*
*        ==== Update vertical slab in H ====
*
         IF( wantt ) THEN
            ltop = 1
         ELSE
            ltop = ktop
         END IF
         DO 70 krow = ltop, kwtop - 1, nv
            kln = min( nv, kwtop-krow )
            CALL dgemm( 'N', 'N', kln, jw, jw, one, h( krow, kwtop ),
     $                  ldh, v, ldv, zero, wv, ldwv )
            CALL dlacpy( 'A', kln, jw, wv, ldwv, h( krow, kwtop ), ldh )
   70    CONTINUE
*
*        ==== Update horizontal slab in H ====
*
         IF( wantt ) THEN
            DO 80 kcol = kbot + 1, n, nh
               kln = min( nh, n-kcol+1 )
               CALL dgemm( 'C', 'N', jw, kln, jw, one, v, ldv,
     $                     h( kwtop, kcol ), ldh, zero, t, ldt )
               CALL dlacpy( 'A', jw, kln, t, ldt, h( kwtop, kcol ),
     $                      ldh )
   80       CONTINUE
         END IF
*
*        ==== Update vertical slab in Z ====
*
         IF( wantz ) THEN
            DO 90 krow = iloz, ihiz, nv
               kln = min( nv, ihiz-krow+1 )
               CALL dgemm( 'N', 'N', kln, jw, jw, one, z( krow, kwtop ),
     $                     ldz, v, ldv, zero, wv, ldwv )
               CALL dlacpy( 'A', kln, jw, wv, ldwv, z( krow, kwtop ),
     $                      ldz )
   90       CONTINUE
         END IF
      END IF
*
*     ==== Return the number of deflations ... ====
*
      nd = jw - ns
*
*     ==== ... and the number of shifts. (Subtracting
*     .    INFQR from the spike length takes care
*     .    of the case of a rare QR failure while
*     .    calculating eigenvalues of the deflation
*     .    window.)  ====
*
      ns = ns - infqr
*
*      ==== Return optimal workspace. ====
*
      work( 1 ) = dble( lwkopt )
*
*     ==== End of DLAQR2 ====
*

◆ dlaqr3()

subroutine dlaqr3	(	logical	wantt,
		logical	wantz,
		integer	n,
		integer	ktop,
		integer	kbot,
		integer	nw,
		double precision, dimension( ldh, * )	h,
		integer	ldh,
		integer	iloz,
		integer	ihiz,
		double precision, dimension( ldz, * )	z,
		integer	ldz,
		integer	ns,
		integer	nd,
		double precision, dimension( * )	sr,
		double precision, dimension( * )	si,
		double precision, dimension( ldv, * )	v,
		integer	ldv,
		integer	nh,
		double precision, dimension( ldt, * )	t,
		integer	ldt,
		integer	nv,
		double precision, dimension( ldwv, * )	wv,
		integer	ldwv,
		double precision, dimension( * )	work,
		integer	lwork )

DLAQR3 performs the orthogonal similarity transformation of a Hessenberg matrix to detect and deflate fully converged eigenvalues from a trailing principal submatrix (aggressive early deflation).

Download DLAQR3 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!>    Aggressive early deflation:
!>
!>    DLAQR3 accepts as input an upper Hessenberg matrix
!>    H and performs an orthogonal similarity transformation
!>    designed to detect and deflate fully converged eigenvalues from
!>    a trailing principal submatrix.  On output H has been over-
!>    written by a new Hessenberg matrix that is a perturbation of
!>    an orthogonal similarity transformation of H.  It is to be
!>    hoped that the final version of H has many zero subdiagonal
!>    entries.
!>

Parameters

[in]	WANTT	!> WANTT is LOGICAL !> If .TRUE., then the Hessenberg matrix H is fully updated !> so that the quasi-triangular Schur factor may be !> computed (in cooperation with the calling subroutine). !> If .FALSE., then only enough of H is updated to preserve !> the eigenvalues. !>
[in]	WANTZ	!> WANTZ is LOGICAL !> If .TRUE., then the orthogonal matrix Z is updated so !> that the orthogonal Schur factor may be computed !> (in cooperation with the calling subroutine). !> If .FALSE., then Z is not referenced. !>
[in]	N	!> N is INTEGER !> The order of the matrix H and (if WANTZ is .TRUE.) the !> order of the orthogonal matrix Z. !>
[in]	KTOP	!> KTOP is INTEGER !> It is assumed that either KTOP = 1 or H(KTOP,KTOP-1)=0. !> KBOT and KTOP together determine an isolated block !> along the diagonal of the Hessenberg matrix. !>
[in]	KBOT	!> KBOT is INTEGER !> It is assumed without a check that either !> KBOT = N or H(KBOT+1,KBOT)=0. KBOT and KTOP together !> determine an isolated block along the diagonal of the !> Hessenberg matrix. !>
[in]	NW	!> NW is INTEGER !> Deflation window size. 1 <= NW <= (KBOT-KTOP+1). !>
[in,out]	H	!> H is DOUBLE PRECISION array, dimension (LDH,N) !> On input the initial N-by-N section of H stores the !> Hessenberg matrix undergoing aggressive early deflation. !> On output H has been transformed by an orthogonal !> similarity transformation, perturbed, and then returned !> to a Hessenberg form that (it is to be hoped) has some !> zero subdiagonal entries. !>
[in]	LDH	!> LDH is INTEGER !> Leading dimension of H just as declared in the calling !> subroutine. N <= LDH !>
[in]	ILOZ	!> ILOZ is INTEGER !>
[in]	IHIZ	!> IHIZ is INTEGER !> Specify the rows of Z to which transformations must be !> applied if WANTZ is .TRUE.. 1 <= ILOZ <= IHIZ <= N. !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, dimension (LDZ,N) !> IF WANTZ is .TRUE., then on output, the orthogonal !> similarity transformation mentioned above has been !> accumulated into Z(ILOZ:IHIZ,ILOZ:IHIZ) from the right. !> If WANTZ is .FALSE., then Z is unreferenced. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of Z just as declared in the !> calling subroutine. 1 <= LDZ. !>
[out]	NS	!> NS is INTEGER !> The number of unconverged (i.e., approximate) eigenvalues !> returned in SR and SI that may be used as shifts by the !> calling subroutine. !>
[out]	ND	!> ND is INTEGER !> The number of converged eigenvalues uncovered by this !> subroutine. !>
[out]	SR	!> SR is DOUBLE PRECISION array, dimension (KBOT) !>
[out]	SI	!> SI is DOUBLE PRECISION array, dimension (KBOT) !> On output, the real and imaginary parts of approximate !> eigenvalues that may be used for shifts are stored in !> SR(KBOT-ND-NS+1) through SR(KBOT-ND) and !> SI(KBOT-ND-NS+1) through SI(KBOT-ND), respectively. !> The real and imaginary parts of converged eigenvalues !> are stored in SR(KBOT-ND+1) through SR(KBOT) and !> SI(KBOT-ND+1) through SI(KBOT), respectively. !>
[out]	V	!> V is DOUBLE PRECISION array, dimension (LDV,NW) !> An NW-by-NW work array. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of V just as declared in the !> calling subroutine. NW <= LDV !>
[in]	NH	!> NH is INTEGER !> The number of columns of T. NH >= NW. !>
[out]	T	!> T is DOUBLE PRECISION array, dimension (LDT,NW) !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of T just as declared in the !> calling subroutine. NW <= LDT !>
[in]	NV	!> NV is INTEGER !> The number of rows of work array WV available for !> workspace. NV >= NW. !>
[out]	WV	!> WV is DOUBLE PRECISION array, dimension (LDWV,NW) !>
[in]	LDWV	!> LDWV is INTEGER !> The leading dimension of WV just as declared in the !> calling subroutine. NW <= LDWV !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (LWORK) !> On exit, WORK(1) is set to an estimate of the optimal value !> of LWORK for the given values of N, NW, KTOP and KBOT. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the work array WORK. LWORK = 2*NW !> suffices, but greater efficiency may result from larger !> values of LWORK. !> !> If LWORK = -1, then a workspace query is assumed; DLAQR3 !> only estimates the optimal workspace size for the given !> values of N, NW, KTOP and KBOT. The estimate is returned !> in WORK(1). No error message related to LWORK is issued !> by XERBLA. Neither H nor Z are accessed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:: Karen Braman and Ralph Byers, Department of Mathematics, University of Kansas, USA

Definition at line 272 of file dlaqr3.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of DLAQR3 (aggressive early deflation).  Outline of the
*  code below:
*    1. Estimate the workspace by querying DGEHRD, DORMHR and
*       DLAQR4 with LWORK = -1; return at once if the caller
*       itself passed LWORK = -1.
*    2. Copy the trailing JW-by-JW deflation window of H into T
*       and reduce it with DLAQR4 (JW > NMIN) or DLAHQR, with
*       the transformation accumulated in V.
*    3. Scan the diagonal blocks of T from the bottom, lowering
*       NS by 1 or 2 whenever the spike entries S*V(1,.) pass
*       the small-spike test; blocks that fail are moved up
*       with DTREXC.
*    4. If something deflated or S is zero: sort the diagonal
*       blocks, rebuild SR/SI from T, restore Hessenberg form
*       when needed, copy T back into H and apply V to the
*       remaining parts of H and, if WANTZ, to Z.
*    5. Return ND = JW - NS, NS = NS - INFQR and put LWKOPT in
*       WORK(1).
*
*     .. Scalar Arguments ..
      INTEGER            IHIZ, ILOZ, KBOT, KTOP, LDH, LDT, LDV, LDWV,
     $                   LDZ, LWORK, N, ND, NH, NS, NV, NW
      LOGICAL            WANTT, WANTZ
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   H( LDH, * ), SI( * ), SR( * ), T( LDT, * ),
     $                   V( LDV, * ), WORK( * ), WV( LDWV, * ),
     $                   Z( LDZ, * )
*     ..
*
*  ================================================================
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d0, one = 1.0d0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   AA, BB, BETA, CC, CS, DD, EVI, EVK, FOO, S,
     $                   SAFMAX, SAFMIN, SMLNUM, SN, TAU, ULP
      INTEGER            I, IFST, ILST, INFO, INFQR, J, JW, K, KCOL,
     $                   KEND, KLN, KROW, KWTOP, LTOP, LWK1, LWK2, LWK3,
     $                   LWKOPT, NMIN
      LOGICAL            BULGE, SORTED
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH
      INTEGER            ILAENV
      EXTERNAL           dlamch, ilaenv
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dgehrd, dgemm, dlabad, dlacpy, dlahqr,
     $                   dlanv2, dlaqr4, dlarf, dlarfg, dlaset, dormhr,
     $                   dtrexc
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, dble, int, max, min, sqrt
*     ..
*     .. Executable Statements ..
*
*     ==== Estimate optimal workspace. ====
*
*     JW is the effective window size: NW clipped to the size of
*     the active block KTOP:KBOT.
*
      jw = min( nw, kbot-ktop+1 )
      IF( jw.LE.2 ) THEN
         lwkopt = 1
      ELSE
*
*        ==== Workspace query call to DGEHRD ====
*
         CALL dgehrd( jw, 1, jw-1, t, ldt, work, work, -1, info )
         lwk1 = int( work( 1 ) )
*
*        ==== Workspace query call to DORMHR ====
*
         CALL dormhr( 'R', 'N', jw, jw, 1, jw-1, t, ldt, work, v, ldv,
     $                work, -1, info )
         lwk2 = int( work( 1 ) )
*
*        ==== Workspace query call to DLAQR4 ====
*
         CALL dlaqr4( .true., .true., jw, 1, jw, t, ldt, sr, si, 1, jw,
     $                v, ldv, work, -1, infqr )
         lwk3 = int( work( 1 ) )
*
*        ==== Optimal workspace ====
*
*        The extra JW covers WORK(1:JW): the real DGEHRD and
*        DORMHR calls further down are handed WORK(JW+1) with
*        length LWORK-JW, whereas DLAQR4 gets all of WORK.
*
         lwkopt = max( jw+max( lwk1, lwk2 ), lwk3 )
      END IF
*
*     ==== Quick return in case of workspace query. ====
*
      IF( lwork.EQ.-1 ) THEN
         work( 1 ) = dble( lwkopt )
         RETURN
      END IF
*
*     ==== Nothing to do ...
*     ... for an empty active block ... ====
      ns = 0
      nd = 0
      work( 1 ) = one
      IF( ktop.GT.kbot )
     $   RETURN
*     ... nor for an empty deflation window. ====
      IF( nw.LT.1 )
     $   RETURN
*
*     ==== Machine constants ====
*
      safmin = dlamch( 'SAFE MINIMUM' )
      safmax = one / safmin
      CALL dlabad( safmin, safmax )
      ulp = dlamch( 'PRECISION' )
      smlnum = safmin*( dble( n ) / ulp )
*
*     ==== Setup deflation window ====
*
*     The window is rows/columns KWTOP:KBOT of H.  S is the
*     subdiagonal entry just left of the window; it is taken as
*     zero when the window starts at KTOP.
*
      jw = min( nw, kbot-ktop+1 )
      kwtop = kbot - jw + 1
      IF( kwtop.EQ.ktop ) THEN
         s = zero
      ELSE
         s = h( kwtop, kwtop-1 )
      END IF
*
      IF( kbot.EQ.kwtop ) THEN
*
*        ==== 1-by-1 deflation window: not much to do ====
*
*        The single diagonal entry is reported as a shift
*        (NS = 1) unless |S| is negligible, in which case it
*        counts as a deflation (ND = 1) and the subdiagonal
*        entry is set to zero.
*
         sr( kwtop ) = h( kwtop, kwtop )
         si( kwtop ) = zero
         ns = 1
         nd = 0
         IF( abs( s ).LE.max( smlnum, ulp*abs( h( kwtop, kwtop ) ) ) )
     $        THEN
            ns = 0
            nd = 1
            IF( kwtop.GT.ktop )
     $         h( kwtop, kwtop-1 ) = zero
         END IF
         work( 1 ) = one
         RETURN
      END IF
*
*     ==== Convert to spike-triangular form.  (In case of a
*     .    rare QR failure, this routine continues to do
*     .    aggressive early deflation using that part of
*     .    the deflation window that converged using INFQR
*     .    here and there to keep track.) ====
*
*     Copy the upper triangle of the window into T, then its
*     first subdiagonal (strides LDH+1 and LDT+1 step one row
*     down and one column right in H and T respectively).
*
      CALL dlacpy( 'U', jw, jw, h( kwtop, kwtop ), ldh, t, ldt )
      CALL dcopy( jw-1, h( kwtop+1, kwtop ), ldh+1, t( 2, 1 ), ldt+1 )
*
*     V starts as the identity.  NMIN (from ILAENV) selects
*     between DLAQR4 and DLAHQR for the window.
*
      CALL dlaset( 'A', jw, jw, zero, one, v, ldv )
      nmin = ilaenv( 12, 'DLAQR3', 'SV', jw, 1, jw, lwork )
      IF( jw.GT.nmin ) THEN
         CALL dlaqr4( .true., .true., jw, 1, jw, t, ldt, sr( kwtop ),
     $                si( kwtop ), 1, jw, v, ldv, work, lwork, infqr )
      ELSE
         CALL dlahqr( .true., .true., jw, 1, jw, t, ldt, sr( kwtop ),
     $                si( kwtop ), 1, jw, v, ldv, infqr )
      END IF
*
*     ==== DTREXC needs a clean margin near the diagonal ====
*
*     Zero the second and third subdiagonals of T.
*
      DO 10 j = 1, jw - 3
         t( j+2, j ) = zero
         t( j+3, j ) = zero
   10 CONTINUE
      IF( jw.GT.2 )
     $   t( jw, jw-2 ) = zero
*
*     ==== Deflation detection loop ====
*
*     NS is the current bottom of the undeflated part, ILST the
*     position the next undeflatable block is moved to.  The
*     loop (label 20) runs while ILST <= NS.
*
      ns = jw
      ilst = infqr + 1
   20 CONTINUE
      IF( ilst.LE.ns ) THEN
*
*        BULGE is true when the block ending at row NS is
*        2-by-2, i.e. T(NS,NS-1) is nonzero.
*
         IF( ns.EQ.1 ) THEN
            bulge = .false.
         ELSE
            bulge = t( ns, ns-1 ).NE.zero
         END IF
*
*        ==== Small spike tip test for deflation ====
*
         IF( .NOT. bulge ) THEN
*
*           ==== Real eigenvalue ====
*
*           FOO is the magnitude scale of the test: |T(NS,NS)|,
*           or |S| when that is exactly zero.
*
            foo = abs( t( ns, ns ) )
            IF( foo.EQ.zero )
     $         foo = abs( s )
            IF( abs( s*v( 1, ns ) ).LE.max( smlnum, ulp*foo ) ) THEN
*
*              ==== Deflatable ====
*
               ns = ns - 1
            ELSE
*
*              ==== Undeflatable.   Move it up out of the way.
*              .    (DTREXC can not fail in this case.) ====
*
               ifst = ns
               CALL dtrexc( 'V', jw, t, ldt, v, ldv, ifst, ilst, work,
     $                      info )
               ilst = ilst + 1
            END IF
         ELSE
*
*           ==== Complex conjugate pair ====
*
*           Same test as above, with a scale built from the
*           2-by-2 block and both spike entries checked.
*
            foo = abs( t( ns, ns ) ) + sqrt( abs( t( ns, ns-1 ) ) )*
     $            sqrt( abs( t( ns-1, ns ) ) )
            IF( foo.EQ.zero )
     $         foo = abs( s )
            IF( max( abs( s*v( 1, ns ) ), abs( s*v( 1, ns-1 ) ) ).LE.
     $          max( smlnum, ulp*foo ) ) THEN
*
*              ==== Deflatable ====
*
               ns = ns - 2
            ELSE
*
*              ==== Undeflatable. Move them up out of the way.
*              .    Fortunately, DTREXC does the right thing with
*              .    ILST in case of a rare exchange failure. ====
*
               ifst = ns
               CALL dtrexc( 'V', jw, t, ldt, v, ldv, ifst, ilst, work,
     $                      info )
               ilst = ilst + 2
            END IF
         END IF
*
*        ==== End deflation detection loop ====
*
         GO TO 20
      END IF
*
*        ==== Return to Hessenberg form ====
*
*     Nothing undeflated remains, so the spike is dropped.
*
      IF( ns.EQ.0 )
     $   s = zero
*
      IF( ns.LT.jw ) THEN
*
*        ==== sorting diagonal blocks of T improves accuracy for
*        .    graded matrices.  Bubble sort deals well with
*        .    exchange failures. ====
*
*        Label 30 starts one pass, label 40 steps through
*        adjacent blocks I and K of that pass, label 50 is the
*        exit once a pass made no swap.  EVI and EVK are
*        magnitude estimates of the two blocks; they are
*        swapped only when EVI < EVK.
*
         sorted = .false.
         i = ns + 1
   30    CONTINUE
         IF( sorted )
     $      GO TO 50
         sorted = .true.
*
         kend = i - 1
         i = infqr + 1
         IF( i.EQ.ns ) THEN
            k = i + 1
         ELSE IF( t( i+1, i ).EQ.zero ) THEN
            k = i + 1
         ELSE
            k = i + 2
         END IF
   40    CONTINUE
         IF( k.LE.kend ) THEN
            IF( k.EQ.i+1 ) THEN
               evi = abs( t( i, i ) )
            ELSE
               evi = abs( t( i, i ) ) + sqrt( abs( t( i+1, i ) ) )*
     $               sqrt( abs( t( i, i+1 ) ) )
            END IF
*
            IF( k.EQ.kend ) THEN
               evk = abs( t( k, k ) )
            ELSE IF( t( k+1, k ).EQ.zero ) THEN
               evk = abs( t( k, k ) )
            ELSE
               evk = abs( t( k, k ) ) + sqrt( abs( t( k+1, k ) ) )*
     $               sqrt( abs( t( k, k+1 ) ) )
            END IF
*
            IF( evi.GE.evk ) THEN
               i = k
            ELSE
               sorted = .false.
               ifst = i
               ilst = k
               CALL dtrexc( 'V', jw, t, ldt, v, ldv, ifst, ilst, work,
     $                      info )
*
*              On success continue from the position DTREXC
*              returned in ILST; on failure just step to K.
*
               IF( info.EQ.0 ) THEN
                  i = ilst
               ELSE
                  i = k
               END IF
            END IF
*
*           K is the start of the block following block I
*           (I+1 for a 1-by-1 block, I+2 for a 2-by-2 block).
*
            IF( i.EQ.kend ) THEN
               k = i + 1
            ELSE IF( t( i+1, i ).EQ.zero ) THEN
               k = i + 1
            ELSE
               k = i + 2
            END IF
            GO TO 40
         END IF
         GO TO 30
   50    CONTINUE
      END IF
*
*     ==== Restore shift/eigenvalue array from T ====
*
*     Walk I from JW down to INFQR+1.  A zero T(I,I-1) marks a
*     1-by-1 block (real eigenvalue); otherwise the 2-by-2 block
*     is passed to DLANV2, which fills two SR/SI entries.
*
      i = jw
   60 CONTINUE
      IF( i.GE.infqr+1 ) THEN
         IF( i.EQ.infqr+1 ) THEN
            sr( kwtop+i-1 ) = t( i, i )
            si( kwtop+i-1 ) = zero
            i = i - 1
         ELSE IF( t( i, i-1 ).EQ.zero ) THEN
            sr( kwtop+i-1 ) = t( i, i )
            si( kwtop+i-1 ) = zero
            i = i - 1
         ELSE
            aa = t( i-1, i-1 )
            cc = t( i, i-1 )
            bb = t( i-1, i )
            dd = t( i, i )
            CALL dlanv2( aa, bb, cc, dd, sr( kwtop+i-2 ),
     $                   si( kwtop+i-2 ), sr( kwtop+i-1 ),
     $                   si( kwtop+i-1 ), cs, sn )
            i = i - 2
         END IF
         GO TO 60
      END IF
*
*     H and Z are only touched if something deflated or the
*     spike is zero.
*
      IF( ns.LT.jw .OR. s.EQ.zero ) THEN
         IF( ns.GT.1 .AND. s.NE.zero ) THEN
*
*           ==== Reflect spike back into lower triangle ====
*
*           WORK(1:NS) receives the first row of V (DCOPY with
*           stride LDV); DLARFG turns it into a reflector whose
*           vector stays in WORK(1:NS).  WORK(JW+1:) is scratch
*           for DLARF and DGEHRD.
*
            CALL dcopy( ns, v, ldv, work, 1 )
            beta = work( 1 )
            CALL dlarfg( ns, beta, work( 2 ), 1, tau )
            work( 1 ) = one
*
            CALL dlaset( 'L', jw-2, jw-2, zero, zero, t( 3, 1 ), ldt )
*
            CALL dlarf( 'L', ns, jw, work, 1, tau, t, ldt,
     $                  work( jw+1 ) )
            CALL dlarf( 'R', ns, ns, work, 1, tau, t, ldt,
     $                  work( jw+1 ) )
            CALL dlarf( 'R', jw, ns, work, 1, tau, v, ldv,
     $                  work( jw+1 ) )
*
            CALL dgehrd( jw, 1, ns, t, ldt, work, work( jw+1 ),
     $                   lwork-jw, info )
         END IF
*
*        ==== Copy updated reduced window into place ====
*
         IF( kwtop.GT.1 )
     $      h( kwtop, kwtop-1 ) = s*v( 1, 1 )
         CALL dlacpy( 'U', jw, jw, t, ldt, h( kwtop, kwtop ), ldh )
         CALL dcopy( jw-1, t( 2, 1 ), ldt+1, h( kwtop+1, kwtop ),
     $               ldh+1 )
*
*        ==== Accumulate orthogonal matrix in order to update
*        .    H and Z, if requested.  ====
*
         IF( ns.GT.1 .AND. s.NE.zero )
     $      CALL dormhr( 'R', 'N', jw, ns, 1, ns, t, ldt, work, v, ldv,
     $                   work( jw+1 ), lwork-jw, info )
*
*        ==== Update vertical slab in H ====
*
*        Rows LTOP:KWTOP-1 of columns KWTOP:KBOT are multiplied
*        by V from the right, at most NV rows at a time, with
*        WV as the DGEMM output buffer.
*
         IF( wantt ) THEN
            ltop = 1
         ELSE
            ltop = ktop
         END IF
         DO 70 krow = ltop, kwtop - 1, nv
            kln = min( nv, kwtop-krow )
            CALL dgemm( 'N', 'N', kln, jw, jw, one, h( krow, kwtop ),
     $                  ldh, v, ldv, zero, wv, ldwv )
            CALL dlacpy( 'A', kln, jw, wv, ldwv, h( krow, kwtop ), ldh )
   70    CONTINUE
*
*        ==== Update horizontal slab in H ====
*
*        Columns KBOT+1:N of rows KWTOP:KBOT are multiplied by
*        V**T from the left, at most NH columns at a time.  T
*        is overwritten here as the DGEMM output buffer.
*
         IF( wantt ) THEN
            DO 80 kcol = kbot + 1, n, nh
               kln = min( nh, n-kcol+1 )
               CALL dgemm( 'C', 'N', jw, kln, jw, one, v, ldv,
     $                     h( kwtop, kcol ), ldh, zero, t, ldt )
               CALL dlacpy( 'A', jw, kln, t, ldt, h( kwtop, kcol ),
     $                      ldh )
   80       CONTINUE
         END IF
*
*        ==== Update vertical slab in Z ====
*
*        Rows ILOZ:IHIZ of columns KWTOP:KBOT of Z are
*        multiplied by V from the right, NV rows at a time.
*
         IF( wantz ) THEN
            DO 90 krow = iloz, ihiz, nv
               kln = min( nv, ihiz-krow+1 )
               CALL dgemm( 'N', 'N', kln, jw, jw, one, z( krow, kwtop ),
     $                     ldz, v, ldv, zero, wv, ldwv )
               CALL dlacpy( 'A', kln, jw, wv, ldwv, z( krow, kwtop ),
     $                      ldz )
   90       CONTINUE
         END IF
      END IF
*
*     ==== Return the number of deflations ... ====
*
      nd = jw - ns
*
*     ==== ... and the number of shifts. (Subtracting
*     .    INFQR from the spike length takes care
*     .    of the case of a rare QR failure while
*     .    calculating eigenvalues of the deflation
*     .    window.)  ====
*
      ns = ns - infqr
*
*     ==== Return optimal workspace. ====
*
      work( 1 ) = dble( lwkopt )
*
*     ==== End of DLAQR3 ====
*
*

◆ dlaqr4()

subroutine dlaqr4	(	logical	wantt,
		logical	wantz,
		integer	n,
		integer	ilo,
		integer	ihi,
		double precision, dimension( ldh, * )	h,
		integer	ldh,
		double precision, dimension( * )	wr,
		double precision, dimension( * )	wi,
		integer	iloz,
		integer	ihiz,
		double precision, dimension( ldz, * )	z,
		integer	ldz,
		double precision, dimension( * )	work,
		integer	lwork,
		integer	info )

DLAQR4 computes the eigenvalues of a Hessenberg matrix, and optionally the matrices from the Schur decomposition.

Download DLAQR4 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!>    DLAQR4 implements one level of recursion for DLAQR0.
!>    It is a complete implementation of the small bulge multi-shift
!>    QR algorithm.  It may be called by DLAQR0 and, for large enough
!>    deflation window size, it may be called by DLAQR3.  This
!>    subroutine is identical to DLAQR0 except that it calls DLAQR2
!>    instead of DLAQR3.
!>
!>    DLAQR4 computes the eigenvalues of a Hessenberg matrix H
!>    and, optionally, the matrices T and Z from the Schur decomposition
!>    H = Z T Z**T, where T is an upper quasi-triangular matrix (the
!>    Schur form), and Z is the orthogonal matrix of Schur vectors.
!>
!>    Optionally Z may be postmultiplied into an input orthogonal
!>    matrix Q so that this routine can give the Schur factorization
!>    of a matrix A which has been reduced to the Hessenberg form H
!>    by the orthogonal matrix Q:  A = Q*H*Q**T = (QZ)*T*(QZ)**T.
!>

Parameters

[in]	WANTT	!> WANTT is LOGICAL !> = .TRUE. : the full Schur form T is required; !> = .FALSE.: only eigenvalues are required. !>
[in]	WANTZ	!> WANTZ is LOGICAL !> = .TRUE. : the matrix of Schur vectors Z is required; !> = .FALSE.: Schur vectors are not required. !>
[in]	N	!> N is INTEGER !> The order of the matrix H. N >= 0. !>
[in]	ILO	!> ILO is INTEGER !>
[in]	IHI	!> IHI is INTEGER !> It is assumed that H is already upper triangular in rows !> and columns 1:ILO-1 and IHI+1:N and, if ILO > 1, !> H(ILO,ILO-1) is zero. ILO and IHI are normally set by a !> previous call to DGEBAL, and then passed to DGEHRD when the !> matrix output by DGEBAL is reduced to Hessenberg form. !> Otherwise, ILO and IHI should be set to 1 and N, !> respectively. If N > 0, then 1 <= ILO <= IHI <= N. !> If N = 0, then ILO = 1 and IHI = 0. !>
[in,out]	H	!> H is DOUBLE PRECISION array, dimension (LDH,N) !> On entry, the upper Hessenberg matrix H. !> On exit, if INFO = 0 and WANTT is .TRUE., then H contains !> the upper quasi-triangular matrix T from the Schur !> decomposition (the Schur form); 2-by-2 diagonal blocks !> (corresponding to complex conjugate pairs of eigenvalues) !> are returned in standard form, with H(i,i) = H(i+1,i+1) !> and H(i+1,i)*H(i,i+1) < 0. If INFO = 0 and WANTT is !> .FALSE., then the contents of H are unspecified on exit. !> (The output value of H when INFO > 0 is given under the !> description of INFO below.) !> !> This subroutine may explicitly set H(i,j) = 0 for i > j and !> j = 1, 2, ... ILO-1 or j = IHI+1, IHI+2, ... N. !>
[in]	LDH	!> LDH is INTEGER !> The leading dimension of the array H. LDH >= max(1,N). !>
[out]	WR	!> WR is DOUBLE PRECISION array, dimension (IHI) !>
[out]	WI	!> WI is DOUBLE PRECISION array, dimension (IHI) !> The real and imaginary parts, respectively, of the computed !> eigenvalues of H(ILO:IHI,ILO:IHI) are stored in WR(ILO:IHI) !> and WI(ILO:IHI). If two eigenvalues are computed as a !> complex conjugate pair, they are stored in consecutive !> elements of WR and WI, say the i-th and (i+1)th, with !> WI(i) > 0 and WI(i+1) < 0. If WANTT is .TRUE., then !> the eigenvalues are stored in the same order as on the !> diagonal of the Schur form returned in H, with !> WR(i) = H(i,i) and, if H(i:i+1,i:i+1) is a 2-by-2 diagonal !> block, WI(i) = sqrt(-H(i+1,i)*H(i,i+1)) and !> WI(i+1) = -WI(i). !>
[in]	ILOZ	!> ILOZ is INTEGER !>
[in]	IHIZ	!> IHIZ is INTEGER !> Specify the rows of Z to which transformations must be !> applied if WANTZ is .TRUE.. !> 1 <= ILOZ <= ILO; IHI <= IHIZ <= N. !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, dimension (LDZ,IHI) !> If WANTZ is .FALSE., then Z is not referenced. !> If WANTZ is .TRUE., then Z(ILO:IHI,ILOZ:IHIZ) is !> replaced by Z(ILO:IHI,ILOZ:IHIZ)*U where U is the !> orthogonal Schur factor of H(ILO:IHI,ILO:IHI). !> (The output value of Z when INFO > 0 is given under !> the description of INFO below.) !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. if WANTZ is .TRUE. !> then LDZ >= MAX(1,IHIZ). Otherwise, LDZ >= 1. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension LWORK !> On exit, if LWORK = -1, WORK(1) returns an estimate of !> the optimal value for LWORK. !>
[in]	LWORK	!> LWORK is INTEGER !> The dimension of the array WORK. LWORK >= max(1,N) !> is sufficient, but LWORK typically as large as 6*N may !> be required for optimal performance. A workspace query !> to determine the optimal workspace size is recommended. !> !> If LWORK = -1, then DLAQR4 does a workspace query. !> In this case, DLAQR4 checks the input parameters and !> estimates the optimal workspace size for the given !> values of N, ILO and IHI. The estimate is returned !> in WORK(1). No error message related to LWORK is !> issued by XERBLA. Neither H nor Z are accessed. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> > 0: if INFO = i, DLAQR4 failed to compute all of !> the eigenvalues. Elements 1:ilo-1 and i+1:n of WR !> and WI contain those eigenvalues which have been !> successfully computed. (Failures are rare.) !> !> If INFO > 0 and WANTT is .FALSE., then on exit, !> the remaining unconverged eigenvalues are the eigen- !> values of the upper Hessenberg matrix rows and !> columns ILO through INFO of the final, output !> value of H. !> !> If INFO > 0 and WANTT is .TRUE., then on exit !> !> (*) (initial value of H)*U = U*(final value of H) !> !> where U is an orthogonal matrix. The final !> value of H is upper Hessenberg and triangular in !> rows and columns INFO+1 through IHI. !> !> If INFO > 0 and WANTZ is .TRUE., then on exit !> !> (final value of Z(ILOZ:IHIZ,ILO:IHI)) !> = (initial value of Z(ILOZ:IHIZ,ILO:IHI))*U !> !> where U is the orthogonal matrix in (*) (regard- !> less of the value of WANTT.) !> !> If INFO > 0 and WANTZ is .FALSE., then Z is not !> accessed. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Karen Braman and Ralph Byers, Department of Mathematics, University of Kansas, USA

References:

K. Braman, R. Byers and R. Mathias, The Multi-Shift QR Algorithm Part I: Maintaining Well Focused Shifts, and Level 3 Performance, SIAM Journal of Matrix Analysis, volume 23, pages 929–947, 2002.

K. Braman, R. Byers and R. Mathias, The Multi-Shift QR Algorithm Part II: Aggressive Early Deflation, SIAM Journal of Matrix Analysis, volume 23, pages 948–973, 2002.

Definition at line 261 of file dlaqr4.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     ==== Overview of the body of DLAQR4:
*     .    - N = 0 returns immediately with WORK(1) = ONE.
*     .    - Matrices of order N .LE. NTINY are handed directly to
*     .      DLAHQR (unless this is a workspace query).
*     .    - Otherwise a loop of at most ITMAX iterations runs.  Each
*     .      iteration locates the active block
*     .      H(KTOP:KBOT,KTOP:KBOT), calls DLAQR2 (aggressive early
*     .      deflation) on a window at the bottom of that block and
*     .      then, unless the skip heuristic applies, selects shifts
*     .      and calls DLAQR5 (small-bulge multi-shift QR sweep).
*     .      Scratch arrays for both calls are sub-blocks of H itself
*     .      (offsets KV/KT/KWV and KU/KWH/KWV below).
*     .    - INFO stays 0 when KBOT drops below ILO; if the loop runs
*     .      out of iterations INFO is set to KBOT.
*     .    - On the normal exit path WORK(1) is set to LWKOPT. ====
*
*     .. Scalar Arguments ..
      INTEGER            IHI, IHIZ, ILO, ILOZ, INFO, LDH, LDZ, LWORK, N
      LOGICAL            WANTT, WANTZ
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   H( LDH, * ), WI( * ), WORK( * ), WR( * ),
     $                   Z( LDZ, * )
*     ..
*
*  ================================================================
*     .. Parameters ..
*
*     ==== Matrices of order NTINY or smaller must be processed by
*     .    DLAHQR because of insufficient subdiagonal scratch space.
*     .    (This is a hard limit.) ====
      INTEGER            NTINY
      parameter( ntiny = 15 )
*
*     ==== Exceptional deflation windows:  try to cure rare
*     .    slow convergence by varying the size of the
*     .    deflation window after KEXNW iterations. ====
      INTEGER            KEXNW
      parameter( kexnw = 5 )
*
*     ==== Exceptional shifts: try to cure rare slow convergence
*     .    with ad-hoc exceptional shifts every KEXSH iterations.
*     .    ====
      INTEGER            KEXSH
      parameter( kexsh = 6 )
*
*     ==== The constants WILK1 and WILK2 are used to form the
*     .    exceptional shifts. ====
      DOUBLE PRECISION   WILK1, WILK2
      parameter( wilk1 = 0.75d0, wilk2 = -0.4375d0 )
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d0, one = 1.0d0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   AA, BB, CC, CS, DD, SN, SS, SWAP
      INTEGER            I, INF, IT, ITMAX, K, KACC22, KBOT, KDU, KS,
     $                   KT, KTOP, KU, KV, KWH, KWTOP, KWV, LD, LS,
     $                   LWKOPT, NDEC, NDFL, NH, NHO, NIBBLE, NMIN, NS,
     $                   NSMAX, NSR, NVE, NW, NWMAX, NWR, NWUPBD
      LOGICAL            SORTED
      CHARACTER          JBCMPZ*2
*     ..
*     .. External Functions ..
      INTEGER            ILAENV
      EXTERNAL           ilaenv
*     ..
*     .. Local Arrays ..
      DOUBLE PRECISION   ZDUM( 1, 1 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlacpy, dlahqr, dlanv2, dlaqr2, dlaqr5
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, dble, int, max, min, mod
*     ..
*     .. Executable Statements ..
      info = 0
*
*     ==== Quick return for N = 0: nothing to do. ====
*
      IF( n.EQ.0 ) THEN
         work( 1 ) = one
         RETURN
      END IF
*
      IF( n.LE.ntiny ) THEN
*
*        ==== Tiny matrices must use DLAHQR.  For a workspace
*        .    query (LWORK = -1) nothing is computed and the
*        .    reported optimal size is 1. ====
*
         lwkopt = 1
         IF( lwork.NE.-1 )
     $      CALL dlahqr( wantt, wantz, n, ilo, ihi, h, ldh, wr, wi,
     $                   iloz, ihiz, z, ldz, info )
      ELSE
*
*        ==== Use small bulge multi-shift QR with aggressive early
*        .    deflation on larger-than-tiny matrices. ====
*
*        ==== Hope for the best. ====
*
         info = 0
*
*        ==== Set up job flags for ILAENV. ====
*
         IF( wantt ) THEN
            jbcmpz( 1: 1 ) = 'S'
         ELSE
            jbcmpz( 1: 1 ) = 'E'
         END IF
         IF( wantz ) THEN
            jbcmpz( 2: 2 ) = 'V'
         ELSE
            jbcmpz( 2: 2 ) = 'N'
         END IF
*
*        ==== NWR = recommended deflation window size.  At this
*        .    point,  N .GT. NTINY = 15, so there is enough
*        .    subdiagonal workspace for NWR.GE.2 as required.
*        .    (In fact, there is enough subdiagonal space for
*        .    NWR.GE.4.) ====
*
         nwr = ilaenv( 13, 'DLAQR4', jbcmpz, n, ilo, ihi, lwork )
         nwr = max( 2, nwr )
         nwr = min( ihi-ilo+1, ( n-1 ) / 3, nwr )
*
*        ==== NSR = recommended number of simultaneous shifts.
*        .    At this point N .GT. NTINY = 15, so there is
*        .    enough subdiagonal workspace for NSR to be even
*        .    and greater than or equal to two as required. ====
*
         nsr = ilaenv( 15, 'DLAQR4', jbcmpz, n, ilo, ihi, lwork )
         nsr = min( nsr, ( n-3 ) / 6, ihi-ilo )
         nsr = max( 2, nsr-mod( nsr, 2 ) )
*
*        ==== Estimate optimal workspace ====
*
*        ==== Workspace query call to DLAQR2.  LWORK = -1 is
*        .    passed in the last argument and only WORK(1) is read
*        .    back; H merely stands in for the three scratch-array
*        .    arguments. ====
*
         CALL dlaqr2( wantt, wantz, n, ilo, ihi, nwr+1, h, ldh, iloz,
     $                ihiz, z, ldz, ls, ld, wr, wi, h, ldh, n, h, ldh,
     $                n, h, ldh, work, -1 )
*
*        ==== Optimal workspace = MAX(DLAQR5, DLAQR2) ====
*
         lwkopt = max( 3*nsr / 2, int( work( 1 ) ) )
*
*        ==== Quick return in case of workspace query. ====
*
         IF( lwork.EQ.-1 ) THEN
            work( 1 ) = dble( lwkopt )
            RETURN
         END IF
*
*        ==== DLAHQR/DLAQR0 crossover point ====
*
         nmin = ilaenv( 12, 'DLAQR4', jbcmpz, n, ilo, ihi, lwork )
         nmin = max( ntiny, nmin )
*
*        ==== Nibble crossover point ====
*
         nibble = ilaenv( 14, 'DLAQR4', jbcmpz, n, ilo, ihi, lwork )
         nibble = max( 0, nibble )
*
*        ==== Accumulate reflections during the QR sweep?  Use
*        .    block 2-by-2 structure during matrix-matrix multiply?
*        .    (KACC22 is clamped to 0..2 and passed on to DLAQR5.)
*        .    ====
*
         kacc22 = ilaenv( 16, 'DLAQR4', jbcmpz, n, ilo, ihi, lwork )
         kacc22 = max( 0, kacc22 )
         kacc22 = min( 2, kacc22 )
*
*        ==== NWMAX = the largest possible deflation window for
*        .    which there is sufficient workspace. ====
*
         nwmax = min( ( n-1 ) / 3, lwork / 2 )
         nw = nwmax
*
*        ==== NSMAX = the largest number of simultaneous shifts
*        .    for which there is sufficient workspace. ====
*
         nsmax = min( ( n-3 ) / 6, 2*lwork / 3 )
         nsmax = nsmax - mod( nsmax, 2 )
*
*        ==== NDFL: an iteration count restarted at deflation. ====
*
         ndfl = 1
*
*        ==== ITMAX = iteration limit ====
*
         itmax = max( 30, 2*kexsh )*max( 10, ( ihi-ilo+1 ) )
*
*        ==== Last row and column in the active block ====
*
         kbot = ihi
*
*        ==== Main Loop ====
*
         DO 80 it = 1, itmax
*
*           ==== Done when KBOT falls below ILO ====
*
            IF( kbot.LT.ilo )
     $         GO TO 90
*
*           ==== Locate active block: scan upward from KBOT for the
*           .    first exactly-zero subdiagonal entry; KTOP is the
*           .    row just below it, or ILO if none is found. ====
*
            DO 10 k = kbot, ilo + 1, -1
               IF( h( k, k-1 ).EQ.zero )
     $            GO TO 20
   10       CONTINUE
            k = ilo
   20       CONTINUE
            ktop = k
*
*           ==== Select deflation window size:
*           .    Typical Case:
*           .      If possible and advisable, nibble the entire
*           .      active block.  If not, use size MIN(NWR,NWMAX)
*           .      or MIN(NWR+1,NWMAX) depending upon which has
*           .      the smaller corresponding subdiagonal entry
*           .      (a heuristic).
*           .
*           .    Exceptional Case:
*           .      If there have been no deflations in KEXNW or
*           .      more iterations, then vary the deflation window
*           .      size.   At first, because larger windows are,
*           .      in general, more powerful than smaller ones,
*           .      rapidly increase the window to the maximum possible.
*           .      Then, gradually reduce the window size. ====
*
*           ==== NH = order of the active block.  NWUPBD = largest
*           .    window allowed by both the block and the workspace.
*           .    In the exceptional case the previous NW is doubled.
*           .    ====
*
            nh = kbot - ktop + 1
            nwupbd = min( nh, nwmax )
            IF( ndfl.LT.kexnw ) THEN
               nw = min( nwupbd, nwr )
            ELSE
               nw = min( nwupbd, 2*nw )
            END IF
*
*           ==== Below the workspace maximum: take the whole block
*           .    if the window already covers all but at most one
*           .    row; otherwise grow the window by one when the
*           .    subdiagonal entry at its top is larger in magnitude
*           .    than the one just above it. ====
*
            IF( nw.LT.nwmax ) THEN
               IF( nw.GE.nh-1 ) THEN
                  nw = nh
               ELSE
                  kwtop = kbot - nw + 1
                  IF( abs( h( kwtop, kwtop-1 ) ).GT.
     $                abs( h( kwtop-1, kwtop-2 ) ) )nw = nw + 1
               END IF
            END IF
*
*           ==== NDEC = amount by which the window is shrunk in the
*           .    exceptional case.  It is reset to -1 while
*           .    deflations are recent.  Otherwise, once the window
*           .    has reached NWUPBD (or shrinking has already begun),
*           .    NDEC grows by one per iteration and is reset to 0
*           .    if the window would drop below 2. ====
*
            IF( ndfl.LT.kexnw ) THEN
               ndec = -1
            ELSE IF( ndec.GE.0 .OR. nw.GE.nwupbd ) THEN
               ndec = ndec + 1
               IF( nw-ndec.LT.2 )
     $            ndec = 0
               nw = nw - ndec
            END IF
*
*           ==== Aggressive early deflation:
*           .    split workspace under the subdiagonal into
*           .      - an NW-by-NW work array V in the lower
*           .        left-hand-corner,
*           .      - an NW-by-at-least-NW-but-more-is-better
*           .        (NW-by-NHO) horizontal work array along
*           .        the bottom edge,
*           .      - an at-least-NW-but-more-is-better (NVE-by-NW)
*           .        vertical work array along the left-hand-edge.
*           .        ====
*
            kv = n - nw + 1
            kt = nw + 1
            nho = ( n-nw-1 ) - kt + 1
            kwv = nw + 2
            nve = ( n-nw ) - kwv + 1
*
*           ==== Aggressive early deflation.  LD and LS are set by
*           .    DLAQR2 and are used below as the number of newly
*           .    deflated eigenvalues and the number of shifts
*           .    left in WR and WI, respectively. ====
*
            CALL dlaqr2( wantt, wantz, n, ktop, kbot, nw, h, ldh, iloz,
     $                   ihiz, z, ldz, ls, ld, wr, wi, h( kv, 1 ), ldh,
     $                   nho, h( kv, kt ), ldh, nve, h( kwv, 1 ), ldh,
     $                   work, lwork )
*
*           ==== Adjust KBOT accounting for new deflations. ====
*
            kbot = kbot - ld
*
*           ==== KS points to the shifts. ====
*
            ks = kbot - ls + 1
*
*           ==== Skip an expensive QR sweep if there is a (partly
*           .    heuristic) reason to expect that many eigenvalues
*           .    will deflate without it.  Here, the QR sweep is
*           .    skipped if many eigenvalues have just been deflated
*           .    or if the remaining active block is small. ====
*
            IF( ( ld.EQ.0 ) .OR. ( ( 100*ld.LE.nw*nibble ) .AND. ( kbot-
     $          ktop+1.GT.min( nmin, nwmax ) ) ) ) THEN
*
*              ==== NS = nominal number of simultaneous shifts.
*              .    This may be lowered (slightly) if DLAQR2
*              .    did not provide that many shifts. ====
*
               ns = min( nsmax, nsr, max( 2, kbot-ktop ) )
               ns = ns - mod( ns, 2 )
*
*              ==== If there have been no deflations
*              .    in a multiple of KEXSH iterations,
*              .    then try exceptional shifts.
*              .    Otherwise use shifts provided by
*              .    DLAQR2 above or from the eigenvalues
*              .    of a trailing principal submatrix. ====
*
               IF( mod( ndfl, kexsh ).EQ.0 ) THEN
                  ks = kbot - ns + 1
                  DO 30 i = kbot, max( ks+1, ktop+2 ), -2
                     ss = abs( h( i, i-1 ) ) + abs( h( i-1, i-2 ) )
                     aa = wilk1*ss + h( i, i )
                     bb = ss
                     cc = wilk2*ss
                     dd = aa
                     CALL dlanv2( aa, bb, cc, dd, wr( i-1 ), wi( i-1 ),
     $                            wr( i ), wi( i ), cs, sn )
   30             CONTINUE
*
*                 ==== When KS = KTOP the loop above stops at
*                 .    I = KTOP+2, so the pair (KS,KS+1) has not
*                 .    been set.  Fill both entries with the real
*                 .    shift H(KS+1,KS+1). ====
*
                  IF( ks.EQ.ktop ) THEN
                     wr( ks+1 ) = h( ks+1, ks+1 )
                     wi( ks+1 ) = zero
                     wr( ks ) = wr( ks+1 )
                     wi( ks ) = wi( ks+1 )
                  END IF
               ELSE
*
*                 ==== Got NS/2 or fewer shifts? Use DLAHQR
*                 .    on a trailing principal submatrix to
*                 .    get more. (Since NS.LE.NSMAX.LE.(N-3)/6,
*                 .    there is enough space below the subdiagonal
*                 .    to fit an NS-by-NS scratch array.) ====
*
                  IF( kbot-ks+1.LE.ns / 2 ) THEN
                     ks = kbot - ns + 1
                     kt = n - ns + 1
                     CALL dlacpy( 'A', ns, ns, h( ks, ks ), ldh,
     $                            h( kt, 1 ), ldh )
                     CALL dlahqr( .false., .false., ns, 1, ns,
     $                            h( kt, 1 ), ldh, wr( ks ), wi( ks ),
     $                            1, 1, zdum, 1, inf )
*
*                    ==== NOTE(review): presumably INF counts the
*                    .    leading eigenvalues DLAHQR failed to
*                    .    compute, so KS is advanced past them --
*                    .    confirm against DLAHQR's INFO. ====
*
                     ks = ks + inf
*
*                    ==== In case of a rare QR failure use
*                    .    eigenvalues of the trailing 2-by-2
*                    .    principal submatrix.  ====
*
                     IF( ks.GE.kbot ) THEN
                        aa = h( kbot-1, kbot-1 )
                        cc = h( kbot, kbot-1 )
                        bb = h( kbot-1, kbot )
                        dd = h( kbot, kbot )
                        CALL dlanv2( aa, bb, cc, dd, wr( kbot-1 ),
     $                               wi( kbot-1 ), wr( kbot ),
     $                               wi( kbot ), cs, sn )
                        ks = kbot - 1
                     END IF
                  END IF
*
                  IF( kbot-ks+1.GT.ns ) THEN
*
*                    ==== Sort the shifts (Helps a little)
*                    .    Bubble sort keeps complex conjugate
*                    .    pairs together.  Entries are ordered by
*                    .    decreasing ABS(WR)+ABS(WI), and the sort
*                    .    stops after the first pass without a
*                    .    swap. ====
*
                     sorted = .false.
                     DO 50 k = kbot, ks + 1, -1
                        IF( sorted )
     $                     GO TO 60
                        sorted = .true.
                        DO 40 i = ks, k - 1
                           IF( abs( wr( i ) )+abs( wi( i ) ).LT.
     $                         abs( wr( i+1 ) )+abs( wi( i+1 ) ) ) THEN
                              sorted = .false.
*
                              swap = wr( i )
                              wr( i ) = wr( i+1 )
                              wr( i+1 ) = swap
*
                              swap = wi( i )
                              wi( i ) = wi( i+1 )
                              wi( i+1 ) = swap
                           END IF
   40                   CONTINUE
   50                CONTINUE
   60                CONTINUE
                  END IF
*
*                 ==== Shuffle shifts into pairs of real shifts
*                 .    and pairs of complex conjugate shifts
*                 .    assuming complex conjugate shifts are
*                 .    already adjacent to one another. (Yes,
*                 .    they are.)  When entries I-1 and I are not
*                 .    a conjugate pair, entries I-2, I-1, I are
*                 .    rotated so that the old entry I moves to
*                 .    position I-2. ====
*
                  DO 70 i = kbot, ks + 2, -2
                     IF( wi( i ).NE.-wi( i-1 ) ) THEN
*
                        swap = wr( i )
                        wr( i ) = wr( i-1 )
                        wr( i-1 ) = wr( i-2 )
                        wr( i-2 ) = swap
*
                        swap = wi( i )
                        wi( i ) = wi( i-1 )
                        wi( i-1 ) = wi( i-2 )
                        wi( i-2 ) = swap
                     END IF
   70             CONTINUE
               END IF
*
*              ==== If there are only two shifts and both are
*              .    real, then use only one: whichever is closer
*              .    to H(KBOT,KBOT) is stored in both slots. ====
*
               IF( kbot-ks+1.EQ.2 ) THEN
                  IF( wi( kbot ).EQ.zero ) THEN
                     IF( abs( wr( kbot )-h( kbot, kbot ) ).LT.
     $                   abs( wr( kbot-1 )-h( kbot, kbot ) ) ) THEN
                        wr( kbot-1 ) = wr( kbot )
                     ELSE
                        wr( kbot ) = wr( kbot-1 )
                     END IF
                  END IF
               END IF
*
*              ==== Use up to NS of the smallest magnitude
*              .    shifts.  If there aren't NS shifts available,
*              .    then use them all, possibly dropping one to
*              .    make the number of shifts even. ====
*
               ns = min( ns, kbot-ks+1 )
               ns = ns - mod( ns, 2 )
               ks = kbot - ns + 1
*
*              ==== Small-bulge multi-shift QR sweep:
*              .    split workspace under the subdiagonal into
*              .    - a KDU-by-KDU work array U in the lower
*              .      left-hand-corner,
*              .    - a KDU-by-at-least-KDU-but-more-is-better
*              .      (KDU-by-NHO) horizontal work array WH along
*              .      the bottom edge,
*              .    - and an at-least-KDU-but-more-is-better-by-KDU
*              .      (NVE-by-KDU) vertical work array WV along
*              .      the left-hand-edge. ====
*
               kdu = 2*ns
               ku = n - kdu + 1
               kwh = kdu + 1
               nho = ( n-kdu+1-4 ) - ( kdu+1 ) + 1
               kwv = kdu + 4
               nve = n - kdu - kwv + 1
*
*              ==== Small-bulge multi-shift QR sweep.  WORK is
*              .    passed as DLAQR5's V array with leading
*              .    dimension 3; U, WV and WH are the sub-blocks
*              .    of H set up above. ====
*
               CALL dlaqr5( wantt, wantz, kacc22, n, ktop, kbot, ns,
     $                      wr( ks ), wi( ks ), h, ldh, iloz, ihiz, z,
     $                      ldz, work, 3, h( ku, 1 ), ldh, nve,
     $                      h( kwv, 1 ), ldh, nho, h( ku, kwh ), ldh )
            END IF
*
*           ==== Note progress (or the lack of it). ====
*
            IF( ld.GT.0 ) THEN
               ndfl = 1
            ELSE
               ndfl = ndfl + 1
            END IF
*
*           ==== End of main loop ====
   80    CONTINUE
*
*        ==== Iteration limit exceeded.  Set INFO to show where
*        .    the problem occurred and exit. ====
*
         info = kbot
   90    CONTINUE
      END IF
*
*     ==== Return the optimal value of LWORK. ====
*
      work( 1 ) = dble( lwkopt )
*
*     ==== End of DLAQR4 ====
*

◆ dlaqr5()

subroutine dlaqr5	(	logical	wantt,
		logical	wantz,
		integer	kacc22,
		integer	n,
		integer	ktop,
		integer	kbot,
		integer	nshfts,
		double precision, dimension( * )	sr,
		double precision, dimension( * )	si,
		double precision, dimension( ldh, * )	h,
		integer	ldh,
		integer	iloz,
		integer	ihiz,
		double precision, dimension( ldz, * )	z,
		integer	ldz,
		double precision, dimension( ldv, * )	v,
		integer	ldv,
		double precision, dimension( ldu, * )	u,
		integer	ldu,
		integer	nv,
		double precision, dimension( ldwv, * )	wv,
		integer	ldwv,
		integer	nh,
		double precision, dimension( ldwh, * )	wh,
		integer	ldwh )

DLAQR5 performs a single small-bulge multi-shift QR sweep.

Download DLAQR5 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!>    DLAQR5, called by DLAQR0 and DLAQR4, performs a
!>    single small-bulge multi-shift QR sweep.
!>

Parameters

[in]	WANTT	!> WANTT is LOGICAL !> WANTT = .true. if the quasi-triangular Schur factor !> is being computed. WANTT is set to .false. otherwise. !>
[in]	WANTZ	!> WANTZ is LOGICAL !> WANTZ = .true. if the orthogonal Schur factor is being !> computed. WANTZ is set to .false. otherwise. !>
[in]	KACC22	!> KACC22 is INTEGER with value 0, 1, or 2. !> Specifies the computation mode of far-from-diagonal !> orthogonal updates. !> = 0: DLAQR5 does not accumulate reflections and does not !> use matrix-matrix multiply to update far-from-diagonal !> matrix entries. !> = 1: DLAQR5 accumulates reflections and uses matrix-matrix !> multiply to update the far-from-diagonal matrix entries. !> = 2: Same as KACC22 = 1. This option used to enable exploiting !> the 2-by-2 structure during matrix multiplications, but !> this is no longer supported. !>
[in]	N	!> N is INTEGER !> N is the order of the Hessenberg matrix H upon which this !> subroutine operates. !>
[in]	KTOP	!> KTOP is INTEGER !>
[in]	KBOT	!> KBOT is INTEGER !> These are the first and last rows and columns of an !> isolated diagonal block upon which the QR sweep is to be !> applied. It is assumed without a check that !> either KTOP = 1 or H(KTOP,KTOP-1) = 0 !> and !> either KBOT = N or H(KBOT+1,KBOT) = 0. !>
[in]	NSHFTS	!> NSHFTS is INTEGER !> NSHFTS gives the number of simultaneous shifts. NSHFTS !> must be positive and even. !>
[in,out]	SR	!> SR is DOUBLE PRECISION array, dimension (NSHFTS) !>
[in,out]	SI	!> SI is DOUBLE PRECISION array, dimension (NSHFTS) !> SR contains the real parts and SI contains the imaginary !> parts of the NSHFTS shifts of origin that define the !> multi-shift QR sweep. On output SR and SI may be !> reordered. !>
[in,out]	H	!> H is DOUBLE PRECISION array, dimension (LDH,N) !> On input H contains a Hessenberg matrix. On output a !> multi-shift QR sweep with shifts SR(J)+i*SI(J) is applied !> to the isolated diagonal block in rows and columns KTOP !> through KBOT. !>
[in]	LDH	!> LDH is INTEGER !> LDH is the leading dimension of H just as declared in the !> calling procedure. LDH >= MAX(1,N). !>
[in]	ILOZ	!> ILOZ is INTEGER !>
[in]	IHIZ	!> IHIZ is INTEGER !> Specify the rows of Z to which transformations must be !> applied if WANTZ is .TRUE.. 1 <= ILOZ <= IHIZ <= N !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, dimension (LDZ,IHIZ) !> If WANTZ = .TRUE., then the QR Sweep orthogonal !> similarity transformation is accumulated into !> Z(ILOZ:IHIZ,ILOZ:IHIZ) from the right. !> If WANTZ = .FALSE., then Z is unreferenced. !>
[in]	LDZ	!> LDZ is INTEGER !> LDZ is the leading dimension of Z just as declared in !> the calling procedure. LDZ >= N. !>
[out]	V	!> V is DOUBLE PRECISION array, dimension (LDV,NSHFTS/2) !>
[in]	LDV	!> LDV is INTEGER !> LDV is the leading dimension of V as declared in the !> calling procedure. LDV >= 3. !>
[out]	U	!> U is DOUBLE PRECISION array, dimension (LDU,2*NSHFTS) !>
[in]	LDU	!> LDU is INTEGER !> LDU is the leading dimension of U just as declared in the !> calling subroutine. LDU >= 2*NSHFTS. !>
[in]	NV	!> NV is INTEGER !> NV is the number of rows in WV available for workspace. !> NV >= 1. !>
[out]	WV	!> WV is DOUBLE PRECISION array, dimension (LDWV,2*NSHFTS) !>
[in]	LDWV	!> LDWV is INTEGER !> LDWV is the leading dimension of WV as declared in the !> calling subroutine. LDWV >= NV. !>
[in]	NH	!> NH is INTEGER !> NH is the number of columns in array WH available for !> workspace. NH >= 1. !>
[out]	WH	!> WH is DOUBLE PRECISION array, dimension (LDWH,NH) !>
[in]	LDWH	!> LDWH is INTEGER !> Leading dimension of WH just as declared in the !> calling procedure. LDWH >= 2*NSHFTS. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Karen Braman and Ralph Byers, Department of Mathematics, University of Kansas, USA

Lars Karlsson, Daniel Kressner, and Bruno Lang

Thijs Steel, Department of Computer science, KU Leuven, Belgium

References: K. Braman, R. Byers and R. Mathias, The Multi-Shift QR Algorithm Part I: Maintaining Well Focused Shifts, and Level 3 Performance, SIAM Journal of Matrix Analysis, volume 23, pages 929–947, 2002.

Lars Karlsson, Daniel Kressner, and Bruno Lang, Optimally packed chains of bulges in multishift QR algorithms. ACM Trans. Math. Softw. 40, 2, Article 12 (February 2014).

Definition at line 262 of file dlaqr5.f.

      IMPLICIT NONE
*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            IHIZ, ILOZ, KACC22, KBOT, KTOP, LDH, LDU, LDV,
     $                   LDWH, LDWV, LDZ, N, NH, NSHFTS, NV
      LOGICAL            WANTT, WANTZ
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   H( LDH, * ), SI( * ), SR( * ), U( LDU, * ),
     $                   V( LDV, * ), WH( LDWH, * ), WV( LDWV, * ),
     $                   Z( LDZ, * )
*     ..
*
*  ================================================================
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d0, one = 1.0d0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   ALPHA, BETA, H11, H12, H21, H22, REFSUM,
     $                   SAFMAX, SAFMIN, SCL, SMLNUM, SWAP, TST1, TST2,
     $                   ULP
      INTEGER            I, I2, I4, INCOL, J, JBOT, JCOL, JLEN,
     $                   JROW, JTOP, K, K1, KDU, KMS, KRCOL,
     $                   M, M22, MBOT, MTOP, NBMPS, NDCOL,
     $                   NS, NU
      LOGICAL            ACCUM, BMP22
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           dlamch
*     ..
*     .. Intrinsic Functions ..
*
      INTRINSIC          abs, dble, max, min, mod
*     ..
*     .. Local Arrays ..
      DOUBLE PRECISION   VT( 3 )
*     ..
*     .. External Subroutines ..
      EXTERNAL           dgemm, dlabad, dlacpy, dlaqr1, dlarfg, dlaset,
     $                   dtrmm
*     ..
*     .. Executable Statements ..
*
*     ==== If there are no shifts, then there is nothing to do. ====
*
      IF( nshfts.LT.2 )
     $   RETURN
*
*     ==== If the active block is empty or 1-by-1, then there
*     .    is nothing to do. ====
*
      IF( ktop.GE.kbot )
     $   RETURN
*
*     ==== Shuffle shifts into pairs of real shifts and pairs
*     .    of complex conjugate shifts assuming complex
*     .    conjugate shifts are already adjacent to one
*     .    another. ====
*
      DO 10 i = 1, nshfts - 2, 2
         IF( si( i ).NE.-si( i+1 ) ) THEN
*
            swap = sr( i )
            sr( i ) = sr( i+1 )
            sr( i+1 ) = sr( i+2 )
            sr( i+2 ) = swap
*
            swap = si( i )
            si( i ) = si( i+1 )
            si( i+1 ) = si( i+2 )
            si( i+2 ) = swap
         END IF
   10 CONTINUE
*
*     ==== NSHFTS is supposed to be even, but if it is odd,
*     .    then simply reduce it by one.  The shuffle above
*     .    ensures that the dropped shift is real and that
*     .    the remaining shifts are paired. ====
*
      ns = nshfts - mod( nshfts, 2 )
*
*     ==== Machine constants for deflation ====
*
      safmin = dlamch( 'SAFE MINIMUM' )
      safmax = one / safmin
      CALL dlabad( safmin, safmax )
      ulp = dlamch( 'PRECISION' )
      smlnum = safmin*( dble( n ) / ulp )
*
*     ==== Use accumulated reflections to update far-from-diagonal
*     .    entries ? ====
*
      accum = ( kacc22.EQ.1 ) .OR. ( kacc22.EQ.2 )
*
*     ==== clear trash ====
*
      IF( ktop+2.LE.kbot )
     $   h( ktop+2, ktop ) = zero
*
*     ==== NBMPS = number of 2-shift bulges in the chain ====
*
      nbmps = ns / 2
*
*     ==== KDU = width of slab ====
*
      kdu = 4*nbmps
*
*     ==== Create and chase chains of NBMPS bulges ====
*
      DO 180 incol = ktop - 2*nbmps + 1, kbot - 2, 2*nbmps
*
*        JTOP = Index from which updates from the right start.
*
         IF( accum ) THEN
            jtop = max( ktop, incol )
         ELSE IF( wantt ) THEN
            jtop = 1
         ELSE
            jtop = ktop
         END IF
*
         ndcol = incol + kdu
         IF( accum )
     $      CALL dlaset( 'ALL', kdu, kdu, zero, one, u, ldu )
*
*        ==== Near-the-diagonal bulge chase.  The following loop
*        .    performs the near-the-diagonal part of a small bulge
*        .    multi-shift QR sweep.  Each 4*NBMPS column diagonal
*        .    chunk extends from column INCOL to column NDCOL
*        .    (including both column INCOL and column NDCOL). The
*        .    following loop chases a 2*NBMPS+1 column long chain of
*        .    NBMPS bulges 2*NBMPS columns to the right.  (INCOL
*        .    may be less than KTOP and and NDCOL may be greater than
*        .    KBOT indicating phantom columns from which to chase
*        .    bulges before they are actually introduced or to which
*        .    to chase bulges beyond column KBOT.)  ====
*
         DO 145 krcol = incol, min( incol+2*nbmps-1, kbot-2 )
*
*           ==== Bulges number MTOP to MBOT are active double implicit
*           .    shift bulges.  There may or may not also be small
*           .    2-by-2 bulge, if there is room.  The inactive bulges
*           .    (if any) must wait until the active bulges have moved
*           .    down the diagonal to make room.  The phantom matrix
*           .    paradigm described above helps keep track.  ====
*
            mtop = max( 1, ( ktop-krcol ) / 2+1 )
            mbot = min( nbmps, ( kbot-krcol-1 ) / 2 )
            m22 = mbot + 1
            bmp22 = ( mbot.LT.nbmps ) .AND. ( krcol+2*( m22-1 ) ).EQ.
     $              ( kbot-2 )
*
*           ==== Generate reflections to chase the chain right
*           .    one column.  (The minimum value of K is KTOP-1.) ====
*
            IF ( bmp22 ) THEN
*
*              ==== Special case: 2-by-2 reflection at bottom treated
*              .    separately ====
*
               k = krcol + 2*( m22-1 )
               IF( k.EQ.ktop-1 ) THEN
                  CALL dlaqr1( 2, h( k+1, k+1 ), ldh, sr( 2*m22-1 ),
     $                         si( 2*m22-1 ), sr( 2*m22 ), si( 2*m22 ),
     $                         v( 1, m22 ) )
                  beta = v( 1, m22 )
                  CALL dlarfg( 2, beta, v( 2, m22 ), 1, v( 1, m22 ) )
               ELSE
                  beta = h( k+1, k )
                  v( 2, m22 ) = h( k+2, k )
                  CALL dlarfg( 2, beta, v( 2, m22 ), 1, v( 1, m22 ) )
                  h( k+1, k ) = beta
                  h( k+2, k ) = zero
               END IF
 
*
*              ==== Perform update from right within 
*              .    computational window. ====
*
               DO 30 j = jtop, min( kbot, k+3 )
                  refsum = v( 1, m22 )*( h( j, k+1 )+v( 2, m22 )*
     $                     h( j, k+2 ) )
                  h( j, k+1 ) = h( j, k+1 ) - refsum
                  h( j, k+2 ) = h( j, k+2 ) - refsum*v( 2, m22 )
   30          CONTINUE
*
*              ==== Perform update from left within 
*              .    computational window. ====
*
               IF( accum ) THEN
                  jbot = min( ndcol, kbot )
               ELSE IF( wantt ) THEN
                  jbot = n
               ELSE
                  jbot = kbot
               END IF
               DO 40 j = k+1, jbot
                  refsum = v( 1, m22 )*( h( k+1, j )+v( 2, m22 )*
     $                     h( k+2, j ) )
                  h( k+1, j ) = h( k+1, j ) - refsum
                  h( k+2, j ) = h( k+2, j ) - refsum*v( 2, m22 )
   40          CONTINUE
*
*              ==== The following convergence test requires that
*              .    the tradition small-compared-to-nearby-diagonals
*              .    criterion and the Ahues & Tisseur (LAWN 122, 1997)
*              .    criteria both be satisfied.  The latter improves
*              .    accuracy in some examples. Falling back on an
*              .    alternate convergence criterion when TST1 or TST2
*              .    is zero (as done here) is traditional but probably
*              .    unnecessary. ====
*
               IF( k.GE.ktop ) THEN
                  IF( h( k+1, k ).NE.zero ) THEN
                     tst1 = abs( h( k, k ) ) + abs( h( k+1, k+1 ) )
                     IF( tst1.EQ.zero ) THEN
                        IF( k.GE.ktop+1 )
     $                     tst1 = tst1 + abs( h( k, k-1 ) )
                        IF( k.GE.ktop+2 )
     $                     tst1 = tst1 + abs( h( k, k-2 ) )
                        IF( k.GE.ktop+3 )
     $                     tst1 = tst1 + abs( h( k, k-3 ) )
                        IF( k.LE.kbot-2 )
     $                     tst1 = tst1 + abs( h( k+2, k+1 ) )
                        IF( k.LE.kbot-3 )
     $                     tst1 = tst1 + abs( h( k+3, k+1 ) )
                        IF( k.LE.kbot-4 )
     $                     tst1 = tst1 + abs( h( k+4, k+1 ) )
                     END IF
                     IF( abs( h( k+1, k ) )
     $                   .LE.max( smlnum, ulp*tst1 ) ) THEN
                        h12 = max( abs( h( k+1, k ) ),
     $                             abs( h( k, k+1 ) ) )
                        h21 = min( abs( h( k+1, k ) ),
     $                             abs( h( k, k+1 ) ) )
                        h11 = max( abs( h( k+1, k+1 ) ),
     $                             abs( h( k, k )-h( k+1, k+1 ) ) )
                        h22 = min( abs( h( k+1, k+1 ) ),
     $                        abs( h( k, k )-h( k+1, k+1 ) ) )
                        scl = h11 + h12
                        tst2 = h22*( h11 / scl )
*
                        IF( tst2.EQ.zero .OR. h21*( h12 / scl ).LE.
     $                      max( smlnum, ulp*tst2 ) ) THEN
                           h( k+1, k ) = zero
                        END IF
                     END IF
                  END IF
               END IF
*
*              ==== Accumulate orthogonal transformations. ====
*
               IF( accum ) THEN
                  kms = k - incol
                  DO 50 j = max( 1, ktop-incol ), kdu
                     refsum = v( 1, m22 )*( u( j, kms+1 )+
     $                        v( 2, m22 )*u( j, kms+2 ) )
                     u( j, kms+1 ) = u( j, kms+1 ) - refsum
                     u( j, kms+2 ) = u( j, kms+2 ) - refsum*v( 2, m22 )
  50                 CONTINUE
               ELSE IF( wantz ) THEN
                  DO 60 j = iloz, ihiz
                     refsum = v( 1, m22 )*( z( j, k+1 )+v( 2, m22 )*
     $                        z( j, k+2 ) )
                     z( j, k+1 ) = z( j, k+1 ) - refsum
                     z( j, k+2 ) = z( j, k+2 ) - refsum*v( 2, m22 )
  60              CONTINUE
               END IF
            END IF
*
*           ==== Normal case: Chain of 3-by-3 reflections ====
*
            DO 80 m = mbot, mtop, -1
               k = krcol + 2*( m-1 )
               IF( k.EQ.ktop-1 ) THEN
                  CALL dlaqr1( 3, h( ktop, ktop ), ldh, sr( 2*m-1 ),
     $                         si( 2*m-1 ), sr( 2*m ), si( 2*m ),
     $                         v( 1, m ) )
                  alpha = v( 1, m )
                  CALL dlarfg( 3, alpha, v( 2, m ), 1, v( 1, m ) )
               ELSE
*
*                 ==== Perform delayed transformation of row below
*                 .    Mth bulge. Exploit fact that first two elements
*                 .    of row are actually zero. ====
*
                  refsum = v( 1, m )*v( 3, m )*h( k+3, k+2 )
                  h( k+3, k   ) = -refsum
                  h( k+3, k+1 ) = -refsum*v( 2, m )
                  h( k+3, k+2 ) = h( k+3, k+2 ) - refsum*v( 3, m )
*
*                 ==== Calculate reflection to move
*                 .    Mth bulge one step. ====
*
                  beta      = h( k+1, k )
                  v( 2, m ) = h( k+2, k )
                  v( 3, m ) = h( k+3, k )
                  CALL dlarfg( 3, beta, v( 2, m ), 1, v( 1, m ) )
*
*                 ==== A Bulge may collapse because of vigilant
*                 .    deflation or destructive underflow.  In the
*                 .    underflow case, try the two-small-subdiagonals
*                 .    trick to try to reinflate the bulge.  ====
*
                  IF( h( k+3, k ).NE.zero .OR. h( k+3, k+1 ).NE.
     $                zero .OR. h( k+3, k+2 ).EQ.zero ) THEN
*
*                    ==== Typical case: not collapsed (yet). ====
*
                     h( k+1, k ) = beta
                     h( k+2, k ) = zero
                     h( k+3, k ) = zero
                  ELSE
*
*                    ==== Atypical case: collapsed.  Attempt to
*                    .    reintroduce ignoring H(K+1,K) and H(K+2,K).
*                    .    If the fill resulting from the new
*                    .    reflector is too large, then abandon it.
*                    .    Otherwise, use the new one. ====
*
                     CALL dlaqr1( 3, h( k+1, k+1 ), ldh, sr( 2*m-1 ),
     $                            si( 2*m-1 ), sr( 2*m ), si( 2*m ),
     $                            vt )
                     alpha = vt( 1 )
                     CALL dlarfg( 3, alpha, vt( 2 ), 1, vt( 1 ) )
                     refsum = vt( 1 )*( h( k+1, k )+vt( 2 )*
     $                        h( k+2, k ) )
*
                     IF( abs( h( k+2, k )-refsum*vt( 2 ) )+
     $                   abs( refsum*vt( 3 ) ).GT.ulp*
     $                   ( abs( h( k, k ) )+abs( h( k+1,
     $                   k+1 ) )+abs( h( k+2, k+2 ) ) ) ) THEN
*
*                       ==== Starting a new bulge here would
*                       .    create non-negligible fill.  Use
*                       .    the old one with trepidation. ====
*
                        h( k+1, k ) = beta
                        h( k+2, k ) = zero
                        h( k+3, k ) = zero
                     ELSE
*
*                       ==== Starting a new bulge here would
*                       .    create only negligible fill.
*                       .    Replace the old reflector with
*                       .    the new one. ====
*
                        h( k+1, k ) = h( k+1, k ) - refsum
                        h( k+2, k ) = zero
                        h( k+3, k ) = zero
                        v( 1, m ) = vt( 1 )
                        v( 2, m ) = vt( 2 )
                        v( 3, m ) = vt( 3 )
                     END IF
                  END IF
               END IF
*
*              ====  Apply reflection from the right and
*              .     the first column of update from the left.
*              .     These updates are required for the vigilant
*              .     deflation check. We still delay most of the
*              .     updates from the left for efficiency. ====      
*
               DO 70 j = jtop, min( kbot, k+3 )
                  refsum = v( 1, m )*( h( j, k+1 )+v( 2, m )*
     $                     h( j, k+2 )+v( 3, m )*h( j, k+3 ) )
                  h( j, k+1 ) = h( j, k+1 ) - refsum
                  h( j, k+2 ) = h( j, k+2 ) - refsum*v( 2, m )
                  h( j, k+3 ) = h( j, k+3 ) - refsum*v( 3, m )
   70          CONTINUE
*
*              ==== Perform update from left for subsequent
*              .    column. ====
*
               refsum = v( 1, m )*( h( k+1, k+1 )+v( 2, m )*
     $                  h( k+2, k+1 )+v( 3, m )*h( k+3, k+1 ) )
               h( k+1, k+1 ) = h( k+1, k+1 ) - refsum
               h( k+2, k+1 ) = h( k+2, k+1 ) - refsum*v( 2, m )
               h( k+3, k+1 ) = h( k+3, k+1 ) - refsum*v( 3, m )
*
*              ==== The following convergence test requires that
*              .    the tradition small-compared-to-nearby-diagonals
*              .    criterion and the Ahues & Tisseur (LAWN 122, 1997)
*              .    criteria both be satisfied.  The latter improves
*              .    accuracy in some examples. Falling back on an
*              .    alternate convergence criterion when TST1 or TST2
*              .    is zero (as done here) is traditional but probably
*              .    unnecessary. ====
*
               IF( k.LT.ktop)
     $              cycle
               IF( h( k+1, k ).NE.zero ) THEN
                  tst1 = abs( h( k, k ) ) + abs( h( k+1, k+1 ) )
                  IF( tst1.EQ.zero ) THEN
                     IF( k.GE.ktop+1 )
     $                  tst1 = tst1 + abs( h( k, k-1 ) )
                     IF( k.GE.ktop+2 )
     $                  tst1 = tst1 + abs( h( k, k-2 ) )
                     IF( k.GE.ktop+3 )
     $                  tst1 = tst1 + abs( h( k, k-3 ) )
                     IF( k.LE.kbot-2 )
     $                  tst1 = tst1 + abs( h( k+2, k+1 ) )
                     IF( k.LE.kbot-3 )
     $                  tst1 = tst1 + abs( h( k+3, k+1 ) )
                     IF( k.LE.kbot-4 )
     $                  tst1 = tst1 + abs( h( k+4, k+1 ) )
                  END IF
                  IF( abs( h( k+1, k ) ).LE.max( smlnum, ulp*tst1 ) )
     $                 THEN
                     h12 = max( abs( h( k+1, k ) ), abs( h( k, k+1 ) ) )
                     h21 = min( abs( h( k+1, k ) ), abs( h( k, k+1 ) ) )
                     h11 = max( abs( h( k+1, k+1 ) ),
     $                     abs( h( k, k )-h( k+1, k+1 ) ) )
                     h22 = min( abs( h( k+1, k+1 ) ),
     $                     abs( h( k, k )-h( k+1, k+1 ) ) )
                     scl = h11 + h12
                     tst2 = h22*( h11 / scl )
*
                     IF( tst2.EQ.zero .OR. h21*( h12 / scl ).LE.
     $                   max( smlnum, ulp*tst2 ) ) THEN
                        h( k+1, k ) = zero
                     END IF
                  END IF
               END IF
   80       CONTINUE
*
*           ==== Multiply H by reflections from the left ====
*
            IF( accum ) THEN
               jbot = min( ndcol, kbot )
            ELSE IF( wantt ) THEN
               jbot = n
            ELSE
               jbot = kbot
            END IF
*
            DO 100 m = mbot, mtop, -1
               k = krcol + 2*( m-1 )
               DO 90 j = max( ktop, krcol + 2*m ), jbot
                  refsum = v( 1, m )*( h( k+1, j )+v( 2, m )*
     $                     h( k+2, j )+v( 3, m )*h( k+3, j ) )
                  h( k+1, j ) = h( k+1, j ) - refsum
                  h( k+2, j ) = h( k+2, j ) - refsum*v( 2, m )
                  h( k+3, j ) = h( k+3, j ) - refsum*v( 3, m )
   90          CONTINUE
  100       CONTINUE
*
*           ==== Accumulate orthogonal transformations. ====
*
            IF( accum ) THEN
*
*              ==== Accumulate U. (If needed, update Z later
*              .    with an efficient matrix-matrix
*              .    multiply.) ====
*
               DO 120 m = mbot, mtop, -1
                  k = krcol + 2*( m-1 )
                  kms = k - incol
                  i2 = max( 1, ktop-incol )
                  i2 = max( i2, kms-(krcol-incol)+1 )
                  i4 = min( kdu, krcol + 2*( mbot-1 ) - incol + 5 )
                  DO 110 j = i2, i4
                     refsum = v( 1, m )*( u( j, kms+1 )+v( 2, m )*
     $                        u( j, kms+2 )+v( 3, m )*u( j, kms+3 ) )
                     u( j, kms+1 ) = u( j, kms+1 ) - refsum
                     u( j, kms+2 ) = u( j, kms+2 ) - refsum*v( 2, m )
                     u( j, kms+3 ) = u( j, kms+3 ) - refsum*v( 3, m )
  110             CONTINUE
  120          CONTINUE
            ELSE IF( wantz ) THEN
*
*              ==== U is not accumulated, so update Z
*              .    now by multiplying by reflections
*              .    from the right. ====
*
               DO 140 m = mbot, mtop, -1
                  k = krcol + 2*( m-1 )
                  DO 130 j = iloz, ihiz
                     refsum = v( 1, m )*( z( j, k+1 )+v( 2, m )*
     $                        z( j, k+2 )+v( 3, m )*z( j, k+3 ) )
                     z( j, k+1 ) = z( j, k+1 ) - refsum
                     z( j, k+2 ) = z( j, k+2 ) - refsum*v( 2, m )
                     z( j, k+3 ) = z( j, k+3 ) - refsum*v( 3, m )
  130             CONTINUE
  140          CONTINUE
            END IF
*
*           ==== End of near-the-diagonal bulge chase. ====
*
  145    CONTINUE
*
*        ==== Use U (if accumulated) to update far-from-diagonal
*        .    entries in H.  If required, use U to update Z as
*        .    well. ====
*
         IF( accum ) THEN
            IF( wantt ) THEN
               jtop = 1
               jbot = n
            ELSE
               jtop = ktop
               jbot = kbot
            END IF
            k1 = max( 1, ktop-incol )
            nu = ( kdu-max( 0, ndcol-kbot ) ) - k1 + 1
*
*           ==== Horizontal Multiply ====
*
            DO 150 jcol = min( ndcol, kbot ) + 1, jbot, nh
               jlen = min( nh, jbot-jcol+1 )
               CALL dgemm( 'C', 'N', nu, jlen, nu, one, u( k1, k1 ),
     $                        ldu, h( incol+k1, jcol ), ldh, zero, wh,
     $                        ldwh )
               CALL dlacpy( 'ALL', nu, jlen, wh, ldwh,
     $                         h( incol+k1, jcol ), ldh )
  150       CONTINUE
*
*           ==== Vertical multiply ====
*
            DO 160 jrow = jtop, max( ktop, incol ) - 1, nv
               jlen = min( nv, max( ktop, incol )-jrow )
               CALL dgemm( 'N', 'N', jlen, nu, nu, one,
     $                     h( jrow, incol+k1 ), ldh, u( k1, k1 ),
     $                     ldu, zero, wv, ldwv )
               CALL dlacpy( 'ALL', jlen, nu, wv, ldwv,
     $                      h( jrow, incol+k1 ), ldh )
  160       CONTINUE
*
*           ==== Z multiply (also vertical) ====
*
            IF( wantz ) THEN
               DO 170 jrow = iloz, ihiz, nv
                  jlen = min( nv, ihiz-jrow+1 )
                  CALL dgemm( 'N', 'N', jlen, nu, nu, one,
     $                        z( jrow, incol+k1 ), ldz, u( k1, k1 ),
     $                        ldu, zero, wv, ldwv )
                  CALL dlacpy( 'ALL', jlen, nu, wv, ldwv,
     $                         z( jrow, incol+k1 ), ldz )
  170          CONTINUE
            END IF
         END IF
  180 CONTINUE
*
*     ==== End of DLAQR5 ====
*

◆ dlaqsb()

subroutine dlaqsb	(	character	uplo,
		integer	n,
		integer	kd,
		double precision, dimension( ldab, * )	ab,
		integer	ldab,
		double precision, dimension( * )	s,
		double precision	scond,
		double precision	amax,
		character	equed )

DLAQSB scales a symmetric/Hermitian band matrix, using scaling factors computed by DPBEQU.

Download DLAQSB + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAQSB equilibrates a symmetric band matrix A using the scaling
!> factors in the vector S.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the upper or lower triangular part of the !> symmetric matrix A is stored. !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of super-diagonals of the matrix A if UPLO = 'U', !> or the number of sub-diagonals if UPLO = 'L'. KD >= 0. !>
[in,out]	AB	!> AB is DOUBLE PRECISION array, dimension (LDAB,N) !> On entry, the upper or lower triangle of the symmetric band !> matrix A, stored in the first KD+1 rows of the array. The !> j-th column of A is stored in the j-th column of the array AB !> as follows: !> if UPLO = 'U', AB(kd+1+i-j,j) = A(i,j) for max(1,j-kd)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+kd). !> !> On exit, if EQUED = 'Y', the equilibrated matrix !> diag(S) * A * diag(S), in the same storage format as A; !> if EQUED = 'N', AB is unchanged. !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[in]	S	!> S is DOUBLE PRECISION array, dimension (N) !> The scale factors for A. !>
[in]	SCOND	!> SCOND is DOUBLE PRECISION !> Ratio of the smallest S(i) to the largest S(i). !>
[in]	AMAX	!> AMAX is DOUBLE PRECISION !> Absolute value of largest matrix entry. !>
[out]	EQUED	!> EQUED is CHARACTER*1 !> Specifies whether or not equilibration was done. !> = 'N': No equilibration. !> = 'Y': Equilibration was done, i.e., A has been replaced by !> diag(S) * A * diag(S). !>

Internal Parameters:

!>  THRESH is a threshold value used to decide if scaling should be done
!>  based on the ratio of the scaling factors.  If SCOND < THRESH,
!>  scaling is done.
!>
!>  LARGE and SMALL are threshold values used to decide if scaling should
!>  be done based on the absolute size of the largest matrix element.
!>  If AMAX > LARGE or AMAX < SMALL, scaling is done.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 139 of file dlaqsb.f.

*
*  -- LAPACK auxiliary routine --
*
*     DLAQSB body: equilibration of a symmetric band matrix.
*
*     If the scale factors are poorly balanced (SCOND below THRESH)
*     or AMAX lies outside the window [LOBND, HIBND], every stored
*     band entry A(i,j) is overwritten with S(j)*S(i)*A(i,j) and
*     EQUED is set to 'Y'.  Otherwise AB is left untouched and EQUED
*     is set to 'N'.
*
*     .. Scalar Arguments ..
      CHARACTER          EQUED, UPLO
      INTEGER            KD, LDAB, N
      DOUBLE PRECISION   AMAX, SCOND
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   AB( LDAB, * ), S( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, THRESH
      parameter( one = 1.0d+0, thresh = 0.1d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            SKIP
      INTEGER            ICOL, ILAST, IOFF, IROW
      DOUBLE PRECISION   HIBND, LOBND, PREC, SCOL, SFMIN
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           lsame, dlamch
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     An empty matrix needs no scaling.
*
      IF( n.LE.0 ) THEN
         equed = 'N'
         RETURN
      END IF
*
*     Magnitude window outside of which AMAX forces scaling.
*
      sfmin = dlamch( 'Safe minimum' )
      prec = dlamch( 'Precision' )
      lobnd = sfmin / prec
      hibnd = one / lobnd
*
*     SKIP is true when A is already acceptably scaled.  The test is
*     kept in its positive form so that unordered comparisons take
*     the scaling path.
*
      skip = scond.GE.thresh .AND. amax.GE.lobnd .AND. amax.LE.hibnd
      IF( skip ) THEN
         equed = 'N'
         RETURN
      END IF
*
*     Overwrite A with diag(S) * A * diag(S).
*
      IF( lsame( uplo, 'U' ) ) THEN
*
*        Upper band storage: A(i,j) is held in AB(kd+1+i-j,j) for
*        max(1,j-kd) <= i <= j.  IOFF is the row shift of column j.
*
         DO icol = 1, n
            scol = s( icol )
            ioff = kd + 1 - icol
            DO irow = max( 1, icol-kd ), icol
               ab( ioff+irow, icol ) = scol*s( irow )*
     $                                 ab( ioff+irow, icol )
            END DO
         END DO
      ELSE
*
*        Lower band storage: A(i,j) is held in AB(1+i-j,j) for
*        j <= i <= min(n,j+kd).
*
         DO icol = 1, n
            scol = s( icol )
            ilast = min( n, icol+kd )
            DO irow = icol, ilast
               ab( 1+irow-icol, icol ) = scol*s( irow )*
     $                                   ab( 1+irow-icol, icol )
            END DO
         END DO
      END IF
      equed = 'Y'
*
      RETURN
*
*     End of DLAQSB
*

◆ dlaqsp()

subroutine dlaqsp	(	character	uplo,
		integer	n,
		double precision, dimension( * )	ap,
		double precision, dimension( * )	s,
		double precision	scond,
		double precision	amax,
		character	equed )

DLAQSP scales a symmetric/Hermitian matrix in packed storage, using scaling factors computed by DPPEQU.

Download DLAQSP + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAQSP equilibrates a symmetric matrix A using the scaling factors
!> in the vector S.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the upper or lower triangular part of the !> symmetric matrix A is stored. !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in,out]	AP	!> AP is DOUBLE PRECISION array, dimension (N*(N+1)/2) !> On entry, the upper or lower triangle of the symmetric matrix !> A, packed columnwise in a linear array. The j-th column of A !> is stored in the array AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !> !> On exit, the equilibrated matrix: diag(S) * A * diag(S), in !> the same storage format as A. !>
[in]	S	!> S is DOUBLE PRECISION array, dimension (N) !> The scale factors for A. !>
[in]	SCOND	!> SCOND is DOUBLE PRECISION !> Ratio of the smallest S(i) to the largest S(i). !>
[in]	AMAX	!> AMAX is DOUBLE PRECISION !> Absolute value of largest matrix entry. !>
[out]	EQUED	!> EQUED is CHARACTER*1 !> Specifies whether or not equilibration was done. !> = 'N': No equilibration. !> = 'Y': Equilibration was done, i.e., A has been replaced by !> diag(S) * A * diag(S). !>

Internal Parameters:

!>  THRESH is a threshold value used to decide if scaling should be done
!>  based on the ratio of the scaling factors.  If SCOND < THRESH,
!>  scaling is done.
!>
!>  LARGE and SMALL are threshold values used to decide if scaling should
!>  be done based on the absolute size of the largest matrix element.
!>  If AMAX > LARGE or AMAX < SMALL, scaling is done.
!>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 124 of file dlaqsp.f.

*
*  -- LAPACK auxiliary routine --
*
*     DLAQSP body: equilibration of a symmetric matrix held in
*     packed storage.
*
*     If the scale factors are poorly balanced (SCOND below THRESH)
*     or AMAX lies outside the window [LOBND, HIBND], every packed
*     entry A(i,j) is overwritten with S(j)*S(i)*A(i,j) and EQUED is
*     set to 'Y'.  Otherwise AP is left untouched and EQUED is set
*     to 'N'.
*
*     .. Scalar Arguments ..
      CHARACTER          EQUED, UPLO
      INTEGER            N
      DOUBLE PRECISION   AMAX, SCOND
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   AP( * ), S( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, THRESH
      parameter( one = 1.0d+0, thresh = 0.1d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            SKIP
      INTEGER            ICOL, IPOS, IROW
      DOUBLE PRECISION   HIBND, LOBND, PREC, SCOL, SFMIN
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           lsame, dlamch
*     ..
*     .. Executable Statements ..
*
*     An empty matrix needs no scaling.
*
      IF( n.LE.0 ) THEN
         equed = 'N'
         RETURN
      END IF
*
*     Magnitude window outside of which AMAX forces scaling.
*
      sfmin = dlamch( 'Safe minimum' )
      prec = dlamch( 'Precision' )
      lobnd = sfmin / prec
      hibnd = one / lobnd
*
*     SKIP is true when A is already acceptably scaled.  The test is
*     kept in its positive form so that unordered comparisons take
*     the scaling path.
*
      skip = scond.GE.thresh .AND. amax.GE.lobnd .AND. amax.LE.hibnd
      IF( skip ) THEN
         equed = 'N'
         RETURN
      END IF
*
*     Overwrite A with diag(S) * A * diag(S).  Columns are packed
*     back to back, so one running position IPOS visits the stored
*     entries in order for either triangle.
*
      ipos = 0
      IF( lsame( uplo, 'U' ) ) THEN
*
*        Upper triangle: column j holds rows 1..j.
*
         DO icol = 1, n
            scol = s( icol )
            DO irow = 1, icol
               ipos = ipos + 1
               ap( ipos ) = scol*s( irow )*ap( ipos )
            END DO
         END DO
      ELSE
*
*        Lower triangle: column j holds rows j..n.
*
         DO icol = 1, n
            scol = s( icol )
            DO irow = icol, n
               ipos = ipos + 1
               ap( ipos ) = scol*s( irow )*ap( ipos )
            END DO
         END DO
      END IF
      equed = 'Y'
*
      RETURN
*
*     End of DLAQSP
*

◆ dlaqtr()

subroutine dlaqtr	(	logical	ltran,
		logical	lreal,
		integer	n,
		double precision, dimension( ldt, * )	t,
		integer	ldt,
		double precision, dimension( * )	b,
		double precision	w,
		double precision	scale,
		double precision, dimension( * )	x,
		double precision, dimension( * )	work,
		integer	info )

DLAQTR solves a real quasi-triangular system of equations, or a complex quasi-triangular system of special form, in real arithmetic.

Download DLAQTR + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAQTR solves the real quasi-triangular system
!>
!>              op(T)*p = scale*c,               if LREAL = .TRUE.
!>
!> or the complex quasi-triangular systems
!>
!>            op(T + iB)*(p+iq) = scale*(c+id),  if LREAL = .FALSE.
!>
!> in real arithmetic, where T is upper quasi-triangular.
!> If LREAL = .FALSE., then the first diagonal block of T must be
!> 1 by 1, B is the specially structured matrix
!>
!>                B = [ b(1) b(2) ... b(n) ]
!>                    [       w            ]
!>                    [           w        ]
!>                    [              .     ]
!>                    [                 w  ]
!>
!> op(A) = A or A**T, A**T denotes the transpose of
!> matrix A.
!>
!> On input, X = [ c ].  On output, X = [ p ].
!>               [ d ]                  [ q ]
!>
!> This subroutine is designed for the condition number estimation
!> in routine DTRSNA.
!>

Parameters

[in]	LTRAN	!> LTRAN is LOGICAL !> On entry, LTRAN specifies the option of conjugate transpose: !> = .FALSE., op(T+iB) = T+iB, !> = .TRUE., op(T+iB) = (T+iB)**T. !>
[in]	LREAL	!> LREAL is LOGICAL !> On entry, LREAL specifies the input matrix structure: !> = .FALSE., the input is complex !> = .TRUE., the input is real !>
[in]	N	!> N is INTEGER !> On entry, N specifies the order of T+i*B. N >= 0. !>
[in]	T	!> T is DOUBLE PRECISION array, dimension (LDT,N) !> On entry, T contains a matrix in Schur canonical form. !> If LREAL = .FALSE., then the first diagonal block of T must !> be 1 by 1. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the matrix T. LDT >= max(1,N). !>
[in]	B	!> B is DOUBLE PRECISION array, dimension (N) !> On entry, B contains the elements to form the matrix !> B as described above. !> If LREAL = .TRUE., B is not referenced. !>
[in]	W	!> W is DOUBLE PRECISION !> On entry, W is the diagonal element of the matrix B. !> If LREAL = .TRUE., W is not referenced. !>
[out]	SCALE	!> SCALE is DOUBLE PRECISION !> On exit, SCALE is the scale factor. !>
[in,out]	X	!> X is DOUBLE PRECISION array, dimension (2*N) !> On entry, X contains the right hand side of the system. !> On exit, X is overwritten by the solution. !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (N) !>
[out]	INFO	!> INFO is INTEGER !> On exit, INFO is set to !> 0: successful exit. !> 1: some diagonal 1 by 1 block has been perturbed by !> a small number SMIN to keep nonsingularity. !> 2: some diagonal 2 by 2 block has been perturbed by !> a small number in DLALN2 to keep nonsingularity. !> NOTE: In the interests of speed, this routine does not !> check the inputs for errors. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 163 of file dlaqtr.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      LOGICAL            LREAL, LTRAN
      INTEGER            INFO, LDT, N
      DOUBLE PRECISION   SCALE, W
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   B( * ), T( LDT, * ), WORK( * ), X( * )
*     ..
*
* =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d+0, one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            NOTRAN
      INTEGER            I, IERR, J, J1, J2, JNEXT, K, N1, N2
      DOUBLE PRECISION   BIGNUM, EPS, REC, SCALOC, SI, SMIN, SMINW,
     $                   SMLNUM, SR, TJJ, TMP, XJ, XMAX, XNORM, Z
*     ..
*     .. Local Arrays ..
      DOUBLE PRECISION   D( 2, 2 ), V( 2, 2 )
*     ..
*     .. External Functions ..
      INTEGER            IDAMAX
      DOUBLE PRECISION   DASUM, DDOT, DLAMCH, DLANGE
      EXTERNAL           idamax, dasum, ddot, dlamch, dlange
*     ..
*     .. External Subroutines ..
      EXTERNAL           daxpy, dladiv, dlaln2, dscal
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max
*     ..
*     .. Executable Statements ..
*
*     Do not test the input parameters for errors
*
      notran = .NOT.ltran
      info = 0
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Set constants to control overflow
*
      eps = dlamch( 'P' )
      smlnum = dlamch( 'S' ) / eps
      bignum = one / smlnum
*
      xnorm = dlange( 'M', n, n, t, ldt, d )
      IF( .NOT.lreal )
     $   xnorm = max( xnorm, abs( w ), dlange( 'M', n, 1, b, n, d ) )
      smin = max( smlnum, eps*xnorm )
*
*     Compute 1-norm of each column of strictly upper triangular
*     part of T to control overflow in triangular solver.
*
      work( 1 ) = zero
      DO 10 j = 2, n
         work( j ) = dasum( j-1, t( 1, j ), 1 )
   10 CONTINUE
*
      IF( .NOT.lreal ) THEN
         DO 20 i = 2, n
            work( i ) = work( i ) + abs( b( i ) )
   20    CONTINUE
      END IF
*
      n2 = 2*n
      n1 = n
      IF( .NOT.lreal )
     $   n1 = n2
      k = idamax( n1, x, 1 )
      xmax = abs( x( k ) )
      scale = one
*
      IF( xmax.GT.bignum ) THEN
         scale = bignum / xmax
         CALL dscal( n1, scale, x, 1 )
         xmax = bignum
      END IF
*
      IF( lreal ) THEN
*
         IF( notran ) THEN
*
*           Solve T*p = scale*c
*
            jnext = n
            DO 30 j = n, 1, -1
               IF( j.GT.jnext )
     $            GO TO 30
               j1 = j
               j2 = j
               jnext = j - 1
               IF( j.GT.1 ) THEN
                  IF( t( j, j-1 ).NE.zero ) THEN
                     j1 = j - 1
                     jnext = j - 2
                  END IF
               END IF
*
               IF( j1.EQ.j2 ) THEN
*
*                 Meet 1 by 1 diagonal block
*
*                 Scale to avoid overflow when computing
*                     x(j) = b(j)/T(j,j)
*
                  xj = abs( x( j1 ) )
                  tjj = abs( t( j1, j1 ) )
                  tmp = t( j1, j1 )
                  IF( tjj.LT.smin ) THEN
                     tmp = smin
                     tjj = smin
                     info = 1
                  END IF
*
                  IF( xj.EQ.zero )
     $               GO TO 30
*
                  IF( tjj.LT.one ) THEN
                     IF( xj.GT.bignum*tjj ) THEN
                        rec = one / xj
                        CALL dscal( n, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                  END IF
                  x( j1 ) = x( j1 ) / tmp
                  xj = abs( x( j1 ) )
*
*                 Scale x if necessary to avoid overflow when adding a
*                 multiple of column j1 of T.
*
                  IF( xj.GT.one ) THEN
                     rec = one / xj
                     IF( work( j1 ).GT.( bignum-xmax )*rec ) THEN
                        CALL dscal( n, rec, x, 1 )
                        scale = scale*rec
                     END IF
                  END IF
                  IF( j1.GT.1 ) THEN
                     CALL daxpy( j1-1, -x( j1 ), t( 1, j1 ), 1, x, 1 )
                     k = idamax( j1-1, x, 1 )
                     xmax = abs( x( k ) )
                  END IF
*
               ELSE
*
*                 Meet 2 by 2 diagonal block
*
*                 Call 2 by 2 linear system solve, to take
*                 care of possible overflow by scaling factor.
*
                  d( 1, 1 ) = x( j1 )
                  d( 2, 1 ) = x( j2 )
                  CALL dlaln2( .false., 2, 1, smin, one, t( j1, j1 ),
     $                         ldt, one, one, d, 2, zero, zero, v, 2,
     $                         scaloc, xnorm, ierr )
                  IF( ierr.NE.0 )
     $               info = 2
*
                  IF( scaloc.NE.one ) THEN
                     CALL dscal( n, scaloc, x, 1 )
                     scale = scale*scaloc
                  END IF
                  x( j1 ) = v( 1, 1 )
                  x( j2 ) = v( 2, 1 )
*
*                 Scale V(1,1) (= X(J1)) and/or V(2,1) (=X(J2))
*                 to avoid overflow in updating right-hand side.
*
                  xj = max( abs( v( 1, 1 ) ), abs( v( 2, 1 ) ) )
                  IF( xj.GT.one ) THEN
                     rec = one / xj
                     IF( max( work( j1 ), work( j2 ) ).GT.
     $                   ( bignum-xmax )*rec ) THEN
                        CALL dscal( n, rec, x, 1 )
                        scale = scale*rec
                     END IF
                  END IF
*
*                 Update right-hand side
*
                  IF( j1.GT.1 ) THEN
                     CALL daxpy( j1-1, -x( j1 ), t( 1, j1 ), 1, x, 1 )
                     CALL daxpy( j1-1, -x( j2 ), t( 1, j2 ), 1, x, 1 )
                     k = idamax( j1-1, x, 1 )
                     xmax = abs( x( k ) )
                  END IF
*
               END IF
*
   30       CONTINUE
*
         ELSE
*
*           Solve T**T*p = scale*c
*
            jnext = 1
            DO 40 j = 1, n
               IF( j.LT.jnext )
     $            GO TO 40
               j1 = j
               j2 = j
               jnext = j + 1
               IF( j.LT.n ) THEN
                  IF( t( j+1, j ).NE.zero ) THEN
                     j2 = j + 1
                     jnext = j + 2
                  END IF
               END IF
*
               IF( j1.EQ.j2 ) THEN
*
*                 1 by 1 diagonal block
*
*                 Scale if necessary to avoid overflow in forming the
*                 right-hand side element by inner product.
*
                  xj = abs( x( j1 ) )
                  IF( xmax.GT.one ) THEN
                     rec = one / xmax
                     IF( work( j1 ).GT.( bignum-xj )*rec ) THEN
                        CALL dscal( n, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                  END IF
*
                  x( j1 ) = x( j1 ) - ddot( j1-1, t( 1, j1 ), 1, x, 1 )
*
                  xj = abs( x( j1 ) )
                  tjj = abs( t( j1, j1 ) )
                  tmp = t( j1, j1 )
                  IF( tjj.LT.smin ) THEN
                     tmp = smin
                     tjj = smin
                     info = 1
                  END IF
*
                  IF( tjj.LT.one ) THEN
                     IF( xj.GT.bignum*tjj ) THEN
                        rec = one / xj
                        CALL dscal( n, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                  END IF
                  x( j1 ) = x( j1 ) / tmp
                  xmax = max( xmax, abs( x( j1 ) ) )
*
               ELSE
*
*                 2 by 2 diagonal block
*
*                 Scale if necessary to avoid overflow in forming the
*                 right-hand side elements by inner product.
*
                  xj = max( abs( x( j1 ) ), abs( x( j2 ) ) )
                  IF( xmax.GT.one ) THEN
                     rec = one / xmax
                     IF( max( work( j2 ), work( j1 ) ).GT.( bignum-xj )*
     $                   rec ) THEN
                        CALL dscal( n, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                  END IF
*
                  d( 1, 1 ) = x( j1 ) - ddot( j1-1, t( 1, j1 ), 1, x,
     $                        1 )
                  d( 2, 1 ) = x( j2 ) - ddot( j1-1, t( 1, j2 ), 1, x,
     $                        1 )
*
                  CALL dlaln2( .true., 2, 1, smin, one, t( j1, j1 ),
     $                         ldt, one, one, d, 2, zero, zero, v, 2,
     $                         scaloc, xnorm, ierr )
                  IF( ierr.NE.0 )
     $               info = 2
*
                  IF( scaloc.NE.one ) THEN
                     CALL dscal( n, scaloc, x, 1 )
                     scale = scale*scaloc
                  END IF
                  x( j1 ) = v( 1, 1 )
                  x( j2 ) = v( 2, 1 )
                  xmax = max( abs( x( j1 ) ), abs( x( j2 ) ), xmax )
*
               END IF
   40       CONTINUE
         END IF
*
      ELSE
*
         sminw = max( eps*abs( w ), smin )
         IF( notran ) THEN
*
*           Solve (T + iB)*(p+iq) = c+id
*
            jnext = n
            DO 70 j = n, 1, -1
               IF( j.GT.jnext )
     $            GO TO 70
               j1 = j
               j2 = j
               jnext = j - 1
               IF( j.GT.1 ) THEN
                  IF( t( j, j-1 ).NE.zero ) THEN
                     j1 = j - 1
                     jnext = j - 2
                  END IF
               END IF
*
               IF( j1.EQ.j2 ) THEN
*
*                 1 by 1 diagonal block
*
*                 Scale if necessary to avoid overflow in division
*
                  z = w
                  IF( j1.EQ.1 )
     $               z = b( 1 )
                  xj = abs( x( j1 ) ) + abs( x( n+j1 ) )
                  tjj = abs( t( j1, j1 ) ) + abs( z )
                  tmp = t( j1, j1 )
                  IF( tjj.LT.sminw ) THEN
                     tmp = sminw
                     tjj = sminw
                     info = 1
                  END IF
*
                  IF( xj.EQ.zero )
     $               GO TO 70
*
                  IF( tjj.LT.one ) THEN
                     IF( xj.GT.bignum*tjj ) THEN
                        rec = one / xj
                        CALL dscal( n2, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                  END IF
                  CALL dladiv( x( j1 ), x( n+j1 ), tmp, z, sr, si )
                  x( j1 ) = sr
                  x( n+j1 ) = si
                  xj = abs( x( j1 ) ) + abs( x( n+j1 ) )
*
*                 Scale x if necessary to avoid overflow when adding a
*                 multiple of column j1 of T.
*
                  IF( xj.GT.one ) THEN
                     rec = one / xj
                     IF( work( j1 ).GT.( bignum-xmax )*rec ) THEN
                        CALL dscal( n2, rec, x, 1 )
                        scale = scale*rec
                     END IF
                  END IF
*
                  IF( j1.GT.1 ) THEN
                     CALL daxpy( j1-1, -x( j1 ), t( 1, j1 ), 1, x, 1 )
                     CALL daxpy( j1-1, -x( n+j1 ), t( 1, j1 ), 1,
     $                           x( n+1 ), 1 )
*
                     x( 1 ) = x( 1 ) + b( j1 )*x( n+j1 )
                     x( n+1 ) = x( n+1 ) - b( j1 )*x( j1 )
*
                     xmax = zero
                     DO 50 k = 1, j1 - 1
                        xmax = max( xmax, abs( x( k ) )+
     $                         abs( x( k+n ) ) )
   50                CONTINUE
                  END IF
*
               ELSE
*
*                 Meet 2 by 2 diagonal block
*
                  d( 1, 1 ) = x( j1 )
                  d( 2, 1 ) = x( j2 )
                  d( 1, 2 ) = x( n+j1 )
                  d( 2, 2 ) = x( n+j2 )
                  CALL dlaln2( .false., 2, 2, sminw, one, t( j1, j1 ),
     $                         ldt, one, one, d, 2, zero, -w, v, 2,
     $                         scaloc, xnorm, ierr )
                  IF( ierr.NE.0 )
     $               info = 2
*
                  IF( scaloc.NE.one ) THEN
                     CALL dscal( 2*n, scaloc, x, 1 )
                     scale = scaloc*scale
                  END IF
                  x( j1 ) = v( 1, 1 )
                  x( j2 ) = v( 2, 1 )
                  x( n+j1 ) = v( 1, 2 )
                  x( n+j2 ) = v( 2, 2 )
*
*                 Scale X(J1), .... to avoid overflow in
*                 updating right hand side.
*
                  xj = max( abs( v( 1, 1 ) )+abs( v( 1, 2 ) ),
     $                 abs( v( 2, 1 ) )+abs( v( 2, 2 ) ) )
                  IF( xj.GT.one ) THEN
                     rec = one / xj
                     IF( max( work( j1 ), work( j2 ) ).GT.
     $                   ( bignum-xmax )*rec ) THEN
                        CALL dscal( n2, rec, x, 1 )
                        scale = scale*rec
                     END IF
                  END IF
*
*                 Update the right-hand side.
*
                  IF( j1.GT.1 ) THEN
                     CALL daxpy( j1-1, -x( j1 ), t( 1, j1 ), 1, x, 1 )
                     CALL daxpy( j1-1, -x( j2 ), t( 1, j2 ), 1, x, 1 )
*
                     CALL daxpy( j1-1, -x( n+j1 ), t( 1, j1 ), 1,
     $                           x( n+1 ), 1 )
                     CALL daxpy( j1-1, -x( n+j2 ), t( 1, j2 ), 1,
     $                           x( n+1 ), 1 )
*
                     x( 1 ) = x( 1 ) + b( j1 )*x( n+j1 ) +
     $                        b( j2 )*x( n+j2 )
                     x( n+1 ) = x( n+1 ) - b( j1 )*x( j1 ) -
     $                          b( j2 )*x( j2 )
*
                     xmax = zero
                     DO 60 k = 1, j1 - 1
                        xmax = max( abs( x( k ) )+abs( x( k+n ) ),
     $                         xmax )
   60                CONTINUE
                  END IF
*
               END IF
   70       CONTINUE
*
         ELSE
*
*           Solve (T + iB)**T*(p+iq) = c+id
*
            jnext = 1
            DO 80 j = 1, n
               IF( j.LT.jnext )
     $            GO TO 80
               j1 = j
               j2 = j
               jnext = j + 1
               IF( j.LT.n ) THEN
                  IF( t( j+1, j ).NE.zero ) THEN
                     j2 = j + 1
                     jnext = j + 2
                  END IF
               END IF
*
               IF( j1.EQ.j2 ) THEN
*
*                 1 by 1 diagonal block
*
*                 Scale if necessary to avoid overflow in forming the
*                 right-hand side element by inner product.
*
                  xj = abs( x( j1 ) ) + abs( x( j1+n ) )
                  IF( xmax.GT.one ) THEN
                     rec = one / xmax
                     IF( work( j1 ).GT.( bignum-xj )*rec ) THEN
                        CALL dscal( n2, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                  END IF
*
                  x( j1 ) = x( j1 ) - ddot( j1-1, t( 1, j1 ), 1, x, 1 )
                  x( n+j1 ) = x( n+j1 ) - ddot( j1-1, t( 1, j1 ), 1,
     $                        x( n+1 ), 1 )
                  IF( j1.GT.1 ) THEN
                     x( j1 ) = x( j1 ) - b( j1 )*x( n+1 )
                     x( n+j1 ) = x( n+j1 ) + b( j1 )*x( 1 )
                  END IF
                  xj = abs( x( j1 ) ) + abs( x( j1+n ) )
*
                  z = w
                  IF( j1.EQ.1 )
     $               z = b( 1 )
*
*                 Scale if necessary to avoid overflow in
*                 complex division
*
                  tjj = abs( t( j1, j1 ) ) + abs( z )
                  tmp = t( j1, j1 )
                  IF( tjj.LT.sminw ) THEN
                     tmp = sminw
                     tjj = sminw
                     info = 1
                  END IF
*
                  IF( tjj.LT.one ) THEN
                     IF( xj.GT.bignum*tjj ) THEN
                        rec = one / xj
                        CALL dscal( n2, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                  END IF
                  CALL dladiv( x( j1 ), x( n+j1 ), tmp, -z, sr, si )
                  x( j1 ) = sr
                  x( j1+n ) = si
                  xmax = max( abs( x( j1 ) )+abs( x( j1+n ) ), xmax )
*
               ELSE
*
*                 2 by 2 diagonal block
*
*                 Scale if necessary to avoid overflow in forming the
*                 right-hand side element by inner product.
*
                  xj = max( abs( x( j1 ) )+abs( x( n+j1 ) ),
     $                 abs( x( j2 ) )+abs( x( n+j2 ) ) )
                  IF( xmax.GT.one ) THEN
                     rec = one / xmax
                     IF( max( work( j1 ), work( j2 ) ).GT.
     $                   ( bignum-xj ) / xmax ) THEN
                        CALL dscal( n2, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                  END IF
*
                  d( 1, 1 ) = x( j1 ) - ddot( j1-1, t( 1, j1 ), 1, x,
     $                        1 )
                  d( 2, 1 ) = x( j2 ) - ddot( j1-1, t( 1, j2 ), 1, x,
     $                        1 )
                  d( 1, 2 ) = x( n+j1 ) - ddot( j1-1, t( 1, j1 ), 1,
     $                        x( n+1 ), 1 )
                  d( 2, 2 ) = x( n+j2 ) - ddot( j1-1, t( 1, j2 ), 1,
     $                        x( n+1 ), 1 )
                  d( 1, 1 ) = d( 1, 1 ) - b( j1 )*x( n+1 )
                  d( 2, 1 ) = d( 2, 1 ) - b( j2 )*x( n+1 )
                  d( 1, 2 ) = d( 1, 2 ) + b( j1 )*x( 1 )
                  d( 2, 2 ) = d( 2, 2 ) + b( j2 )*x( 1 )
*
                  CALL dlaln2( .true., 2, 2, sminw, one, t( j1, j1 ),
     $                         ldt, one, one, d, 2, zero, w, v, 2,
     $                         scaloc, xnorm, ierr )
                  IF( ierr.NE.0 )
     $               info = 2
*
                  IF( scaloc.NE.one ) THEN
                     CALL dscal( n2, scaloc, x, 1 )
                     scale = scaloc*scale
                  END IF
                  x( j1 ) = v( 1, 1 )
                  x( j2 ) = v( 2, 1 )
                  x( n+j1 ) = v( 1, 2 )
                  x( n+j2 ) = v( 2, 2 )
                  xmax = max( abs( x( j1 ) )+abs( x( n+j1 ) ),
     $                   abs( x( j2 ) )+abs( x( n+j2 ) ), xmax )
*
               END IF
*
   80       CONTINUE
*
         END IF
*
      END IF
*
      RETURN
*
*     End of DLAQTR
*

◆ dlar1v()

subroutine dlar1v	(	integer	n,
		integer	b1,
		integer	bn,
		double precision	lambda,
		double precision, dimension( * )	d,
		double precision, dimension( * )	l,
		double precision, dimension( * )	ld,
		double precision, dimension( * )	lld,
		double precision	pivmin,
		double precision	gaptol,
		double precision, dimension( * )	z,
		logical	wantnc,
		integer	negcnt,
		double precision	ztz,
		double precision	mingma,
		integer	r,
		integer, dimension( * )	isuppz,
		double precision	nrminv,
		double precision	resid,
		double precision	rqcorr,
		double precision, dimension( * )	work )

DLAR1V computes the (scaled) r-th column of the inverse of the submatrix in rows b1 through bn of the tridiagonal matrix L D L**T - λI.

Download DLAR1V + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAR1V computes the (scaled) r-th column of the inverse of
!> the submatrix in rows B1 through BN of the tridiagonal matrix
!> L D L**T - sigma I. When sigma is close to an eigenvalue, the
!> computed vector is an accurate eigenvector. Usually, r corresponds
!> to the index where the eigenvector is largest in magnitude.
!> The following steps accomplish this computation :
!> (a) Stationary qd transform,  L D L**T - sigma I = L(+) D(+) L(+)**T,
!> (b) Progressive qd transform, L D L**T - sigma I = U(-) D(-) U(-)**T,
!> (c) Computation of the diagonal elements of the inverse of
!>     L D L**T - sigma I by combining the above transforms, and choosing
!>     r as the index where the diagonal of the inverse is (one of the)
!>     largest in magnitude.
!> (d) Computation of the (scaled) r-th column of the inverse using the
!>     twisted factorization obtained by combining the top part of
!>     the stationary and the bottom part of the progressive transform.
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the matrix L D L**T. !>
[in]	B1	!> B1 is INTEGER !> First index of the submatrix of L D L**T. !>
[in]	BN	!> BN is INTEGER !> Last index of the submatrix of L D L**T. !>
[in]	LAMBDA	!> LAMBDA is DOUBLE PRECISION !> The shift. In order to compute an accurate eigenvector, !> LAMBDA should be a good approximation to an eigenvalue !> of L D L**T. !>
[in]	L	!> L is DOUBLE PRECISION array, dimension (N-1) !> The (n-1) subdiagonal elements of the unit bidiagonal matrix !> L, in elements 1 to N-1. !>
[in]	D	!> D is DOUBLE PRECISION array, dimension (N) !> The n diagonal elements of the diagonal matrix D. !>
[in]	LD	!> LD is DOUBLE PRECISION array, dimension (N-1) !> The n-1 elements L(i)*D(i). !>
[in]	LLD	!> LLD is DOUBLE PRECISION array, dimension (N-1) !> The n-1 elements L(i)*L(i)*D(i). !>
[in]	PIVMIN	!> PIVMIN is DOUBLE PRECISION !> The minimum pivot in the Sturm sequence. !>
[in]	GAPTOL	!> GAPTOL is DOUBLE PRECISION !> Tolerance that indicates when eigenvector entries are negligible !> w.r.t. their contribution to the residual. !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, dimension (N) !> On input, all entries of Z must be set to 0. !> On output, Z contains the (scaled) r-th column of the !> inverse. The scaling is such that Z(R) equals 1. !>
[in]	WANTNC	!> WANTNC is LOGICAL !> Specifies whether NEGCNT has to be computed. !>
[out]	NEGCNT	!> NEGCNT is INTEGER !> If WANTNC is .TRUE. then NEGCNT = the number of pivots < pivmin !> in the matrix factorization L D L**T, and NEGCNT = -1 otherwise. !>
[out]	ZTZ	!> ZTZ is DOUBLE PRECISION !> The square of the 2-norm of Z. !>
[out]	MINGMA	!> MINGMA is DOUBLE PRECISION !> The reciprocal of the largest (in magnitude) diagonal !> element of the inverse of L D L**T - sigma I. !>
[in,out]	R	!> R is INTEGER !> The twist index for the twisted factorization used to !> compute Z. !> On input, 0 <= R <= N. If R is input as 0, R is set to !> the index where (L D L**T - sigma I)^{-1} is largest !> in magnitude. If 1 <= R <= N, R is unchanged. !> On output, R contains the twist index used to compute Z. !> Ideally, R designates the position of the maximum entry in the !> eigenvector. !>
[out]	ISUPPZ	!> ISUPPZ is INTEGER array, dimension (2) !> The support of the vector in Z, i.e., the vector Z is !> nonzero only in elements ISUPPZ(1) through ISUPPZ( 2 ). !>
[out]	NRMINV	!> NRMINV is DOUBLE PRECISION !> NRMINV = 1/SQRT( ZTZ ) !>
[out]	RESID	!> RESID is DOUBLE PRECISION !> The residual of the FP vector. !> RESID = ABS( MINGMA )/SQRT( ZTZ ) !>
[out]	RQCORR	!> RQCORR is DOUBLE PRECISION !> The Rayleigh Quotient correction to LAMBDA. !> RQCORR = MINGMA*TMP !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (4*N) !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Beresford Parlett, University of California, Berkeley, USA
Jim Demmel, University of California, Berkeley, USA
Inderjit Dhillon, University of Texas, Austin, USA
Osni Marques, LBNL/NERSC, USA
Christof Voemel, University of California, Berkeley, USA

Definition at line 227 of file dlar1v.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Overview of this body:
*       1. run a forward ("stationary") recurrence from B1 and a
*          backward ("progressive") recurrence from BN, storing the
*          intermediate quantities in WORK;
*       2. pick the twist index R (if R was 0 on entry) as the index
*          in B1..BN where the sum of both recurrences is smallest in
*          magnitude, and return that sum in MINGMA;
*       3. build Z with Z( R ) = 1 by running upwards and downwards
*          from R, truncating the support (ISUPPZ) once entries fall
*          below the GAPTOL test;
*       4. return ZTZ, NRMINV, RESID and RQCORR derived from Z and
*          MINGMA.
*     Each recurrence is first run without safeguards; if the result
*     is NaN it is re-run with pivots clamped to -PIVMIN.
*
*     .. Scalar Arguments ..
      LOGICAL            WANTNC
      INTEGER   B1, BN, N, NEGCNT, R
      DOUBLE PRECISION   GAPTOL, LAMBDA, MINGMA, NRMINV, PIVMIN, RESID,
     $                   RQCORR, ZTZ
*     ..
*     .. Array Arguments ..
      INTEGER            ISUPPZ( * )
      DOUBLE PRECISION   D( * ), L( * ), LD( * ), LLD( * ),
     $                  WORK( * )
      DOUBLE PRECISION Z( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d0, one = 1.0d0 )
 
*     ..
*     .. Local Scalars ..
*     SAWNAN1/SAWNAN2 record whether the forward/backward recurrence
*     produced a NaN; NEG1/NEG2 count negative pivots seen in each.
      LOGICAL            SAWNAN1, SAWNAN2
      INTEGER            I, INDLPL, INDP, INDS, INDUMN, NEG1, NEG2, R1,
     $                   R2
      DOUBLE PRECISION   DMINUS, DPLUS, EPS, S, TMP
*     ..
*     .. External Functions ..
      LOGICAL DISNAN
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           disnan, dlamch
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs
*     ..
*     .. Executable Statements ..
*
      eps = dlamch( 'Precision' )
 
 
*     R = 0 on entry means "search B1..BN for the twist index";
*     otherwise the search range collapses to the single index R.
      IF( r.EQ.0 ) THEN
         r1 = b1
         r2 = bn
      ELSE
         r1 = r
         r2 = r
      END IF
 
*     WORK is used as four consecutive segments addressed by offset:
*     Storage for LPLUS
      indlpl = 0
*     Storage for UMINUS
      indumn = n
*     Storage for the S values of the stationary recurrence and for
*     the P values of the progressive recurrence
      inds = 2*n + 1
      indp = 3*n + 1
 
*     Seed value of the stationary recurrence at the top of the block.
      IF( b1.EQ.1 ) THEN
         work( inds ) = zero
      ELSE
         work( inds+b1-1 ) = lld( b1-1 )
      END IF
 
*
*     Compute the stationary transform (using the differential form)
*     until the index R2.
*
      sawnan1 = .false.
      neg1 = 0
      s = work( inds+b1-1 ) - lambda
*     Indices B1..R1-1: negative pivots DPLUS are counted in NEG1.
      DO 50 i = b1, r1 - 1
         dplus = d( i ) + s
         work( indlpl+i ) = ld( i ) / dplus
         IF(dplus.LT.zero) neg1 = neg1 + 1
         work( inds+i ) = s*work( indlpl+i )*l( i )
         s = work( inds+i ) - lambda
 50   CONTINUE
      sawnan1 = disnan( s )
      IF( sawnan1 ) GOTO 60
*     Indices R1..R2-1: same recurrence, but pivots are not counted.
      DO 51 i = r1, r2 - 1
         dplus = d( i ) + s
         work( indlpl+i ) = ld( i ) / dplus
         work( inds+i ) = s*work( indlpl+i )*l( i )
         s = work( inds+i ) - lambda
 51   CONTINUE
      sawnan1 = disnan( s )
*
 60   CONTINUE
      IF( sawnan1 ) THEN
*        Runs a slower version of the above loop if a NaN is detected
*        Pivots smaller than PIVMIN in magnitude are replaced by
*        -PIVMIN, and where the LPLUS entry is exactly zero the S
*        value is reset to LLD( I ).
         neg1 = 0
         s = work( inds+b1-1 ) - lambda
         DO 70 i = b1, r1 - 1
            dplus = d( i ) + s
            IF(abs(dplus).LT.pivmin) dplus = -pivmin
            work( indlpl+i ) = ld( i ) / dplus
            IF(dplus.LT.zero) neg1 = neg1 + 1
            work( inds+i ) = s*work( indlpl+i )*l( i )
            IF( work( indlpl+i ).EQ.zero )
     $                      work( inds+i ) = lld( i )
            s = work( inds+i ) - lambda
 70      CONTINUE
         DO 71 i = r1, r2 - 1
            dplus = d( i ) + s
            IF(abs(dplus).LT.pivmin) dplus = -pivmin
            work( indlpl+i ) = ld( i ) / dplus
            work( inds+i ) = s*work( indlpl+i )*l( i )
            IF( work( indlpl+i ).EQ.zero )
     $                      work( inds+i ) = lld( i )
            s = work( inds+i ) - lambda
 71      CONTINUE
      END IF
*
*     Compute the progressive transform (using the differential form)
*     until the index R1
*
      sawnan2 = .false.
      neg2 = 0
      work( indp+bn-1 ) = d( bn ) - lambda
*     Runs from BN-1 down to R1; negative pivots DMINUS are counted
*     in NEG2.
      DO 80 i = bn - 1, r1, -1
         dminus = lld( i ) + work( indp+i )
         tmp = d( i ) / dminus
         IF(dminus.LT.zero) neg2 = neg2 + 1
         work( indumn+i ) = l( i )*tmp
         work( indp+i-1 ) = work( indp+i )*tmp - lambda
 80   CONTINUE
*     Only the last P value produced is tested for NaN.
      tmp = work( indp+r1-1 )
      sawnan2 = disnan( tmp )
 
      IF( sawnan2 ) THEN
*        Runs a slower version of the above loop if a NaN is detected
*        Same safeguards as for the stationary transform: clamp small
*        pivots to -PIVMIN and restart the P value from
*        D( I ) - LAMBDA when the quotient TMP is exactly zero.
         neg2 = 0
         DO 100 i = bn-1, r1, -1
            dminus = lld( i ) + work( indp+i )
            IF(abs(dminus).LT.pivmin) dminus = -pivmin
            tmp = d( i ) / dminus
            IF(dminus.LT.zero) neg2 = neg2 + 1
            work( indumn+i ) = l( i )*tmp
            work( indp+i-1 ) = work( indp+i )*tmp - lambda
            IF( tmp.EQ.zero )
     $          work( indp+i-1 ) = d( i ) - lambda
 100     CONTINUE
      END IF
*
*     Find the index (from R1 to R2) of the largest (in magnitude)
*     diagonal element of the inverse
*
*     MINGMA starts as the S+P sum at R1; a negative value counts as
*     one more negative pivot.  NEGCNT is only reported when WANTNC
*     is set, otherwise it is -1.
      mingma = work( inds+r1-1 ) + work( indp+r1-1 )
      IF( mingma.LT.zero ) neg1 = neg1 + 1
      IF( wantnc ) THEN
         negcnt = neg1 + neg2
      ELSE
         negcnt = -1
      ENDIF
*     An exactly zero sum is replaced by EPS times the S value.
      IF( abs(mingma).EQ.zero )
     $   mingma = eps*work( inds+r1-1 )
      r = r1
*     Scan the remaining candidates; because the comparison is .LE.,
*     ties in magnitude move R to the later index.
      DO 110 i = r1, r2 - 1
         tmp = work( inds+i ) + work( indp+i )
         IF( tmp.EQ.zero )
     $      tmp = eps*work( inds+i )
         IF( abs( tmp ).LE.abs( mingma ) ) THEN
            mingma = tmp
            r = i + 1
         END IF
 110  CONTINUE
*
*     Compute the FP vector: solve N^T v = e_r
*
*     The support defaults to the whole block B1..BN and is narrowed
*     below if the GAPTOL test cuts the recurrences short.
      isuppz( 1 ) = b1
      isuppz( 2 ) = bn
      z( r ) = one
      ztz = one
*
*     Compute the FP vector upwards from R
*
      IF( .NOT.sawnan1 .AND. .NOT.sawnan2 ) THEN
         DO 210 i = r-1, b1, -1
            z( i ) = -( work( indlpl+i )*z( i+1 ) )
*           Stop once two neighbouring entries, weighted by
*           ABS( LD( I ) ), fall below GAPTOL: zero the entry and
*           record where the support starts.
            IF( (abs(z(i))+abs(z(i+1)))* abs(ld(i)).LT.gaptol )
     $           THEN
               z( i ) = zero
               isuppz( 1 ) = i + 1
               GOTO 220
            ENDIF
            ztz = ztz + z( i )*z( i )
 210     CONTINUE
 220     CONTINUE
      ELSE
*        Run slower loop if NaN occurred.
*        When the previous entry is exactly zero the update uses
*        Z( I+2 ) and the ratio LD( I+1 ) / LD( I ) instead of the
*        stored LPLUS value.
         DO 230 i = r - 1, b1, -1
            IF( z( i+1 ).EQ.zero ) THEN
               z( i ) = -( ld( i+1 ) / ld( i ) )*z( i+2 )
            ELSE
               z( i ) = -( work( indlpl+i )*z( i+1 ) )
            END IF
            IF( (abs(z(i))+abs(z(i+1)))* abs(ld(i)).LT.gaptol )
     $           THEN
               z( i ) = zero
               isuppz( 1 ) = i + 1
               GO TO 240
            END IF
            ztz = ztz + z( i )*z( i )
 230     CONTINUE
 240     CONTINUE
      ENDIF
 
*     Compute the FP vector downwards from R (one entry per
*     iteration, using the stored UMINUS values)
      IF( .NOT.sawnan1 .AND. .NOT.sawnan2 ) THEN
         DO 250 i = r, bn-1
            z( i+1 ) = -( work( indumn+i )*z( i ) )
*           Same GAPTOL cut-off as in the upward sweep; here it fixes
*           the end of the support.
            IF( (abs(z(i))+abs(z(i+1)))* abs(ld(i)).LT.gaptol )
     $         THEN
               z( i+1 ) = zero
               isuppz( 2 ) = i
               GO TO 260
            END IF
            ztz = ztz + z( i+1 )*z( i+1 )
 250     CONTINUE
 260     CONTINUE
      ELSE
*        Run slower loop if NaN occurred.
*        When the current entry is exactly zero the update uses
*        Z( I-1 ) and the ratio LD( I-1 ) / LD( I ) instead of the
*        stored UMINUS value.
         DO 270 i = r, bn - 1
            IF( z( i ).EQ.zero ) THEN
               z( i+1 ) = -( ld( i-1 ) / ld( i ) )*z( i-1 )
            ELSE
               z( i+1 ) = -( work( indumn+i )*z( i ) )
            END IF
            IF( (abs(z(i))+abs(z(i+1)))* abs(ld(i)).LT.gaptol )
     $           THEN
               z( i+1 ) = zero
               isuppz( 2 ) = i
               GO TO 280
            END IF
            ztz = ztz + z( i+1 )*z( i+1 )
 270     CONTINUE
 280     CONTINUE
      END IF
*
*     Compute quantities for convergence test
*
*     ZTZ starts at one and only accumulates squares, so the
*     reciprocal below is formed from a value of at least one unless
*     a NaN has propagated into Z.
      tmp = one / ztz
      nrminv = sqrt( tmp )
      resid = abs( mingma )*nrminv
      rqcorr = mingma*tmp
*
*
      RETURN
*
*     End of DLAR1V
*

◆ dlar2v()

subroutine dlar2v	(	integer	n,
		double precision, dimension( * )	x,
		double precision, dimension( * )	y,
		double precision, dimension( * )	z,
		integer	incx,
		double precision, dimension( * )	c,
		double precision, dimension( * )	s,
		integer	incc )

DLAR2V applies a vector of plane rotations with real cosines and real sines from both sides to a sequence of 2-by-2 symmetric/Hermitian matrices.

Download DLAR2V + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAR2V applies a vector of real plane rotations from both sides to
!> a sequence of 2-by-2 real symmetric matrices, defined by the elements
!> of the vectors x, y and z. For i = 1,2,...,n
!>
!>    ( x(i)  z(i) ) := (  c(i)  s(i) ) ( x(i)  z(i) ) ( c(i) -s(i) )
!>    ( z(i)  y(i) )    ( -s(i)  c(i) ) ( z(i)  y(i) ) ( s(i)  c(i) )
!>

Parameters

[in]	N	!> N is INTEGER !> The number of plane rotations to be applied. !>
[in,out]	X	!> X is DOUBLE PRECISION array, !> dimension (1+(N-1)*INCX) !> The vector x. !>
[in,out]	Y	!> Y is DOUBLE PRECISION array, !> dimension (1+(N-1)*INCX) !> The vector y. !>
[in,out]	Z	!> Z is DOUBLE PRECISION array, !> dimension (1+(N-1)*INCX) !> The vector z. !>
[in]	INCX	!> INCX is INTEGER !> The increment between elements of X, Y and Z. INCX > 0. !>
[in]	C	!> C is DOUBLE PRECISION array, dimension (1+(N-1)*INCC) !> The cosines of the plane rotations. !>
[in]	S	!> S is DOUBLE PRECISION array, dimension (1+(N-1)*INCC) !> The sines of the plane rotations. !>
[in]	INCC	!> INCC is INTEGER !> The increment between elements of C and S. INCC > 0. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 109 of file dlar2v.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     For each of the N triples ( x, y, z ) the symmetric 2-by-2
*     matrix with diagonal ( x, y ) and off-diagonal z is overwritten
*     by its two-sided rotation, using the cosine/sine pair read from
*     C and S.  X, Y and Z are stepped by INCX, C and S by INCC.
*
*     .. Scalar Arguments ..
      INTEGER            INCC, INCX, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   C( * ), S( * ), X( * ), Y( * ), Z( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
*     JX / JC are the running positions in X,Y,Z and in C,S.
      INTEGER            J, JC, JX
      DOUBLE PRECISION   CS, SN, XJ, YJ, ZJ
      DOUBLE PRECISION   SNZ, CSZ, RZX, RZY, RXZ, RYZ
*     ..
*     .. Executable Statements ..
*
      jx = 1
      jc = 1
      DO j = 1, n
*
*        Fetch the rotation and the three matrix entries before any
*        of them is overwritten.
*
         cs = c( jc )
         sn = s( jc )
         xj = x( jx )
         yj = y( jx )
         zj = z( jx )
*
*        Shared products and the four intermediate combinations.
*
         snz = sn*zj
         csz = cs*zj
         rzx = csz - sn*xj
         rzy = csz + sn*yj
         rxz = cs*xj + snz
         ryz = cs*yj - snz
*
*        Store the rotated entries.
*
         x( jx ) = cs*rxz + sn*rzy
         y( jx ) = cs*ryz - sn*rzx
         z( jx ) = cs*rzy - sn*rxz
*
         jc = jc + incc
         jx = jx + incx
      END DO
*
*     End of DLAR2V
*
      RETURN

◆ dlarf()

subroutine dlarf	(	character	side,
		integer	m,
		integer	n,
		double precision, dimension( * )	v,
		integer	incv,
		double precision	tau,
		double precision, dimension( ldc, * )	c,
		integer	ldc,
		double precision, dimension( * )	work )

DLARF applies an elementary reflector to a general rectangular matrix.

Download DLARF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLARF applies a real elementary reflector H to a real m by n matrix
!> C, from either the left or the right. H is represented in the form
!>
!>       H = I - tau * v * v**T
!>
!> where tau is a real scalar and v is a real vector.
!>
!> If tau = 0, then H is taken to be the unit matrix.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': form H * C !> = 'R': form C * H !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. !>
[in]	V	!> V is DOUBLE PRECISION array, dimension !> (1 + (M-1)*abs(INCV)) if SIDE = 'L' !> or (1 + (N-1)*abs(INCV)) if SIDE = 'R' !> The vector v in the representation of H. V is not used if !> TAU = 0. !>
[in]	INCV	!> INCV is INTEGER !> The increment between elements of v. INCV <> 0. !>
[in]	TAU	!> TAU is DOUBLE PRECISION !> The value tau in the representation of H. !>
[in,out]	C	!> C is DOUBLE PRECISION array, dimension (LDC,N) !> On entry, the m by n matrix C. !> On exit, C is overwritten by the matrix H * C if SIDE = 'L', !> or C * H if SIDE = 'R'. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension !> (N) if SIDE = 'L' !> or (M) if SIDE = 'R' !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 123 of file dlarf.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Applies H = I - tau*v*v**T to the m-by-n matrix C in place:
*     C := H*C when SIDE = 'L', C := C*H otherwise.  Trailing zeros
*     of v are trimmed first (LASTV), and ILADLC / ILADLR are then
*     asked for the last non-zero column / row of the affected part of
*     C (LASTC), so the BLAS calls only touch what can change.  When
*     tau = 0, LASTV stays 0 and C is left untouched.
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE
      INTEGER            INCV, LDC, M, N
      DOUBLE PRECISION   TAU
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   C( LDC, * ), V( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, ZERO
      parameter( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            APPLYLEFT
      INTEGER            I, LASTV, LASTC
*     ..
*     .. External Subroutines ..
      EXTERNAL           dgemv, dger
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILADLR, ILADLC
      EXTERNAL           lsame, iladlr, iladlc
*     ..
*     .. Executable Statements ..
*
      applyleft = lsame( side, 'L' )
      lastv = 0
      lastc = 0
      IF( tau.NE.zero ) THEN
*
*        LASTV starts at the full length of v (M for a left
*        application, N for a right one) and I at the storage
*        position of that last logical element.
*
         IF( applyleft ) THEN
            lastv = m
         ELSE
            lastv = n
         END IF
         IF( incv.GT.0 ) THEN
            i = 1 + (lastv-1) * incv
         ELSE
            i = 1
         END IF
*
*        Look for the last non-zero row in V.  The element test is
*        kept out of the loop condition on purpose: Fortran does not
*        guarantee short-circuit evaluation of .AND., so testing
*        V( I ) together with LASTV.GT.0 could read outside V once
*        every element has turned out to be zero (or when the vector
*        is empty).
*
         DO WHILE( lastv.GT.0 )
            IF( v( i ).NE.zero ) EXIT
            lastv = lastv - 1
            i = i - incv
         END DO
         IF( applyleft ) THEN
*           Scan for the last non-zero column in C(1:lastv,:).
            lastc = iladlc(lastv, n, c, ldc)
         ELSE
*           Scan for the last non-zero row in C(:,1:lastv).
            lastc = iladlr(m, lastv, c, ldc)
         END IF
      END IF
*
*     Note that lastc.eq.0 renders the BLAS operations null; no special
*     case is needed at this level.
*
      IF( applyleft ) THEN
*
*        Form  H * C
*
         IF( lastv.GT.0 ) THEN
*
*           w(1:lastc,1) := C(1:lastv,1:lastc)**T * v(1:lastv,1)
*
            CALL dgemv( 'Transpose', lastv, lastc, one, c, ldc, v, incv,
     $           zero, work, 1 )
*
*           C(1:lastv,1:lastc) := C(...) - v(1:lastv,1) * w(1:lastc,1)**T
*
            CALL dger( lastv, lastc, -tau, v, incv, work, 1, c, ldc )
         END IF
      ELSE
*
*        Form  C * H
*
         IF( lastv.GT.0 ) THEN
*
*           w(1:lastc,1) := C(1:lastc,1:lastv) * v(1:lastv,1)
*
            CALL dgemv( 'No transpose', lastc, lastv, one, c, ldc,
     $           v, incv, zero, work, 1 )
*
*           C(1:lastc,1:lastv) := C(...) - w(1:lastc,1) * v(1:lastv,1)**T
*
            CALL dger( lastc, lastv, -tau, work, 1, v, incv, c, ldc )
         END IF
      END IF
      RETURN
*
*     End of DLARF
*

◆ dlarfb()

subroutine dlarfb	(	character	side,
		character	trans,
		character	direct,
		character	storev,
		integer	m,
		integer	n,
		integer	k,
		double precision, dimension( ldv, * )	v,
		integer	ldv,
		double precision, dimension( ldt, * )	t,
		integer	ldt,
		double precision, dimension( ldc, * )	c,
		integer	ldc,
		double precision, dimension( ldwork, * )	work,
		integer	ldwork )

DLARFB applies a block reflector or its transpose to a general rectangular matrix.

Download DLARFB + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLARFB applies a real block reflector H or its transpose H**T to a
!> real m by n matrix C, from either the left or the right.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply H or H**T from the Left !> = 'R': apply H or H**T from the Right !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': apply H (No transpose) !> = 'T': apply H**T (Transpose) !>
[in]	DIRECT	!> DIRECT is CHARACTER*1 !> Indicates how H is formed from a product of elementary !> reflectors !> = 'F': H = H(1) H(2) . . . H(k) (Forward) !> = 'B': H = H(k) . . . H(2) H(1) (Backward) !>
[in]	STOREV	!> STOREV is CHARACTER*1 !> Indicates how the vectors which define the elementary !> reflectors are stored: !> = 'C': Columnwise !> = 'R': Rowwise !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. !>
[in]	K	!> K is INTEGER !> The order of the matrix T (= the number of elementary !> reflectors whose product defines the block reflector). !> If SIDE = 'L', M >= K >= 0; !> if SIDE = 'R', N >= K >= 0. !>
[in]	V	!> V is DOUBLE PRECISION array, dimension !> (LDV,K) if STOREV = 'C' !> (LDV,M) if STOREV = 'R' and SIDE = 'L' !> (LDV,N) if STOREV = 'R' and SIDE = 'R' !> The matrix V. See Further Details. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of the array V. !> If STOREV = 'C' and SIDE = 'L', LDV >= max(1,M); !> if STOREV = 'C' and SIDE = 'R', LDV >= max(1,N); !> if STOREV = 'R', LDV >= K. !>
[in]	T	!> T is DOUBLE PRECISION array, dimension (LDT,K) !> The triangular k by k matrix T in the representation of the !> block reflector. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= K. !>
[in,out]	C	!> C is DOUBLE PRECISION array, dimension (LDC,N) !> On entry, the m by n matrix C. !> On exit, C is overwritten by H*C or H**T*C or C*H or C*H**T. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (LDWORK,K) !>
[in]	LDWORK	!> LDWORK is INTEGER !> The leading dimension of the array WORK. !> If SIDE = 'L', LDWORK >= max(1,N); !> if SIDE = 'R', LDWORK >= max(1,M). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The shape of the matrix V and the storage of the vectors which define
!>  the H(i) is best illustrated by the following example with n = 5 and
!>  k = 3. The elements equal to 1 are not stored; the corresponding
!>  array elements are modified but restored on exit. The rest of the
!>  array is not used.
!>
!>  DIRECT = 'F' and STOREV = 'C':         DIRECT = 'F' and STOREV = 'R':
!>
!>               V = (  1       )                 V = (  1 v1 v1 v1 v1 )
!>                   ( v1  1    )                     (     1 v2 v2 v2 )
!>                   ( v1 v2  1 )                     (        1 v3 v3 )
!>                   ( v1 v2 v3 )
!>                   ( v1 v2 v3 )
!>
!>  DIRECT = 'B' and STOREV = 'C':         DIRECT = 'B' and STOREV = 'R':
!>
!>               V = ( v1 v2 v3 )                 V = ( v1 v1  1       )
!>                   ( v1 v2 v3 )                     ( v2 v2 v2  1    )
!>                   (  1 v2 v3 )                     ( v3 v3 v3 v3  1 )
!>                   (     1 v3 )
!>                   (        1 )
!>

Definition at line 195 of file dlarfb.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Overview of the body below:
*       - C is updated in place; WORK holds the intermediate matrix W.
*       - W is stored as n-by-k when SIDE = 'L' and as m-by-k when
*         SIDE = 'R' (see the DCOPY calls that initialise it).
*       - Each STOREV / DIRECT / SIDE branch follows the same stages:
*         copy the K rows/columns of C that face the triangular part
*         of V into W, multiply by that triangular part (DTRMM), add
*         the contribution of the rectangular part of V (DGEMM),
*         multiply by T or T**T (DTRMM), then subtract the result
*         from C block by block.
*       - No argument validation is performed in this body.
*
*     .. Scalar Arguments ..
      CHARACTER          DIRECT, SIDE, STOREV, TRANS
      INTEGER            K, LDC, LDT, LDV, LDWORK, M, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   C( LDC, * ), T( LDT, * ), V( LDV, * ),
     $                   WORK( LDWORK, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE
      parameter( one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      CHARACTER          TRANST
      INTEGER            I, J
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dgemm, dtrmm
*     ..
*     .. Executable Statements ..
*
*     Quick return if possible
*     (C has no elements when M <= 0 or N <= 0, so nothing to update.)
*
      IF( m.LE.0 .OR. n.LE.0 )
     $   RETURN
*
*     TRANST is the opposite transpose flag to TRANS.  It is the flag
*     handed to DTRMM for T in the SIDE = 'L' branches, where W holds
*     the transposed product.  Any TRANS for which LSAME( TRANS, 'N' )
*     is false yields TRANST = 'N'.
*
      IF( lsame( trans, 'N' ) ) THEN
         transt = 'T'
      ELSE
         transt = 'N'
      END IF
*
      IF( lsame( storev, 'C' ) ) THEN
*
         IF( lsame( direct, 'F' ) ) THEN
*
*           Let  V =  ( V1 )    (first K rows)
*                     ( V2 )
*           where  V1  is unit lower triangular.
*
            IF( lsame( side, 'L' ) ) THEN
*
*              Form  H * C  or  H**T * C  where  C = ( C1 )
*                                                    ( C2 )
*
*              W := C**T * V  =  (C1**T * V1 + C2**T * V2)  (stored in WORK)
*
*              W := C1**T
*              (row j of C, read with stride LDC, becomes column j of W)
*
               DO 10 j = 1, k
                  CALL dcopy( n, c( j, 1 ), ldc, work( 1, j ), 1 )
   10          CONTINUE
*
*              W := W * V1
*
               CALL dtrmm( 'Right', 'Lower', 'No transpose', 'Unit', n,
     $                     k, one, v, ldv, work, ldwork )
               IF( m.GT.k ) THEN
*
*                 W := W + C2**T * V2
*
                  CALL dgemm( 'Transpose', 'No transpose', n, k, m-k,
     $                        one, c( k+1, 1 ), ldc, v( k+1, 1 ), ldv,
     $                        one, work, ldwork )
               END IF
*
*              W := W * T**T  or  W * T
*
               CALL dtrmm( 'Right', 'Upper', transt, 'Non-unit', n, k,
     $                     one, t, ldt, work, ldwork )
*
*              C := C - V * W**T
*
               IF( m.GT.k ) THEN
*
*                 C2 := C2 - V2 * W**T
*
                  CALL dgemm( 'No transpose', 'Transpose', m-k, n, k,
     $                        -one, v( k+1, 1 ), ldv, work, ldwork, one,
     $                        c( k+1, 1 ), ldc )
               END IF
*
*              W := W * V1**T
*
               CALL dtrmm( 'Right', 'Lower', 'Transpose', 'Unit', n, k,
     $                     one, v, ldv, work, ldwork )
*
*              C1 := C1 - W**T
*
               DO 30 j = 1, k
                  DO 20 i = 1, n
                     c( j, i ) = c( j, i ) - work( i, j )
   20             CONTINUE
   30          CONTINUE
*
            ELSE IF( lsame( side, 'R' ) ) THEN
*
*              Form  C * H  or  C * H**T  where  C = ( C1  C2 )
*
*              W := C * V  =  (C1*V1 + C2*V2)  (stored in WORK)
*
*              W := C1
*
               DO 40 j = 1, k
                  CALL dcopy( m, c( 1, j ), 1, work( 1, j ), 1 )
   40          CONTINUE
*
*              W := W * V1
*
               CALL dtrmm( 'Right', 'Lower', 'No transpose', 'Unit', m,
     $                     k, one, v, ldv, work, ldwork )
               IF( n.GT.k ) THEN
*
*                 W := W + C2 * V2
*
                  CALL dgemm( 'No transpose', 'No transpose', m, k, n-k,
     $                        one, c( 1, k+1 ), ldc, v( k+1, 1 ), ldv,
     $                        one, work, ldwork )
               END IF
*
*              W := W * T  or  W * T**T
*
               CALL dtrmm( 'Right', 'Upper', trans, 'Non-unit', m, k,
     $                     one, t, ldt, work, ldwork )
*
*              C := C - W * V**T
*
               IF( n.GT.k ) THEN
*
*                 C2 := C2 - W * V2**T
*
                  CALL dgemm( 'No transpose', 'Transpose', m, n-k, k,
     $                        -one, work, ldwork, v( k+1, 1 ), ldv, one,
     $                        c( 1, k+1 ), ldc )
               END IF
*
*              W := W * V1**T
*
               CALL dtrmm( 'Right', 'Lower', 'Transpose', 'Unit', m, k,
     $                     one, v, ldv, work, ldwork )
*
*              C1 := C1 - W
*
               DO 60 j = 1, k
                  DO 50 i = 1, m
                     c( i, j ) = c( i, j ) - work( i, j )
   50             CONTINUE
   60          CONTINUE
            END IF
*
         ELSE
*
*           (Reached for any DIRECT that does not match 'F'.)
*
*           Let  V =  ( V1 )
*                     ( V2 )    (last K rows)
*           where  V2  is unit upper triangular.
*
            IF( lsame( side, 'L' ) ) THEN
*
*              Form  H * C  or  H**T * C  where  C = ( C1 )
*                                                    ( C2 )
*
*              W := C**T * V  =  (C1**T * V1 + C2**T * V2)  (stored in WORK)
*
*              W := C2**T
*
               DO 70 j = 1, k
                  CALL dcopy( n, c( m-k+j, 1 ), ldc, work( 1, j ), 1 )
   70          CONTINUE
*
*              W := W * V2
*
               CALL dtrmm( 'Right', 'Upper', 'No transpose', 'Unit', n,
     $                     k, one, v( m-k+1, 1 ), ldv, work, ldwork )
               IF( m.GT.k ) THEN
*
*                 W := W + C1**T * V1
*
                  CALL dgemm( 'Transpose', 'No transpose', n, k, m-k,
     $                        one, c, ldc, v, ldv, one, work, ldwork )
               END IF
*
*              W := W * T**T  or  W * T
*              (T is referenced as lower triangular in this branch)
*
               CALL dtrmm( 'Right', 'Lower', transt, 'Non-unit', n, k,
     $                     one, t, ldt, work, ldwork )
*
*              C := C - V * W**T
*
               IF( m.GT.k ) THEN
*
*                 C1 := C1 - V1 * W**T
*
                  CALL dgemm( 'No transpose', 'Transpose', m-k, n, k,
     $                        -one, v, ldv, work, ldwork, one, c, ldc )
               END IF
*
*              W := W * V2**T
*
               CALL dtrmm( 'Right', 'Upper', 'Transpose', 'Unit', n, k,
     $                     one, v( m-k+1, 1 ), ldv, work, ldwork )
*
*              C2 := C2 - W**T
*
               DO 90 j = 1, k
                  DO 80 i = 1, n
                     c( m-k+j, i ) = c( m-k+j, i ) - work( i, j )
   80             CONTINUE
   90          CONTINUE
*
            ELSE IF( lsame( side, 'R' ) ) THEN
*
*              Form  C * H  or  C * H**T  where  C = ( C1  C2 )
*
*              W := C * V  =  (C1*V1 + C2*V2)  (stored in WORK)
*
*              W := C2
*
               DO 100 j = 1, k
                  CALL dcopy( m, c( 1, n-k+j ), 1, work( 1, j ), 1 )
  100          CONTINUE
*
*              W := W * V2
*
               CALL dtrmm( 'Right', 'Upper', 'No transpose', 'Unit', m,
     $                     k, one, v( n-k+1, 1 ), ldv, work, ldwork )
               IF( n.GT.k ) THEN
*
*                 W := W + C1 * V1
*
                  CALL dgemm( 'No transpose', 'No transpose', m, k, n-k,
     $                        one, c, ldc, v, ldv, one, work, ldwork )
               END IF
*
*              W := W * T  or  W * T**T
*              (T is referenced as lower triangular in this branch)
*
               CALL dtrmm( 'Right', 'Lower', trans, 'Non-unit', m, k,
     $                     one, t, ldt, work, ldwork )
*
*              C := C - W * V**T
*
               IF( n.GT.k ) THEN
*
*                 C1 := C1 - W * V1**T
*
                  CALL dgemm( 'No transpose', 'Transpose', m, n-k, k,
     $                        -one, work, ldwork, v, ldv, one, c, ldc )
               END IF
*
*              W := W * V2**T
*
               CALL dtrmm( 'Right', 'Upper', 'Transpose', 'Unit', m, k,
     $                     one, v( n-k+1, 1 ), ldv, work, ldwork )
*
*              C2 := C2 - W
*
               DO 120 j = 1, k
                  DO 110 i = 1, m
                     c( i, n-k+j ) = c( i, n-k+j ) - work( i, j )
  110             CONTINUE
  120          CONTINUE
            END IF
         END IF
*
      ELSE IF( lsame( storev, 'R' ) ) THEN
*
         IF( lsame( direct, 'F' ) ) THEN
*
*           Let  V =  ( V1  V2 )    (V1: first K columns)
*           where  V1  is unit upper triangular.
*
            IF( lsame( side, 'L' ) ) THEN
*
*              Form  H * C  or  H**T * C  where  C = ( C1 )
*                                                    ( C2 )
*
*              W := C**T * V**T  =  (C1**T * V1**T + C2**T * V2**T) (stored in WORK)
*
*              W := C1**T
*
               DO 130 j = 1, k
                  CALL dcopy( n, c( j, 1 ), ldc, work( 1, j ), 1 )
  130          CONTINUE
*
*              W := W * V1**T
*
               CALL dtrmm( 'Right', 'Upper', 'Transpose', 'Unit', n, k,
     $                     one, v, ldv, work, ldwork )
               IF( m.GT.k ) THEN
*
*                 W := W + C2**T * V2**T
*
                  CALL dgemm( 'Transpose', 'Transpose', n, k, m-k, one,
     $                        c( k+1, 1 ), ldc, v( 1, k+1 ), ldv, one,
     $                        work, ldwork )
               END IF
*
*              W := W * T**T  or  W * T
*
               CALL dtrmm( 'Right', 'Upper', transt, 'Non-unit', n, k,
     $                     one, t, ldt, work, ldwork )
*
*              C := C - V**T * W**T
*
               IF( m.GT.k ) THEN
*
*                 C2 := C2 - V2**T * W**T
*
                  CALL dgemm( 'Transpose', 'Transpose', m-k, n, k, -one,
     $                        v( 1, k+1 ), ldv, work, ldwork, one,
     $                        c( k+1, 1 ), ldc )
               END IF
*
*              W := W * V1
*
               CALL dtrmm( 'Right', 'Upper', 'No transpose', 'Unit', n,
     $                     k, one, v, ldv, work, ldwork )
*
*              C1 := C1 - W**T
*
               DO 150 j = 1, k
                  DO 140 i = 1, n
                     c( j, i ) = c( j, i ) - work( i, j )
  140             CONTINUE
  150          CONTINUE
*
            ELSE IF( lsame( side, 'R' ) ) THEN
*
*              Form  C * H  or  C * H**T  where  C = ( C1  C2 )
*
*              W := C * V**T  =  (C1*V1**T + C2*V2**T)  (stored in WORK)
*
*              W := C1
*
               DO 160 j = 1, k
                  CALL dcopy( m, c( 1, j ), 1, work( 1, j ), 1 )
  160          CONTINUE
*
*              W := W * V1**T
*
               CALL dtrmm( 'Right', 'Upper', 'Transpose', 'Unit', m, k,
     $                     one, v, ldv, work, ldwork )
               IF( n.GT.k ) THEN
*
*                 W := W + C2 * V2**T
*
                  CALL dgemm( 'No transpose', 'Transpose', m, k, n-k,
     $                        one, c( 1, k+1 ), ldc, v( 1, k+1 ), ldv,
     $                        one, work, ldwork )
               END IF
*
*              W := W * T  or  W * T**T
*
               CALL dtrmm( 'Right', 'Upper', trans, 'Non-unit', m, k,
     $                     one, t, ldt, work, ldwork )
*
*              C := C - W * V
*
               IF( n.GT.k ) THEN
*
*                 C2 := C2 - W * V2
*
                  CALL dgemm( 'No transpose', 'No transpose', m, n-k, k,
     $                        -one, work, ldwork, v( 1, k+1 ), ldv, one,
     $                        c( 1, k+1 ), ldc )
               END IF
*
*              W := W * V1
*
               CALL dtrmm( 'Right', 'Upper', 'No transpose', 'Unit', m,
     $                     k, one, v, ldv, work, ldwork )
*
*              C1 := C1 - W
*
               DO 180 j = 1, k
                  DO 170 i = 1, m
                     c( i, j ) = c( i, j ) - work( i, j )
  170             CONTINUE
  180          CONTINUE
*
            END IF
*
         ELSE
*
*           (Reached for any DIRECT that does not match 'F'.)
*
*           Let  V =  ( V1  V2 )    (V2: last K columns)
*           where  V2  is unit lower triangular.
*
            IF( lsame( side, 'L' ) ) THEN
*
*              Form  H * C  or  H**T * C  where  C = ( C1 )
*                                                    ( C2 )
*
*              W := C**T * V**T  =  (C1**T * V1**T + C2**T * V2**T) (stored in WORK)
*
*              W := C2**T
*
               DO 190 j = 1, k
                  CALL dcopy( n, c( m-k+j, 1 ), ldc, work( 1, j ), 1 )
  190          CONTINUE
*
*              W := W * V2**T
*
               CALL dtrmm( 'Right', 'Lower', 'Transpose', 'Unit', n, k,
     $                     one, v( 1, m-k+1 ), ldv, work, ldwork )
               IF( m.GT.k ) THEN
*
*                 W := W + C1**T * V1**T
*
                  CALL dgemm( 'Transpose', 'Transpose', n, k, m-k, one,
     $                        c, ldc, v, ldv, one, work, ldwork )
               END IF
*
*              W := W * T**T  or  W * T
*              (T is referenced as lower triangular in this branch)
*
               CALL dtrmm( 'Right', 'Lower', transt, 'Non-unit', n, k,
     $                     one, t, ldt, work, ldwork )
*
*              C := C - V**T * W**T
*
               IF( m.GT.k ) THEN
*
*                 C1 := C1 - V1**T * W**T
*
                  CALL dgemm( 'Transpose', 'Transpose', m-k, n, k, -one,
     $                        v, ldv, work, ldwork, one, c, ldc )
               END IF
*
*              W := W * V2
*
               CALL dtrmm( 'Right', 'Lower', 'No transpose', 'Unit', n,
     $                     k, one, v( 1, m-k+1 ), ldv, work, ldwork )
*
*              C2 := C2 - W**T
*
               DO 210 j = 1, k
                  DO 200 i = 1, n
                     c( m-k+j, i ) = c( m-k+j, i ) - work( i, j )
  200             CONTINUE
  210          CONTINUE
*
            ELSE IF( lsame( side, 'R' ) ) THEN
*
*              Form  C * H  or  C * H**T  where  C = ( C1  C2 )
*
*              W := C * V**T  =  (C1*V1**T + C2*V2**T)  (stored in WORK)
*
*              W := C2
*
               DO 220 j = 1, k
                  CALL dcopy( m, c( 1, n-k+j ), 1, work( 1, j ), 1 )
  220          CONTINUE
*
*              W := W * V2**T
*
               CALL dtrmm( 'Right', 'Lower', 'Transpose', 'Unit', m, k,
     $                     one, v( 1, n-k+1 ), ldv, work, ldwork )
               IF( n.GT.k ) THEN
*
*                 W := W + C1 * V1**T
*
                  CALL dgemm( 'No transpose', 'Transpose', m, k, n-k,
     $                        one, c, ldc, v, ldv, one, work, ldwork )
               END IF
*
*              W := W * T  or  W * T**T
*              (T is referenced as lower triangular in this branch)
*
               CALL dtrmm( 'Right', 'Lower', trans, 'Non-unit', m, k,
     $                     one, t, ldt, work, ldwork )
*
*              C := C - W * V
*
               IF( n.GT.k ) THEN
*
*                 C1 := C1 - W * V1
*
                  CALL dgemm( 'No transpose', 'No transpose', m, n-k, k,
     $                        -one, work, ldwork, v, ldv, one, c, ldc )
               END IF
*
*              W := W * V2
*
               CALL dtrmm( 'Right', 'Lower', 'No transpose', 'Unit', m,
     $                     k, one, v( 1, n-k+1 ), ldv, work, ldwork )
*
*              C2 := C2 - W
*              (the loop below updates columns n-k+1 .. n of C)
*
               DO 240 j = 1, k
                  DO 230 i = 1, m
                     c( i, n-k+j ) = c( i, n-k+j ) - work( i, j )
  230             CONTINUE
  240          CONTINUE
*
            END IF
*
         END IF
      END IF
*
*     If STOREV matches neither 'C' nor 'R', or SIDE matches neither
*     'L' nor 'R', no branch above is taken and C is left unchanged.
*
      RETURN
*
*     End of DLARFB
*

◆ dlarfb_gett()

subroutine dlarfb_gett	(	character	ident,
		integer	m,
		integer	n,
		integer	k,
		double precision, dimension( ldt, * )	t,
		integer	ldt,
		double precision, dimension( lda, * )	a,
		integer	lda,
		double precision, dimension( ldb, * )	b,
		integer	ldb,
		double precision, dimension( ldwork, * )	work,
		integer	ldwork )

DLARFB_GETT

Download DLARFB_GETT + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLARFB_GETT applies a real Householder block reflector H from the
!> left to a real (K+M)-by-N   matrix
!> composed of two block matrices: an upper trapezoidal K-by-N matrix A
!> stored in the array A, and a rectangular M-by-(N-K) matrix B, stored
!> in the array B. The block reflector H is stored in a compact
!> WY-representation, where the elementary reflectors are in the
!> arrays A, B and T. See Further Details section.
!>

Parameters

[in]	IDENT	!> IDENT is CHARACTER*1 !> If IDENT is neither 'I' nor 'i', then V1 is unit !> lower-triangular and stored in the left K-by-K block of !> the input matrix A. !> If IDENT = 'I' or 'i', then V1 is an identity matrix and !> not stored. !> See Further Details section. !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix B. !> M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrices A and B. !> N >= 0. !>
[in]	K	!> K is INTEGER !> The number of rows of the matrix A. !> K is also the order of the matrix T, i.e. the number of !> elementary reflectors whose product defines the block !> reflector. 0 <= K <= N. !>
[in]	T	!> T is DOUBLE PRECISION array, dimension (LDT,K) !> The upper-triangular K-by-K matrix T in the representation !> of the block reflector. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= K. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> !> On entry: !> a) In the K-by-N upper-trapezoidal part A: input matrix A. !> b) In the columns below the diagonal: columns of V1 !> (ones are not stored on the diagonal). !> !> On exit: !> A is overwritten by rectangular K-by-N product H*A. !> !> See Further Details section. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,K). !>
[in,out]	B	!> B is DOUBLE PRECISION array, dimension (LDB,N) !> !> On entry: !> a) In the M-by-(N-K) right block: input matrix B. !> b) In the M-by-K left block: columns of V2. !> !> On exit: !> B is overwritten by rectangular M-by-N product H*B. !> !> See Further Details section. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. LDB >= max(1,M). !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, !> dimension (LDWORK,max(K,N-K)) !>
[in]	LDWORK	!> LDWORK is INTEGER !> The leading dimension of the array WORK. LDWORK>=max(1,K). !> !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors:

!>
!> November 2020, Igor Kozachenko,
!>                Computer Science Division,
!>                University of California, Berkeley
!>
!>

Further Details:

!>
!>    (1) Description of the Algebraic Operation.
!>
!>    The matrix A is a K-by-N matrix composed of two column block
!>    matrices, A1, which is K-by-K, and A2, which is K-by-(N-K):
!>    A = ( A1, A2 ).
!>    The matrix B is an M-by-N matrix composed of two column block
!>    matrices, B1, which is M-by-K, and B2, which is M-by-(N-K):
!>    B = ( B1, B2 ).
!>
!>    Perform the operation:
!>
!>       ( A_out ) := H * ( A_in ) = ( I - V * T * V**T ) * ( A_in ) =
!>       ( B_out )        ( B_in )                          ( B_in )
!>                  = ( I - ( V1 ) * T * ( V1**T, V2**T ) ) * ( A_in )
!>                          ( V2 )                            ( B_in )
!>     On input:
!>
!>    a) ( A_in )  consists of two block columns:
!>       ( B_in )
!>
!>       ( A_in ) = (( A1_in ) ( A2_in )) = (( A1_in ) ( A2_in ))
!>       ( B_in )   (( B1_in ) ( B2_in ))   ((     0 ) ( B2_in )),
!>
!>       where the column blocks are:
!>
!>       (  A1_in )  is a K-by-K upper-triangular matrix stored in the
!>                   upper triangular part of the array A(1:K,1:K).
!>       (  B1_in )  is an M-by-K rectangular ZERO matrix and not stored.
!>
!>       ( A2_in )  is a K-by-(N-K) rectangular matrix stored
!>                  in the array A(1:K,K+1:N).
!>       ( B2_in )  is an M-by-(N-K) rectangular matrix stored
!>                  in the array B(1:M,K+1:N).
!>
!>    b) V = ( V1 )
!>           ( V2 )
!>
!>       where:
!>       1) if IDENT == 'I',V1 is a K-by-K identity matrix, not stored;
!>       2) if IDENT != 'I',V1 is a K-by-K unit lower-triangular matrix,
!>          stored in the lower-triangular part of the array
!>          A(1:K,1:K) (ones are not stored),
!>       and V2 is an M-by-K rectangular matrix stored in the array B(1:M,1:K),
!>                 (because on input B1_in is a rectangular zero
!>                  matrix that is not stored and the space is
!>                  used to store V2).
!>
!>    c) T is a K-by-K upper-triangular matrix stored
!>       in the array T(1:K,1:K).
!>
!>    On output:
!>
!>    a) ( A_out ) consists of two  block columns:
!>       ( B_out )
!>
!>       ( A_out ) = (( A1_out ) ( A2_out ))
!>       ( B_out )   (( B1_out ) ( B2_out )),
!>
!>       where the column blocks are:
!>
!>       ( A1_out )  is a K-by-K square matrix, or a K-by-K
!>                   upper-triangular matrix, if V1 is an
!>                   identity matrix. A1_out is stored in
!>                   the array A(1:K,1:K).
!>       ( B1_out )  is an M-by-K rectangular matrix stored
!>                   in the array B(1:M,1:K).
!>
!>       ( A2_out )  is a K-by-(N-K) rectangular matrix stored
!>                   in the array A(1:K,K+1:N).
!>       ( B2_out )  is an M-by-(N-K) rectangular matrix stored
!>                   in the array B(1:M,K+1:N).
!>
!>
!>    The operation above can be represented as the same operation
!>    on each block column:
!>
!>       ( A1_out ) := H * ( A1_in ) = ( I - V * T * V**T ) * ( A1_in )
!>       ( B1_out )        (     0 )                          (     0 )
!>
!>       ( A2_out ) := H * ( A2_in ) = ( I - V * T * V**T ) * ( A2_in )
!>       ( B2_out )        ( B2_in )                          ( B2_in )
!>
!>    If IDENT != 'I':
!>
!>       The computation for column block 1:
!>
!>       A1_out: = A1_in - V1*T*(V1**T)*A1_in
!>
!>       B1_out: = - V2*T*(V1**T)*A1_in
!>
!>       The computation for column block 2, which exists if N > K:
!>
!>       A2_out: = A2_in - V1*T*( (V1**T)*A2_in + (V2**T)*B2_in )
!>
!>       B2_out: = B2_in - V2*T*( (V1**T)*A2_in + (V2**T)*B2_in )
!>
!>    If IDENT == 'I':
!>
!>       The operation for column block 1:
!>
!>       A1_out: = A1_in - V1*T*A1_in
!>
!>       B1_out: = - V2*T*A1_in
!>
!>       The computation for column block 2, which exists if N > K:
!>
!>       A2_out: = A2_in - T*( A2_in + (V2**T)*B2_in )
!>
!>       B2_out: = B2_in - V2*T*( A2_in + (V2**T)*B2_in )
!>
!>    (2) Description of the Algorithmic Computation.
!>
!>    In the first step, we compute column block 2, i.e. A2 and B2.
!>    Here, we need to use the K-by-(N-K) rectangular workspace
!>    matrix W2 that is of the same size as the matrix A2.
!>    W2 is stored in the array WORK(1:K,1:(N-K)).
!>
!>    In the second step, we compute column block 1, i.e. A1 and B1.
!>    Here, we need to use the K-by-K square workspace matrix W1
!>    that is of the same size as the matrix A1.
!>    W1 is stored in the array WORK(1:K,1:K).
!>
!>    NOTE: Hence, in this routine, we need the workspace array WORK
!>    only of size WORK(1:K,1:max(K,N-K)) so it can hold both W2 from
!>    the first step and W1 from the second step.
!>
!>    Case (A), when V1 is unit lower-triangular, i.e. IDENT != 'I',
!>    more computations than in the Case (B).
!>
!>    if( IDENT != 'I' ) then
!>     if ( N > K ) then
!>       (First Step - column block 2)
!>       col2_(1) W2: = A2
!>       col2_(2) W2: = (V1**T) * W2 = (unit_lower_tr_of_(A1)**T) * W2
!>       col2_(3) W2: = W2 + (V2**T) * B2 = W2 + (B1**T) * B2
!>       col2_(4) W2: = T * W2
!>       col2_(5) B2: = B2 - V2 * W2 = B2 - B1 * W2
!>       col2_(6) W2: = V1 * W2 = unit_lower_tr_of_(A1) * W2
!>       col2_(7) A2: = A2 - W2
!>     end if
!>     (Second Step - column block 1, performed for any N >= K)
!>     col1_(1) W1: = A1
!>     col1_(2) W1: = (V1**T) * W1 = (unit_lower_tr_of_(A1)**T) * W1
!>     col1_(3) W1: = T * W1
!>     col1_(4) B1: = - V2 * W1 = - B1 * W1
!>     col1_(5) square W1: = V1 * W1 = unit_lower_tr_of_(A1) * W1
!>     col1_(6) square A1: = A1 - W1
!>    end if
!>
!>    Case (B), when V1 is an identity matrix, i.e. IDENT == 'I',
!>    less computations than in the Case (A)
!>
!>    if( IDENT == 'I' ) then
!>     if ( N > K ) then
!>       (First Step - column block 2)
!>       col2_(1) W2: = A2
!>       col2_(3) W2: = W2 + (V2**T) * B2 = W2 + (B1**T) * B2
!>       col2_(4) W2: = T * W2
!>       col2_(5) B2: = B2 - V2 * W2 = B2 - B1 * W2
!>       col2_(7) A2: = A2 - W2
!>     end if
!>     (Second Step - column block 1, performed for any N >= K)
!>     col1_(1) W1: = A1
!>     col1_(3) W1: = T * W1
!>     col1_(4) B1: = - V2 * W1 = - B1 * W1
!>     col1_(6) upper-triangular_of_(A1): = A1 - W1
!>    end if
!>
!>    Combine these cases (A) and (B) together, this is the resulting
!>    algorithm:
!>
!>    if ( N > K ) then
!>
!>      (First Step - column block 2)
!>
!>      col2_(1)  W2: = A2
!>      if( IDENT != 'I' ) then
!>        col2_(2)  W2: = (V1**T) * W2
!>                      = (unit_lower_tr_of_(A1)**T) * W2
!>      end if
!>      col2_(3)  W2: = W2 + (V2**T) * B2 = W2 + (B1**T) * B2
!>      col2_(4)  W2: = T * W2
!>      col2_(5)  B2: = B2 - V2 * W2 = B2 - B1 * W2
!>      if( IDENT != 'I' ) then
!>        col2_(6)    W2: = V1 * W2 = unit_lower_tr_of_(A1) * W2
!>      end if
!>      col2_(7) A2: = A2 - W2
!>
!>    end if
!>
!>    (Second Step - column block 1, performed for any N >= K)
!>
!>    col1_(1) W1: = A1
!>    if( IDENT != 'I' ) then
!>      col1_(2) W1: = (V1**T) * W1
!>                  = (unit_lower_tr_of_(A1)**T) * W1
!>    end if
!>    col1_(3) W1: = T * W1
!>    col1_(4) B1: = - V2 * W1 = - B1 * W1
!>    if( IDENT != 'I' ) then
!>      col1_(5) square W1: = V1 * W1 = unit_lower_tr_of_(A1) * W1
!>      col1_(6_a) below_diag_of_(A1): =  - below_diag_of_(W1)
!>    end if
!>    col1_(6_b) up_tr_of_(A1): = up_tr_of_(A1) - up_tr_of_(W1)
!>
!>

Definition at line 390 of file dlarfb_gett.f.

      IMPLICIT NONE
*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          IDENT
      INTEGER            K, LDA, LDB, LDT, LDWORK, M, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * ), B( LDB, * ), T( LDT, * ),
     $                   WORK( LDWORK, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, ZERO
      parameter( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            LNOTIDENT
      INTEGER            I, J
*     ..
*     .. EXTERNAL FUNCTIONS ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dgemm, dtrmm
*     ..
*     .. Executable Statements ..
*
*     Quick return if possible
*
      IF( m.LT.0 .OR. n.LE.0 .OR. k.EQ.0 .OR. k.GT.n )
     $   RETURN
*
      lnotident = .NOT.lsame( ident, 'I' )
*
*     ------------------------------------------------------------------
*
*     First Step. Computation of the Column Block 2:
*
*        ( A2 ) := H * ( A2 )
*        ( B2 )        ( B2 )
*
*     ------------------------------------------------------------------
*
      IF( n.GT.k ) THEN
*
*        col2_(1) Compute W2: = A2. Therefore, copy A2 = A(1:K, K+1:N)
*        into W2=WORK(1:K, 1:N-K) column-by-column.
*
         DO j = 1, n-k
            CALL dcopy( k, a( 1, k+j ), 1, work( 1, j ), 1 )
         END DO
 
         IF( lnotident ) THEN
*
*           col2_(2) Compute W2: = (V1**T) * W2 = (A1**T) * W2,
*           V1 is not an identy matrix, but unit lower-triangular
*           V1 stored in A1 (diagonal ones are not stored).
*
*
            CALL dtrmm( 'L', 'L', 'T', 'U', k, n-k, one, a, lda,
     $                  work, ldwork )
         END IF
*
*        col2_(3) Compute W2: = W2 + (V2**T) * B2 = W2 + (B1**T) * B2
*        V2 stored in B1.
*
         IF( m.GT.0 ) THEN
            CALL dgemm( 'T', 'N', k, n-k, m, one, b, ldb,
     $                  b( 1, k+1 ), ldb, one, work, ldwork )
         END IF
*
*        col2_(4) Compute W2: = T * W2,
*        T is upper-triangular.
*
         CALL dtrmm( 'L', 'U', 'N', 'N', k, n-k, one, t, ldt,
     $               work, ldwork )
*
*        col2_(5) Compute B2: = B2 - V2 * W2 = B2 - B1 * W2,
*        V2 stored in B1.
*
         IF( m.GT.0 ) THEN
            CALL dgemm( 'N', 'N', m, n-k, k, -one, b, ldb,
     $                   work, ldwork, one, b( 1, k+1 ), ldb )
         END IF
*
         IF( lnotident ) THEN
*
*           col2_(6) Compute W2: = V1 * W2 = A1 * W2,
*           V1 is not an identity matrix, but unit lower-triangular,
*           V1 stored in A1 (diagonal ones are not stored).
*
            CALL dtrmm( 'L', 'L', 'N', 'U', k, n-k, one, a, lda,
     $                  work, ldwork )
         END IF
*
*        col2_(7) Compute A2: = A2 - W2 =
*                             = A(1:K, K+1:N) - WORK(1:K, 1:N-K),
*        column-by-column.
*
         DO j = 1, n-k
            DO i = 1, k
               a( i, k+j ) = a( i, k+j ) - work( i, j )
            END DO
         END DO
*
      END IF
*
*     ------------------------------------------------------------------
*
*     Second Step. Computation of the Column Block 1:
*
*        ( A1 ) := H * ( A1 )
*        ( B1 )        (  0 )
*
*     ------------------------------------------------------------------
*
*     col1_(1) Compute W1: = A1. Copy the upper-triangular
*     A1 = A(1:K, 1:K) into the upper-triangular
*     W1 = WORK(1:K, 1:K) column-by-column.
*
      DO j = 1, k
         CALL dcopy( j, a( 1, j ), 1, work( 1, j ), 1 )
      END DO
*
*     Set the subdiagonal elements of W1 to zero column-by-column.
*
      DO j = 1, k - 1
         DO i = j + 1, k
            work( i, j ) = zero
         END DO
      END DO
*
      IF( lnotident ) THEN
*
*        col1_(2) Compute W1: = (V1**T) * W1 = (A1**T) * W1,
*        V1 is not an identity matrix, but unit lower-triangular
*        V1 stored in A1 (diagonal ones are not stored),
*        W1 is upper-triangular with zeroes below the diagonal.
*
         CALL dtrmm( 'L', 'L', 'T', 'U', k, k, one, a, lda,
     $               work, ldwork )
      END IF
*
*     col1_(3) Compute W1: = T * W1,
*     T is upper-triangular,
*     W1 is upper-triangular with zeroes below the diagonal.
*
      CALL dtrmm( 'L', 'U', 'N', 'N', k, k, one, t, ldt,
     $            work, ldwork )
*
*     col1_(4) Compute B1: = - V2 * W1 = - B1 * W1,
*     V2 = B1, W1 is upper-triangular with zeroes below the diagonal.
*
      IF( m.GT.0 ) THEN
         CALL dtrmm( 'R', 'U', 'N', 'N', m, k, -one, work, ldwork,
     $               b, ldb )
      END IF
*
      IF( lnotident ) THEN
*
*        col1_(5) Compute W1: = V1 * W1 = A1 * W1,
*        V1 is not an identity matrix, but unit lower-triangular
*        V1 stored in A1 (diagonal ones are not stored),
*        W1 is upper-triangular on input with zeroes below the diagonal,
*        and square on output.
*
         CALL dtrmm( 'L', 'L', 'N', 'U', k, k, one, a, lda,
     $               work, ldwork )
*
*        col1_(6) Compute A1: = A1 - W1 = A(1:K, 1:K) - WORK(1:K, 1:K)
*        column-by-column. A1 is upper-triangular on input.
*        If NOT IDENT, A1 is square on output, and W1 is square,
*        if IDENT, A1 is upper-triangular on output,
*        W1 is upper-triangular.
*
*        col1_(6)_a Compute elements of A1 below the diagonal.
*
         DO j = 1, k - 1
            DO i = j + 1, k
               a( i, j ) = - work( i, j )
            END DO
         END DO
*
      END IF
*
*     col1_(6)_b Compute elements of A1 on and above the diagonal.
*
      DO j = 1, k
         DO i = 1, j
            a( i, j ) = a( i, j ) - work( i, j )
         END DO
      END DO
*
      RETURN
*
*     End of DLARFB_GETT
*

◆ dlarfg()

subroutine dlarfg	(	integer	n,
		double precision	alpha,
		double precision, dimension( * )	x,
		integer	incx,
		double precision	tau )

DLARFG generates an elementary reflector (Householder matrix).

Download DLARFG + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLARFG generates a real elementary reflector H of order n, such
!> that
!>
!>       H * ( alpha ) = ( beta ),   H**T * H = I.
!>           (   x   )   (   0  )
!>
!> where alpha and beta are scalars, and x is an (n-1)-element real
!> vector. H is represented in the form
!>
!>       H = I - tau * ( 1 ) * ( 1 v**T ) ,
!>                     ( v )
!>
!> where tau is a real scalar and v is a real (n-1)-element
!> vector.
!>
!> If the elements of x are all zero, then tau = 0 and H is taken to be
!> the unit matrix.
!>
!> Otherwise  1 <= tau <= 2.
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the elementary reflector. !>
[in,out]	ALPHA	!> ALPHA is DOUBLE PRECISION !> On entry, the value alpha. !> On exit, it is overwritten with the value beta. !>
[in,out]	X	!> X is DOUBLE PRECISION array, dimension !> (1+(N-2)*abs(INCX)) !> On entry, the vector x. !> On exit, it is overwritten with the vector v. !>
[in]	INCX	!> INCX is INTEGER !> The increment between elements of X. INCX > 0. !>
[out]	TAU	!> TAU is DOUBLE PRECISION !> The value tau. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 105 of file dlarfg.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            INCX, N
      DOUBLE PRECISION   ALPHA, TAU
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   X( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, ZERO
      parameter( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            ISTEP, NSCALE
      DOUBLE PRECISION   BETA, GROW, THRESH, VNORM
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH, DLAPY2, DNRM2
      EXTERNAL           dlamch, dlapy2, dnrm2
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, sign
*     ..
*     .. External Subroutines ..
      EXTERNAL           dscal
*     ..
*     .. Executable Statements ..
*
*     For N <= 1 only TAU is set; ALPHA and X are not touched.
*
      IF( n.LE.1 ) THEN
         tau = zero
         RETURN
      END IF
*
*     Norm of the N-1 elements of X.
*
      vnorm = dnrm2( n-1, x, incx )
*
*     X has zero norm:  H  =  I.  ALPHA and X are not touched.
*
      IF( vnorm.EQ.zero ) THEN
         tau = zero
         RETURN
      END IF
*
*     General case. BETA is given the sign opposite to ALPHA.
*
      beta = -sign( dlapy2( alpha, vnorm ), alpha )
      thresh = dlamch( 'S' ) / dlamch( 'E' )
      nscale = 0
      IF( abs( beta ).LT.thresh ) THEN
*
*        VNORM, BETA may be inaccurate. Scale X, BETA and ALPHA by
*        GROW = 1/THRESH, repeating while abs(BETA) is still below
*        THRESH and fewer than 20 scalings have been done.
*
         grow = one / thresh
         DO
            nscale = nscale + 1
            CALL dscal( n-1, grow, x, incx )
            beta = beta*grow
            alpha = alpha*grow
            IF( .NOT.( abs( beta ).LT.thresh ) ) EXIT
            IF( nscale.GE.20 ) EXIT
         END DO
*
*        Recompute VNORM and BETA from the scaled data.
*
         vnorm = dnrm2( n-1, x, incx )
         beta = -sign( dlapy2( alpha, vnorm ), alpha )
      END IF
*
*     Form TAU and scale X by 1/(ALPHA-BETA) to obtain v.
*
      tau = ( beta-alpha ) / beta
      CALL dscal( n-1, one / ( alpha-beta ), x, incx )
*
*     Undo the scaling of BETA, one multiplication by THRESH per
*     scaling step performed above, and return BETA in ALPHA.
*
      DO istep = 1, nscale
         beta = beta*thresh
      END DO
      alpha = beta
*
      RETURN
*
*     End of DLARFG
*

◆ dlarfgp()

subroutine dlarfgp	(	integer	n,
		double precision	alpha,
		double precision, dimension( * )	x,
		integer	incx,
		double precision	tau )

DLARFGP generates an elementary reflector (Householder matrix) with non-negative beta.

Download DLARFGP + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLARFGP generates a real elementary reflector H of order n, such
!> that
!>
!>       H * ( alpha ) = ( beta ),   H**T * H = I.
!>           (   x   )   (   0  )
!>
!> where alpha and beta are scalars, beta is non-negative, and x is
!> an (n-1)-element real vector.  H is represented in the form
!>
!>       H = I - tau * ( 1 ) * ( 1 v**T ) ,
!>                     ( v )
!>
!> where tau is a real scalar and v is a real (n-1)-element
!> vector.
!>
!> If the elements of x are all zero, then tau = 0 and H is taken to be
!> the unit matrix.
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the elementary reflector. !>
[in,out]	ALPHA	!> ALPHA is DOUBLE PRECISION !> On entry, the value alpha. !> On exit, it is overwritten with the value beta. !>
[in,out]	X	!> X is DOUBLE PRECISION array, dimension !> (1+(N-2)*abs(INCX)) !> On entry, the vector x. !> On exit, it is overwritten with the vector v. !>
[in]	INCX	!> INCX is INTEGER !> The increment between elements of X. INCX > 0. !>
[out]	TAU	!> TAU is DOUBLE PRECISION !> The value tau. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 103 of file dlarfgp.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            INCX, N
      DOUBLE PRECISION   ALPHA, TAU
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   X( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   TWO, ONE, ZERO
      parameter( two = 2.0d+0, one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            IDX, NSCALE
      DOUBLE PRECISION   ALPHA0, BETA, GROW, THRESH, VNORM
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH, DLAPY2, DNRM2
      EXTERNAL           dlamch, dlapy2, dnrm2
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, sign
*     ..
*     .. External Subroutines ..
      EXTERNAL           dscal
*     ..
*     .. Executable Statements ..
*
*     For N <= 0 only TAU is set.
*
      IF( n.LE.0 ) THEN
         tau = zero
         RETURN
      END IF
*
*     Norm of the N-1 elements of X.
*
      vnorm = dnrm2( n-1, x, incx )
*
      IF( vnorm.EQ.zero ) THEN
*
*        H  =  [+/-1, 0; I], sign chosen so ALPHA >= 0
*
         IF( alpha.GE.zero ) THEN
*
*           With TAU = 0 the application routines treat the vector
*           as all zeros, so X does not have to be cleared.
*
            tau = zero
         ELSE
*
*           With TAU nonzero the application routines rely on
*           explicit zero checks, so X must be cleared.
*
            tau = two
            DO idx = 1, n-1
               x( 1 + (idx-1)*incx ) = zero
            END DO
            alpha = -alpha
         END IF
         RETURN
      END IF
*
*     General case. BETA is given the same sign as ALPHA here.
*
      beta = sign( dlapy2( alpha, vnorm ), alpha )
      thresh = dlamch( 'S' ) / dlamch( 'E' )
      nscale = 0
      IF( abs( beta ).LT.thresh ) THEN
*
*        VNORM, BETA may be inaccurate. Scale X, BETA and ALPHA by
*        GROW = 1/THRESH, repeating while abs(BETA) is still below
*        THRESH and fewer than 20 scalings have been done.
*
         grow = one / thresh
         DO
            nscale = nscale + 1
            CALL dscal( n-1, grow, x, incx )
            beta = beta*grow
            alpha = alpha*grow
            IF( .NOT.( abs( beta ).LT.thresh ) ) EXIT
            IF( nscale.GE.20 ) EXIT
         END DO
*
*        Recompute VNORM and BETA from the scaled data.
*
         vnorm = dnrm2( n-1, x, incx )
         beta = sign( dlapy2( alpha, vnorm ), alpha )
      END IF
*
*     Keep the (possibly scaled) ALPHA; ALPHA is reused below as the
*     divisor that turns X into v.
*
      alpha0 = alpha
      alpha = alpha + beta
      IF( beta.LT.zero ) THEN
         beta = -beta
         tau = -alpha / beta
      ELSE
         alpha = vnorm * ( vnorm/alpha )
         tau = alpha / beta
         alpha = -alpha
      END IF
*
      IF( abs( tau ).LE.thresh ) THEN
*
*        A computed TAU that ends up denormalized loses relative
*        accuracy, so it is not used: TAU is set to ZERO, or to TWO
*        with X cleared when the saved ALPHA is negative.
*
*        (Bug report provided by Pat Quillen from MathWorks on
*        Jul 29, 2009.)
*
         IF( alpha0.GE.zero ) THEN
            tau = zero
         ELSE
            tau = two
            DO idx = 1, n-1
               x( 1 + (idx-1)*incx ) = zero
            END DO
            beta = -alpha0
         END IF
*
      ELSE
*
*        This is the general case: scale X by 1/ALPHA to obtain v.
*
         CALL dscal( n-1, one / alpha, x, incx )
*
      END IF
*
*     Undo the scaling of BETA, one multiplication by THRESH per
*     scaling step performed above, and return BETA in ALPHA.
*
      DO idx = 1, nscale
         beta = beta*thresh
      END DO
      alpha = beta
*
      RETURN
*
*     End of DLARFGP
*

◆ dlarft()

subroutine dlarft	(	character	direct,
		character	storev,
		integer	n,
		integer	k,
		double precision, dimension( ldv, * )	v,
		integer	ldv,
		double precision, dimension( * )	tau,
		double precision, dimension( ldt, * )	t,
		integer	ldt )

DLARFT forms the triangular factor T of a block reflector H = I - V * T * V**T

Download DLARFT + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLARFT forms the triangular factor T of a real block reflector H
!> of order n, which is defined as a product of k elementary reflectors.
!>
!> If DIRECT = 'F', H = H(1) H(2) . . . H(k) and T is upper triangular;
!>
!> If DIRECT = 'B', H = H(k) . . . H(2) H(1) and T is lower triangular.
!>
!> If STOREV = 'C', the vector which defines the elementary reflector
!> H(i) is stored in the i-th column of the array V, and
!>
!>    H  =  I - V * T * V**T
!>
!> If STOREV = 'R', the vector which defines the elementary reflector
!> H(i) is stored in the i-th row of the array V, and
!>
!>    H  =  I - V**T * T * V
!>

Parameters

[in]	DIRECT	!> DIRECT is CHARACTER*1 !> Specifies the order in which the elementary reflectors are !> multiplied to form the block reflector: !> = 'F': H = H(1) H(2) . . . H(k) (Forward) !> = 'B': H = H(k) . . . H(2) H(1) (Backward) !>
[in]	STOREV	!> STOREV is CHARACTER*1 !> Specifies how the vectors which define the elementary !> reflectors are stored (see also Further Details): !> = 'C': columnwise !> = 'R': rowwise !>
[in]	N	!> N is INTEGER !> The order of the block reflector H. N >= 0. !>
[in]	K	!> K is INTEGER !> The order of the triangular factor T (= the number of !> elementary reflectors). K >= 1. !>
[in]	V	!> V is DOUBLE PRECISION array, dimension !> (LDV,K) if STOREV = 'C' !> (LDV,N) if STOREV = 'R' !> The matrix V. See further details. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of the array V. !> If STOREV = 'C', LDV >= max(1,N); if STOREV = 'R', LDV >= K. !>
[in]	TAU	!> TAU is DOUBLE PRECISION array, dimension (K) !> TAU(i) must contain the scalar factor of the elementary !> reflector H(i). !>
[out]	T	!> T is DOUBLE PRECISION array, dimension (LDT,K) !> The k by k triangular factor T of the block reflector. !> If DIRECT = 'F', T is upper triangular; if DIRECT = 'B', T is !> lower triangular. The rest of the array is not used. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. LDT >= K. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The shape of the matrix V and the storage of the vectors which define
!>  the H(i) is best illustrated by the following example with n = 5 and
!>  k = 3. The elements equal to 1 are not stored.
!>
!>  DIRECT = 'F' and STOREV = 'C':         DIRECT = 'F' and STOREV = 'R':
!>
!>               V = (  1       )                 V = (  1 v1 v1 v1 v1 )
!>                   ( v1  1    )                     (     1 v2 v2 v2 )
!>                   ( v1 v2  1 )                     (        1 v3 v3 )
!>                   ( v1 v2 v3 )
!>                   ( v1 v2 v3 )
!>
!>  DIRECT = 'B' and STOREV = 'C':         DIRECT = 'B' and STOREV = 'R':
!>
!>               V = ( v1 v2 v3 )                 V = ( v1 v1  1       )
!>                   ( v1 v2 v3 )                     ( v2 v2 v2  1    )
!>                   (  1 v2 v3 )                     ( v3 v3 v3 v3  1 )
!>                   (     1 v3 )
!>                   (        1 )
!>

Definition at line 162 of file dlarft.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          DIRECT, STOREV
      INTEGER            K, LDT, LDV, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   T( LDT, * ), TAU( * ), V( LDV, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, ZERO
      parameter( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            COLWISE, FORWRD
      INTEGER            I, IEDGE, JJ, JLIM, PEDGE
*     ..
*     .. External Subroutines ..
      EXTERNAL           dgemv, dtrmv
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. Executable Statements ..
*
*     Quick return if possible
*
      IF( n.EQ.0 ) RETURN
*
*     Decode the two option characters once.
*
      forwrd = lsame( direct, 'F' )
      colwise = lsame( storev, 'C' )
*
      IF( forwrd ) THEN
*
*        Forward direction: columns of T are built for i = 1, ..., K.
*        PEDGE carries the scan result of the previous columns.
*
         pedge = n
         DO i = 1, k
            pedge = max( i, pedge )
            IF( tau( i ).EQ.zero ) THEN
*
*              H(i)  =  I: set T(1:i,i) to zero and go to the next i.
*
               DO jj = 1, i
                  t( jj, i ) = zero
               END DO
               CYCLE
            END IF
*
*           general case
*
            IF( colwise ) THEN
*
*              Skip any trailing zeros: scan column i of V upwards
*              from row N; IEDGE stops at the first nonzero entry,
*              or at i if none is found.
*
               iedge = n
               DO WHILE( iedge.GT.i )
                  IF( v( iedge, i ).NE.zero ) EXIT
                  iedge = iedge - 1
               END DO
               DO jj = 1, i-1
                  t( jj, i ) = -tau( i ) * v( i, jj )
               END DO
               jlim = min( iedge, pedge )
*
*              T(1:i-1,i) := T(1:i-1,i)
*                 - tau(i) * V(i+1:jlim,1:i-1)**T * V(i+1:jlim,i)
*
               CALL dgemv( 'Transpose', jlim-i, i-1, -tau( i ),
     $                     v( i+1, 1 ), ldv, v( i+1, i ), 1, one,
     $                     t( 1, i ), 1 )
            ELSE
*
*              Skip any trailing zeros: scan row i of V backwards
*              from column N; IEDGE stops at the first nonzero
*              entry, or at i if none is found.
*
               iedge = n
               DO WHILE( iedge.GT.i )
                  IF( v( i, iedge ).NE.zero ) EXIT
                  iedge = iedge - 1
               END DO
               DO jj = 1, i-1
                  t( jj, i ) = -tau( i ) * v( jj, i )
               END DO
               jlim = min( iedge, pedge )
*
*              T(1:i-1,i) := T(1:i-1,i)
*                 - tau(i) * V(1:i-1,i+1:jlim) * V(i,i+1:jlim)**T
*
               CALL dgemv( 'No transpose', i-1, jlim-i, -tau( i ),
     $                     v( 1, i+1 ), ldv, v( i, i+1 ), ldv, one,
     $                     t( 1, i ), 1 )
            END IF
*
*           T(1:i-1,i) := T(1:i-1,1:i-1) * T(1:i-1,i)
*
            CALL dtrmv( 'Upper', 'No transpose', 'Non-unit', i-1, t,
     $                  ldt, t( 1, i ), 1 )
            t( i, i ) = tau( i )
            IF( i.LE.1 ) THEN
               pedge = iedge
            ELSE
               pedge = max( pedge, iedge )
            END IF
         END DO
      ELSE
*
*        Backward direction: columns of T are built for i = K, ..., 1.
*
         pedge = 1
         DO i = k, 1, -1
            IF( tau( i ).EQ.zero ) THEN
*
*              H(i)  =  I: set T(i:k,i) to zero and go to the next i.
*
               DO jj = i, k
                  t( jj, i ) = zero
               END DO
               CYCLE
            END IF
*
*           general case
*
            IF( i.LT.k ) THEN
               IF( colwise ) THEN
*
*                 Skip any leading zeros: scan column i of V over
*                 rows 1 to i-1; IEDGE stops at the first nonzero
*                 entry, or at i if none is found.
*
                  iedge = 1
                  DO WHILE( iedge.LT.i )
                     IF( v( iedge, i ).NE.zero ) EXIT
                     iedge = iedge + 1
                  END DO
                  DO jj = i+1, k
                     t( jj, i ) = -tau( i ) * v( n-k+i, jj )
                  END DO
                  jlim = max( iedge, pedge )
*
*                 T(i+1:k,i) := T(i+1:k,i) - tau(i) *
*                    V(jlim:n-k+i-1,i+1:k)**T * V(jlim:n-k+i-1,i)
*
                  CALL dgemv( 'Transpose', n-k+i-jlim, k-i, -tau( i ),
     $                        v( jlim, i+1 ), ldv, v( jlim, i ), 1,
     $                        one, t( i+1, i ), 1 )
               ELSE
*
*                 Skip any leading zeros: scan row i of V over
*                 columns 1 to i-1; IEDGE stops at the first nonzero
*                 entry, or at i if none is found.
*
                  iedge = 1
                  DO WHILE( iedge.LT.i )
                     IF( v( i, iedge ).NE.zero ) EXIT
                     iedge = iedge + 1
                  END DO
                  DO jj = i+1, k
                     t( jj, i ) = -tau( i ) * v( jj, n-k+i )
                  END DO
                  jlim = max( iedge, pedge )
*
*                 T(i+1:k,i) := T(i+1:k,i) - tau(i) *
*                    V(i+1:k,jlim:n-k+i-1) * V(i,jlim:n-k+i-1)**T
*
                  CALL dgemv( 'No transpose', k-i, n-k+i-jlim,
     $                        -tau( i ), v( i+1, jlim ), ldv,
     $                        v( i, jlim ), ldv, one, t( i+1, i ), 1 )
               END IF
*
*              T(i+1:k,i) := T(i+1:k,i+1:k) * T(i+1:k,i)
*
               CALL dtrmv( 'Lower', 'No transpose', 'Non-unit', k-i,
     $                     t( i+1, i+1 ), ldt, t( i+1, i ), 1 )
               IF( i.LE.1 ) THEN
                  pedge = iedge
               ELSE
                  pedge = min( pedge, iedge )
               END IF
            END IF
            t( i, i ) = tau( i )
         END DO
      END IF
      RETURN
*
*     End of DLARFT
*

◆ dlarfx()

subroutine dlarfx	(	character	side,
		integer	m,
		integer	n,
		double precision, dimension( * )	v,
		double precision	tau,
		double precision, dimension( ldc, * )	c,
		integer	ldc,
		double precision, dimension( * )	work )

DLARFX applies an elementary reflector to a general rectangular matrix, with loop unrolling when the reflector has order ≤ 10.

Download DLARFX + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLARFX applies a real elementary reflector H to a real m by n
!> matrix C, from either the left or the right. H is represented in the
!> form
!>
!>       H = I - tau * v * v**T
!>
!> where tau is a real scalar and v is a real vector.
!>
!> If tau = 0, then H is taken to be the unit matrix
!>
!> This version uses inline code if H has order < 11.
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': form H * C !> = 'R': form C * H !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix C. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix C. !>
[in]	V	!> V is DOUBLE PRECISION array, dimension (M) if SIDE = 'L' !> or (N) if SIDE = 'R' !> The vector v in the representation of H. !>
[in]	TAU	!> TAU is DOUBLE PRECISION !> The value tau in the representation of H. !>
[in,out]	C	!> C is DOUBLE PRECISION array, dimension (LDC,N) !> On entry, the m by n matrix C. !> On exit, C is overwritten by the matrix H * C if SIDE = 'L', !> or C * H if SIDE = 'R'. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max(1,M). !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension !> (N) if SIDE = 'L' !> or (M) if SIDE = 'R' !> WORK is not referenced if H has order < 11. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 119 of file dlarfx.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      CHARACTER          SIDE
      INTEGER            LDC, M, N
      DOUBLE PRECISION   TAU
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   C( LDC, * ), V( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d+0, one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            J
      DOUBLE PRECISION   SUM, T1, T10, T2, T3, T4, T5, T6, T7, T8, T9,
     $                   V1, V10, V2, V3, V4, V5, V6, V7, V8, V9
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      EXTERNAL           lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL           dlarf
*     ..
*     .. Executable Statements ..
*
      IF( tau.EQ.zero )
     $   RETURN
      IF( lsame( side, 'L' ) ) THEN
*
*        Form  H * C, where H has order m.
*
         GO TO ( 10, 30, 50, 70, 90, 110, 130, 150,
     $           170, 190 )m
*
*        Code for general M
*
         CALL dlarf( side, m, n, v, 1, tau, c, ldc, work )
         GO TO 410
   10    CONTINUE
*
*        Special code for 1 x 1 Householder
*
         t1 = one - tau*v( 1 )*v( 1 )
         DO 20 j = 1, n
            c( 1, j ) = t1*c( 1, j )
   20    CONTINUE
         GO TO 410
   30    CONTINUE
*
*        Special code for 2 x 2 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         DO 40 j = 1, n
            sum = v1*c( 1, j ) + v2*c( 2, j )
            c( 1, j ) = c( 1, j ) - sum*t1
            c( 2, j ) = c( 2, j ) - sum*t2
   40    CONTINUE
         GO TO 410
   50    CONTINUE
*
*        Special code for 3 x 3 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         DO 60 j = 1, n
            sum = v1*c( 1, j ) + v2*c( 2, j ) + v3*c( 3, j )
            c( 1, j ) = c( 1, j ) - sum*t1
            c( 2, j ) = c( 2, j ) - sum*t2
            c( 3, j ) = c( 3, j ) - sum*t3
   60    CONTINUE
         GO TO 410
   70    CONTINUE
*
*        Special code for 4 x 4 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         DO 80 j = 1, n
            sum = v1*c( 1, j ) + v2*c( 2, j ) + v3*c( 3, j ) +
     $            v4*c( 4, j )
            c( 1, j ) = c( 1, j ) - sum*t1
            c( 2, j ) = c( 2, j ) - sum*t2
            c( 3, j ) = c( 3, j ) - sum*t3
            c( 4, j ) = c( 4, j ) - sum*t4
   80    CONTINUE
         GO TO 410
   90    CONTINUE
*
*        Special code for 5 x 5 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         v5 = v( 5 )
         t5 = tau*v5
         DO 100 j = 1, n
            sum = v1*c( 1, j ) + v2*c( 2, j ) + v3*c( 3, j ) +
     $            v4*c( 4, j ) + v5*c( 5, j )
            c( 1, j ) = c( 1, j ) - sum*t1
            c( 2, j ) = c( 2, j ) - sum*t2
            c( 3, j ) = c( 3, j ) - sum*t3
            c( 4, j ) = c( 4, j ) - sum*t4
            c( 5, j ) = c( 5, j ) - sum*t5
  100    CONTINUE
         GO TO 410
  110    CONTINUE
*
*        Special code for 6 x 6 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         v5 = v( 5 )
         t5 = tau*v5
         v6 = v( 6 )
         t6 = tau*v6
         DO 120 j = 1, n
            sum = v1*c( 1, j ) + v2*c( 2, j ) + v3*c( 3, j ) +
     $            v4*c( 4, j ) + v5*c( 5, j ) + v6*c( 6, j )
            c( 1, j ) = c( 1, j ) - sum*t1
            c( 2, j ) = c( 2, j ) - sum*t2
            c( 3, j ) = c( 3, j ) - sum*t3
            c( 4, j ) = c( 4, j ) - sum*t4
            c( 5, j ) = c( 5, j ) - sum*t5
            c( 6, j ) = c( 6, j ) - sum*t6
  120    CONTINUE
         GO TO 410
  130    CONTINUE
*
*        Special code for 7 x 7 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         v5 = v( 5 )
         t5 = tau*v5
         v6 = v( 6 )
         t6 = tau*v6
         v7 = v( 7 )
         t7 = tau*v7
         DO 140 j = 1, n
            sum = v1*c( 1, j ) + v2*c( 2, j ) + v3*c( 3, j ) +
     $            v4*c( 4, j ) + v5*c( 5, j ) + v6*c( 6, j ) +
     $            v7*c( 7, j )
            c( 1, j ) = c( 1, j ) - sum*t1
            c( 2, j ) = c( 2, j ) - sum*t2
            c( 3, j ) = c( 3, j ) - sum*t3
            c( 4, j ) = c( 4, j ) - sum*t4
            c( 5, j ) = c( 5, j ) - sum*t5
            c( 6, j ) = c( 6, j ) - sum*t6
            c( 7, j ) = c( 7, j ) - sum*t7
  140    CONTINUE
         GO TO 410
  150    CONTINUE
*
*        Special code for 8 x 8 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         v5 = v( 5 )
         t5 = tau*v5
         v6 = v( 6 )
         t6 = tau*v6
         v7 = v( 7 )
         t7 = tau*v7
         v8 = v( 8 )
         t8 = tau*v8
         DO 160 j = 1, n
            sum = v1*c( 1, j ) + v2*c( 2, j ) + v3*c( 3, j ) +
     $            v4*c( 4, j ) + v5*c( 5, j ) + v6*c( 6, j ) +
     $            v7*c( 7, j ) + v8*c( 8, j )
            c( 1, j ) = c( 1, j ) - sum*t1
            c( 2, j ) = c( 2, j ) - sum*t2
            c( 3, j ) = c( 3, j ) - sum*t3
            c( 4, j ) = c( 4, j ) - sum*t4
            c( 5, j ) = c( 5, j ) - sum*t5
            c( 6, j ) = c( 6, j ) - sum*t6
            c( 7, j ) = c( 7, j ) - sum*t7
            c( 8, j ) = c( 8, j ) - sum*t8
  160    CONTINUE
         GO TO 410
  170    CONTINUE
*
*        Special code for 9 x 9 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         v5 = v( 5 )
         t5 = tau*v5
         v6 = v( 6 )
         t6 = tau*v6
         v7 = v( 7 )
         t7 = tau*v7
         v8 = v( 8 )
         t8 = tau*v8
         v9 = v( 9 )
         t9 = tau*v9
         DO 180 j = 1, n
            sum = v1*c( 1, j ) + v2*c( 2, j ) + v3*c( 3, j ) +
     $            v4*c( 4, j ) + v5*c( 5, j ) + v6*c( 6, j ) +
     $            v7*c( 7, j ) + v8*c( 8, j ) + v9*c( 9, j )
            c( 1, j ) = c( 1, j ) - sum*t1
            c( 2, j ) = c( 2, j ) - sum*t2
            c( 3, j ) = c( 3, j ) - sum*t3
            c( 4, j ) = c( 4, j ) - sum*t4
            c( 5, j ) = c( 5, j ) - sum*t5
            c( 6, j ) = c( 6, j ) - sum*t6
            c( 7, j ) = c( 7, j ) - sum*t7
            c( 8, j ) = c( 8, j ) - sum*t8
            c( 9, j ) = c( 9, j ) - sum*t9
  180    CONTINUE
         GO TO 410
  190    CONTINUE
*
*        Special code for 10 x 10 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         v5 = v( 5 )
         t5 = tau*v5
         v6 = v( 6 )
         t6 = tau*v6
         v7 = v( 7 )
         t7 = tau*v7
         v8 = v( 8 )
         t8 = tau*v8
         v9 = v( 9 )
         t9 = tau*v9
         v10 = v( 10 )
         t10 = tau*v10
         DO 200 j = 1, n
            sum = v1*c( 1, j ) + v2*c( 2, j ) + v3*c( 3, j ) +
     $            v4*c( 4, j ) + v5*c( 5, j ) + v6*c( 6, j ) +
     $            v7*c( 7, j ) + v8*c( 8, j ) + v9*c( 9, j ) +
     $            v10*c( 10, j )
            c( 1, j ) = c( 1, j ) - sum*t1
            c( 2, j ) = c( 2, j ) - sum*t2
            c( 3, j ) = c( 3, j ) - sum*t3
            c( 4, j ) = c( 4, j ) - sum*t4
            c( 5, j ) = c( 5, j ) - sum*t5
            c( 6, j ) = c( 6, j ) - sum*t6
            c( 7, j ) = c( 7, j ) - sum*t7
            c( 8, j ) = c( 8, j ) - sum*t8
            c( 9, j ) = c( 9, j ) - sum*t9
            c( 10, j ) = c( 10, j ) - sum*t10
  200    CONTINUE
         GO TO 410
      ELSE
*
*        Form  C * H, where H has order n.
*
         GO TO ( 210, 230, 250, 270, 290, 310, 330, 350,
     $           370, 390 )n
*
*        Code for general N
*
         CALL dlarf( side, m, n, v, 1, tau, c, ldc, work )
         GO TO 410
  210    CONTINUE
*
*        Special code for 1 x 1 Householder
*
         t1 = one - tau*v( 1 )*v( 1 )
         DO 220 j = 1, m
            c( j, 1 ) = t1*c( j, 1 )
  220    CONTINUE
         GO TO 410
  230    CONTINUE
*
*        Special code for 2 x 2 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         DO 240 j = 1, m
            sum = v1*c( j, 1 ) + v2*c( j, 2 )
            c( j, 1 ) = c( j, 1 ) - sum*t1
            c( j, 2 ) = c( j, 2 ) - sum*t2
  240    CONTINUE
         GO TO 410
  250    CONTINUE
*
*        Special code for 3 x 3 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         DO 260 j = 1, m
            sum = v1*c( j, 1 ) + v2*c( j, 2 ) + v3*c( j, 3 )
            c( j, 1 ) = c( j, 1 ) - sum*t1
            c( j, 2 ) = c( j, 2 ) - sum*t2
            c( j, 3 ) = c( j, 3 ) - sum*t3
  260    CONTINUE
         GO TO 410
  270    CONTINUE
*
*        Special code for 4 x 4 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         DO 280 j = 1, m
            sum = v1*c( j, 1 ) + v2*c( j, 2 ) + v3*c( j, 3 ) +
     $            v4*c( j, 4 )
            c( j, 1 ) = c( j, 1 ) - sum*t1
            c( j, 2 ) = c( j, 2 ) - sum*t2
            c( j, 3 ) = c( j, 3 ) - sum*t3
            c( j, 4 ) = c( j, 4 ) - sum*t4
  280    CONTINUE
         GO TO 410
  290    CONTINUE
*
*        Special code for 5 x 5 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         v5 = v( 5 )
         t5 = tau*v5
         DO 300 j = 1, m
            sum = v1*c( j, 1 ) + v2*c( j, 2 ) + v3*c( j, 3 ) +
     $            v4*c( j, 4 ) + v5*c( j, 5 )
            c( j, 1 ) = c( j, 1 ) - sum*t1
            c( j, 2 ) = c( j, 2 ) - sum*t2
            c( j, 3 ) = c( j, 3 ) - sum*t3
            c( j, 4 ) = c( j, 4 ) - sum*t4
            c( j, 5 ) = c( j, 5 ) - sum*t5
  300    CONTINUE
         GO TO 410
  310    CONTINUE
*
*        Special code for 6 x 6 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         v5 = v( 5 )
         t5 = tau*v5
         v6 = v( 6 )
         t6 = tau*v6
         DO 320 j = 1, m
            sum = v1*c( j, 1 ) + v2*c( j, 2 ) + v3*c( j, 3 ) +
     $            v4*c( j, 4 ) + v5*c( j, 5 ) + v6*c( j, 6 )
            c( j, 1 ) = c( j, 1 ) - sum*t1
            c( j, 2 ) = c( j, 2 ) - sum*t2
            c( j, 3 ) = c( j, 3 ) - sum*t3
            c( j, 4 ) = c( j, 4 ) - sum*t4
            c( j, 5 ) = c( j, 5 ) - sum*t5
            c( j, 6 ) = c( j, 6 ) - sum*t6
  320    CONTINUE
         GO TO 410
  330    CONTINUE
*
*        Special code for 7 x 7 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         v5 = v( 5 )
         t5 = tau*v5
         v6 = v( 6 )
         t6 = tau*v6
         v7 = v( 7 )
         t7 = tau*v7
         DO 340 j = 1, m
            sum = v1*c( j, 1 ) + v2*c( j, 2 ) + v3*c( j, 3 ) +
     $            v4*c( j, 4 ) + v5*c( j, 5 ) + v6*c( j, 6 ) +
     $            v7*c( j, 7 )
            c( j, 1 ) = c( j, 1 ) - sum*t1
            c( j, 2 ) = c( j, 2 ) - sum*t2
            c( j, 3 ) = c( j, 3 ) - sum*t3
            c( j, 4 ) = c( j, 4 ) - sum*t4
            c( j, 5 ) = c( j, 5 ) - sum*t5
            c( j, 6 ) = c( j, 6 ) - sum*t6
            c( j, 7 ) = c( j, 7 ) - sum*t7
  340    CONTINUE
         GO TO 410
  350    CONTINUE
*
*        Special code for 8 x 8 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         v5 = v( 5 )
         t5 = tau*v5
         v6 = v( 6 )
         t6 = tau*v6
         v7 = v( 7 )
         t7 = tau*v7
         v8 = v( 8 )
         t8 = tau*v8
         DO 360 j = 1, m
            sum = v1*c( j, 1 ) + v2*c( j, 2 ) + v3*c( j, 3 ) +
     $            v4*c( j, 4 ) + v5*c( j, 5 ) + v6*c( j, 6 ) +
     $            v7*c( j, 7 ) + v8*c( j, 8 )
            c( j, 1 ) = c( j, 1 ) - sum*t1
            c( j, 2 ) = c( j, 2 ) - sum*t2
            c( j, 3 ) = c( j, 3 ) - sum*t3
            c( j, 4 ) = c( j, 4 ) - sum*t4
            c( j, 5 ) = c( j, 5 ) - sum*t5
            c( j, 6 ) = c( j, 6 ) - sum*t6
            c( j, 7 ) = c( j, 7 ) - sum*t7
            c( j, 8 ) = c( j, 8 ) - sum*t8
  360    CONTINUE
         GO TO 410
  370    CONTINUE
*
*        Special code for 9 x 9 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         v5 = v( 5 )
         t5 = tau*v5
         v6 = v( 6 )
         t6 = tau*v6
         v7 = v( 7 )
         t7 = tau*v7
         v8 = v( 8 )
         t8 = tau*v8
         v9 = v( 9 )
         t9 = tau*v9
         DO 380 j = 1, m
            sum = v1*c( j, 1 ) + v2*c( j, 2 ) + v3*c( j, 3 ) +
     $            v4*c( j, 4 ) + v5*c( j, 5 ) + v6*c( j, 6 ) +
     $            v7*c( j, 7 ) + v8*c( j, 8 ) + v9*c( j, 9 )
            c( j, 1 ) = c( j, 1 ) - sum*t1
            c( j, 2 ) = c( j, 2 ) - sum*t2
            c( j, 3 ) = c( j, 3 ) - sum*t3
            c( j, 4 ) = c( j, 4 ) - sum*t4
            c( j, 5 ) = c( j, 5 ) - sum*t5
            c( j, 6 ) = c( j, 6 ) - sum*t6
            c( j, 7 ) = c( j, 7 ) - sum*t7
            c( j, 8 ) = c( j, 8 ) - sum*t8
            c( j, 9 ) = c( j, 9 ) - sum*t9
  380    CONTINUE
         GO TO 410
  390    CONTINUE
*
*        Special code for 10 x 10 Householder
*
         v1 = v( 1 )
         t1 = tau*v1
         v2 = v( 2 )
         t2 = tau*v2
         v3 = v( 3 )
         t3 = tau*v3
         v4 = v( 4 )
         t4 = tau*v4
         v5 = v( 5 )
         t5 = tau*v5
         v6 = v( 6 )
         t6 = tau*v6
         v7 = v( 7 )
         t7 = tau*v7
         v8 = v( 8 )
         t8 = tau*v8
         v9 = v( 9 )
         t9 = tau*v9
         v10 = v( 10 )
         t10 = tau*v10
         DO 400 j = 1, m
            sum = v1*c( j, 1 ) + v2*c( j, 2 ) + v3*c( j, 3 ) +
     $            v4*c( j, 4 ) + v5*c( j, 5 ) + v6*c( j, 6 ) +
     $            v7*c( j, 7 ) + v8*c( j, 8 ) + v9*c( j, 9 ) +
     $            v10*c( j, 10 )
            c( j, 1 ) = c( j, 1 ) - sum*t1
            c( j, 2 ) = c( j, 2 ) - sum*t2
            c( j, 3 ) = c( j, 3 ) - sum*t3
            c( j, 4 ) = c( j, 4 ) - sum*t4
            c( j, 5 ) = c( j, 5 ) - sum*t5
            c( j, 6 ) = c( j, 6 ) - sum*t6
            c( j, 7 ) = c( j, 7 ) - sum*t7
            c( j, 8 ) = c( j, 8 ) - sum*t8
            c( j, 9 ) = c( j, 9 ) - sum*t9
            c( j, 10 ) = c( j, 10 ) - sum*t10
  400    CONTINUE
         GO TO 410
      END IF
  410 CONTINUE
      RETURN
*
*     End of DLARFX
*

◆ dlarfy()

subroutine dlarfy	(	character	uplo,
		integer	n,
		double precision, dimension( * )	v,
		integer	incv,
		double precision	tau,
		double precision, dimension( ldc, * )	c,
		integer	ldc,
		double precision, dimension( * )	work )

DLARFY

Purpose:

!>
!> DLARFY applies an elementary reflector, or Householder matrix, H,
!> to an n x n symmetric matrix C, from both the left and the right.
!>
!> H is represented in the form
!>
!>    H = I - tau * v * v'
!>
!> where  tau  is a scalar and  v  is a vector.
!>
!> If  tau  is  zero, then  H  is taken to be the unit matrix.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the upper or lower triangular part of the !> symmetric matrix C is stored. !> = 'U': Upper triangle !> = 'L': Lower triangle !>
[in]	N	!> N is INTEGER !> The number of rows and columns of the matrix C. N >= 0. !>
[in]	V	!> V is DOUBLE PRECISION array, dimension !> (1 + (N-1)*abs(INCV)) !> The vector v as described above. !>
[in]	INCV	!> INCV is INTEGER !> The increment between successive elements of v. INCV must !> not be zero. !>
[in]	TAU	!> TAU is DOUBLE PRECISION !> The value tau as described above. !>
[in,out]	C	!> C is DOUBLE PRECISION array, dimension (LDC, N) !> On entry, the matrix C. !> On exit, C is overwritten by H * C * H'. !>
[in]	LDC	!> LDC is INTEGER !> The leading dimension of the array C. LDC >= max( 1, N ). !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (N) !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 107 of file dlarfy.f.

*
*  -- LAPACK test routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Two-sided application of the elementary reflector
*     H = I - tau * v * v'  to the symmetric matrix C, i.e.
*     C := H * C * H', touching only the triangle selected by UPLO.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INCV, LDC, N
      DOUBLE PRECISION   TAU
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   C( LDC, * ), V( * ), WORK( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, ZERO, HALF
      PARAMETER          ( ONE = 1.0D+0, ZERO = 0.0D+0,
     $                     HALF = 0.5D+0 )
*     ..
*     .. Local Scalars ..
      DOUBLE PRECISION   VTW, WSHIFT
*     ..
*     .. External Subroutines ..
      EXTERNAL           DAXPY, DSYMV, DSYR2
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DDOT
      EXTERNAL           DDOT
*     ..
*     .. Executable Statements ..
*
*     When tau is zero H is the identity and C is left untouched.
*
      IF( TAU.NE.ZERO ) THEN
*
*        w := C * v   (w is held in WORK with unit stride)
*
         CALL DSYMV( UPLO, N, ONE, C, LDC, V, INCV, ZERO, WORK, 1 )
*
*        w := w - (1/2) * tau * ( w' * v ) * v
*
         VTW = DDOT( N, WORK, 1, V, INCV )
         WSHIFT = -HALF*TAU*VTW
         CALL DAXPY( N, WSHIFT, V, INCV, WORK, 1 )
*
*        C := C - tau * ( v * w' + w * v' )
*
         CALL DSYR2( UPLO, N, -TAU, V, INCV, WORK, 1, C, LDC )
      END IF
*
      RETURN
*
*     End of DLARFY
*

◆ dlargv()

subroutine dlargv	(	integer	n,
		double precision, dimension( * )	x,
		integer	incx,
		double precision, dimension( * )	y,
		integer	incy,
		double precision, dimension( * )	c,
		integer	incc )

DLARGV generates a vector of plane rotations with real cosines and real sines.

Download DLARGV + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLARGV generates a vector of real plane rotations, determined by
!> elements of the real vectors x and y. For i = 1,2,...,n
!>
!>    (  c(i)  s(i) ) ( x(i) ) = ( a(i) )
!>    ( -s(i)  c(i) ) ( y(i) ) = (   0  )
!>

Parameters

[in]	N	!> N is INTEGER !> The number of plane rotations to be generated. !>
[in,out]	X	!> X is DOUBLE PRECISION array, !> dimension (1+(N-1)*INCX) !> On entry, the vector x. !> On exit, x(i) is overwritten by a(i), for i = 1,...,n. !>
[in]	INCX	!> INCX is INTEGER !> The increment between elements of X. INCX > 0. !>
[in,out]	Y	!> Y is DOUBLE PRECISION array, !> dimension (1+(N-1)*INCY) !> On entry, the vector y. !> On exit, the sines of the plane rotations. !>
[in]	INCY	!> INCY is INTEGER !> The increment between elements of Y. INCY > 0. !>
[out]	C	!> C is DOUBLE PRECISION array, dimension (1+(N-1)*INCC) !> The cosines of the plane rotations. !>
[in]	INCC	!> INCC is INTEGER !> The increment between elements of C. INCC > 0. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 103 of file dlargv.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     For each of the N pairs ( x(i), y(i) ) build the plane rotation
*     that zeroes the second component: the cosine goes to C, the
*     sine overwrites Y and the rotated first component overwrites X.
*
*     .. Scalar Arguments ..
      INTEGER            INCC, INCX, INCY, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   C( * ), X( * ), Y( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE
      PARAMETER          ( ZERO = 0.0D+0, ONE = 1.0D+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            K, KC, KX, KY
      DOUBLE PRECISION   CS, RATIO, SCL, SN, XK, YK
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          ABS, SQRT
*     ..
*     .. Executable Statements ..
*
*     KX, KY and KC are the current positions inside X, Y and C.
*
      KX = 1
      KY = 1
      KC = 1
      DO K = 1, N
         XK = X( KX )
         YK = Y( KY )
         IF( YK.NE.ZERO ) THEN
            IF( XK.EQ.ZERO ) THEN
*
*              Pure swap: cosine 0, sine 1, a(i) = y(i).
*
               C( KC ) = ZERO
               Y( KY ) = ONE
               X( KX ) = YK
            ELSE IF( ABS( XK ).GT.ABS( YK ) ) THEN
*
*              |x| dominates: scale by x so that |RATIO| < 1.
*
               RATIO = YK / XK
               SCL = SQRT( ONE+RATIO*RATIO )
               CS = ONE / SCL
               C( KC ) = CS
               Y( KY ) = RATIO*CS
               X( KX ) = XK*SCL
            ELSE
*
*              |y| dominates (or ties): scale by y instead.
*
               RATIO = XK / YK
               SCL = SQRT( ONE+RATIO*RATIO )
               SN = ONE / SCL
               Y( KY ) = SN
               C( KC ) = RATIO*SN
               X( KX ) = YK*SCL
            END IF
         ELSE
*
*           y(i) is already zero: only the cosine is set (to one);
*           X and Y are not modified.
*
            C( KC ) = ONE
         END IF
         KX = KX + INCX
         KY = KY + INCY
         KC = KC + INCC
      END DO
      RETURN
*
*     End of DLARGV
*

◆ dlarrv()

subroutine dlarrv	(	integer	n,
		double precision	vl,
		double precision	vu,
		double precision, dimension( * )	d,
		double precision, dimension( * )	l,
		double precision	pivmin,
		integer, dimension( * )	isplit,
		integer	m,
		integer	dol,
		integer	dou,
		double precision	minrgp,
		double precision	rtol1,
		double precision	rtol2,
		double precision, dimension( * )	w,
		double precision, dimension( * )	werr,
		double precision, dimension( * )	wgap,
		integer, dimension( * )	iblock,
		integer, dimension( * )	indexw,
		double precision, dimension( * )	gers,
		double precision, dimension( ldz, * )	z,
		integer	ldz,
		integer, dimension( * )	isuppz,
		double precision, dimension( * )	work,
		integer, dimension( * )	iwork,
		integer	info )

DLARRV computes the eigenvectors of the tridiagonal matrix T = L D LT given L, D and the eigenvalues of L D LT.

Download DLARRV + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLARRV computes the eigenvectors of the tridiagonal matrix
!> T = L D L**T given L, D and APPROXIMATIONS to the eigenvalues of L D L**T.
!> The input eigenvalues should have been computed by DLARRE.
!>

Parameters

[in]	N	!> N is INTEGER !> The order of the matrix. N >= 0. !>
[in]	VL	!> VL is DOUBLE PRECISION !> Lower bound of the interval that contains the desired !> eigenvalues. VL < VU. Needed to compute gaps on the left or right !> end of the extremal eigenvalues in the desired RANGE. !>
[in]	VU	!> VU is DOUBLE PRECISION !> Upper bound of the interval that contains the desired !> eigenvalues. VL < VU. !> Note: VU is currently not used by this implementation of DLARRV, VU is !> passed to DLARRV because it could be used to compute gaps on the right end !> of the extremal eigenvalues. However, with not much initial accuracy in !> LAMBDA and VU, the formula can lead to an overestimation of the right gap !> and thus to inadequately early RQI 'convergence'. This is currently !> prevented by forcing a small right gap. And so it turns out that VU !> is currently not used by this implementation of DLARRV. !>
[in,out]	D	!> D is DOUBLE PRECISION array, dimension (N) !> On entry, the N diagonal elements of the diagonal matrix D. !> On exit, D may be overwritten. !>
[in,out]	L	!> L is DOUBLE PRECISION array, dimension (N) !> On entry, the (N-1) subdiagonal elements of the unit !> bidiagonal matrix L are in elements 1 to N-1 of L !> (if the matrix is not split.) At the end of each block !> is stored the corresponding shift as given by DLARRE. !> On exit, L is overwritten. !>
[in]	PIVMIN	!> PIVMIN is DOUBLE PRECISION !> The minimum pivot allowed in the Sturm sequence. !>
[in]	ISPLIT	!> ISPLIT is INTEGER array, dimension (N) !> The splitting points, at which T breaks up into blocks. !> The first block consists of rows/columns 1 to !> ISPLIT( 1 ), the second of rows/columns ISPLIT( 1 )+1 !> through ISPLIT( 2 ), etc. !>
[in]	M	!> M is INTEGER !> The total number of input eigenvalues. 0 <= M <= N. !>
[in]	DOL	!> DOL is INTEGER !>
[in]	DOU	!> DOU is INTEGER !> If the user wants to compute only selected eigenvectors from all !> the eigenvalues supplied, he can specify an index range DOL:DOU. !> Or else the setting DOL=1, DOU=M should be applied. !> Note that DOL and DOU refer to the order in which the eigenvalues !> are stored in W. !> If the user wants to compute only selected eigenpairs, then !> the columns DOL-1 to DOU+1 of the eigenvector space Z contain the !> computed eigenvectors. All other columns of Z are set to zero. !>
[in]	MINRGP	!> MINRGP is DOUBLE PRECISION !>
[in]	RTOL1	!> RTOL1 is DOUBLE PRECISION !>
[in]	RTOL2	!> RTOL2 is DOUBLE PRECISION !> Parameters for bisection. !> An interval [LEFT,RIGHT] has converged if !> RIGHT-LEFT < MAX( RTOL1*GAP, RTOL2*MAX(\|LEFT\|,\|RIGHT\|) ) !>
[in,out]	W	!> W is DOUBLE PRECISION array, dimension (N) !> The first M elements of W contain the APPROXIMATE eigenvalues for !> which eigenvectors are to be computed. The eigenvalues !> should be grouped by split-off block and ordered from !> smallest to largest within the block ( The output array !> W from DLARRE is expected here ). Furthermore, they are with !> respect to the shift of the corresponding root representation !> for their block. On exit, W holds the eigenvalues of the !> UNshifted matrix. !>
[in,out]	WERR	!> WERR is DOUBLE PRECISION array, dimension (N) !> The first M elements contain the semiwidth of the uncertainty !> interval of the corresponding eigenvalue in W !>
[in,out]	WGAP	!> WGAP is DOUBLE PRECISION array, dimension (N) !> The separation from the right neighbor eigenvalue in W. !>
[in]	IBLOCK	!> IBLOCK is INTEGER array, dimension (N) !> The indices of the blocks (submatrices) associated with the !> corresponding eigenvalues in W; IBLOCK(i)=1 if eigenvalue !> W(i) belongs to the first block from the top, =2 if W(i) !> belongs to the second block, etc. !>
[in]	INDEXW	!> INDEXW is INTEGER array, dimension (N) !> The indices of the eigenvalues within each block (submatrix); !> for example, INDEXW(i)= 10 and IBLOCK(i)=2 imply that the !> i-th eigenvalue W(i) is the 10-th eigenvalue in the second block. !>
[in]	GERS	!> GERS is DOUBLE PRECISION array, dimension (2*N) !> The N Gerschgorin intervals (the i-th Gerschgorin interval !> is (GERS(2*i-1), GERS(2*i))). The Gerschgorin intervals should !> be computed from the original UNshifted matrix. !>
[out]	Z	!> Z is DOUBLE PRECISION array, dimension (LDZ, max(1,M) ) !> If INFO = 0, the first M columns of Z contain the !> orthonormal eigenvectors of the matrix T !> corresponding to the input eigenvalues, with the i-th !> column of Z holding the eigenvector associated with W(i). !> Note: the user must ensure that at least max(1,M) columns are !> supplied in the array Z. !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. LDZ >= 1, and if !> JOBZ = 'V', LDZ >= max(1,N). !>
[out]	ISUPPZ	!> ISUPPZ is INTEGER array, dimension ( 2*max(1,M) ) !> The support of the eigenvectors in Z, i.e., the indices !> indicating the nonzero elements in Z. The I-th eigenvector !> is nonzero only in elements ISUPPZ( 2*I-1 ) through !> ISUPPZ( 2*I ). !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension (12*N) !>
[out]	IWORK	!> IWORK is INTEGER array, dimension (7*N) !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> !> > 0: A problem occurred in DLARRV. !> < 0: One of the called subroutines signaled an internal problem. !> Needs inspection of the corresponding parameter IINFO !> for further information. !> !> =-1: Problem in DLARRB when refining a child's eigenvalues. !> =-2: Problem in DLARRF when computing the RRR of a child. !> When a child is inside a tight cluster, it can be difficult !> to find an RRR. A partial remedy from the user's point of !> view is to make the parameter MINRGP smaller and recompile. !> However, as the orthogonality of the computed vectors is !> proportional to 1/MINRGP, the user should be aware that !> he might be trading in precision when he decreases MINRGP. !> =-3: Problem in DLARRB when refining a single eigenvalue !> after the Rayleigh correction was rejected. !> = 5: The Rayleigh Quotient Iteration failed to converge to !> full accuracy in MAXITR steps. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Contributors: Beresford Parlett, University of California, Berkeley, USA
Jim Demmel, University of California, Berkeley, USA
Inderjit Dhillon, University of Texas, Austin, USA
Osni Marques, LBNL/NERSC, USA
Christof Voemel, University of California, Berkeley, USA

Definition at line 287 of file dlarrv.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     .. Scalar Arguments ..
      INTEGER            DOL, DOU, INFO, LDZ, M, N
      DOUBLE PRECISION   MINRGP, PIVMIN, RTOL1, RTOL2, VL, VU
*     ..
*     .. Array Arguments ..
      INTEGER            IBLOCK( * ), INDEXW( * ), ISPLIT( * ),
     $                   ISUPPZ( * ), IWORK( * )
      DOUBLE PRECISION   D( * ), GERS( * ), L( * ), W( * ), WERR( * ),
     $                   WGAP( * ), WORK( * )
      DOUBLE PRECISION  Z( LDZ, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            MAXITR
      parameter( maxitr = 10 )
      DOUBLE PRECISION   ZERO, ONE, TWO, THREE, FOUR, HALF
      parameter( zero = 0.0d0, one = 1.0d0,
     $                     two = 2.0d0, three = 3.0d0,
     $                     four = 4.0d0, half = 0.5d0)
*     ..
*     .. Local Scalars ..
      LOGICAL            ESKIP, NEEDBS, STP2II, TRYRQC, USEDBS, USEDRQ
      INTEGER            DONE, I, IBEGIN, IDONE, IEND, II, IINDC1,
     $                   IINDC2, IINDR, IINDWK, IINFO, IM, IN, INDEIG,
     $                   INDLD, INDLLD, INDWRK, ISUPMN, ISUPMX, ITER,
     $                   ITMP1, J, JBLK, K, MINIWSIZE, MINWSIZE, NCLUS,
     $                   NDEPTH, NEGCNT, NEWCLS, NEWFST, NEWFTT, NEWLST,
     $                   NEWSIZ, OFFSET, OLDCLS, OLDFST, OLDIEN, OLDLST,
     $                   OLDNCL, P, PARITY, Q, WBEGIN, WEND, WINDEX,
     $                   WINDMN, WINDPL, ZFROM, ZTO, ZUSEDL, ZUSEDU,
     $                   ZUSEDW
      DOUBLE PRECISION   BSTRES, BSTW, EPS, FUDGE, GAP, GAPTOL, GL, GU,
     $                   LAMBDA, LEFT, LGAP, MINGMA, NRMINV, RESID,
     $                   RGAP, RIGHT, RQCORR, RQTOL, SAVGAP, SGNDEF,
     $                   SIGMA, SPDIAM, SSIGMA, TAU, TMP, TOL, ZTZ
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           dlamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           dcopy, dlar1v, dlarrb, dlarrf, dlaset,
     $                   dscal
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC abs, dble, max, min
*     ..
*     .. Executable Statements ..
*     ..
 
      info = 0
*
*     Quick return if possible
*
      IF( (n.LE.0).OR.(m.LE.0) ) THEN
         RETURN
      END IF
*
*     The first N entries of WORK are reserved for the eigenvalues
      indld = n+1
      indlld= 2*n+1
      indwrk= 3*n+1
      minwsize = 12 * n
 
      DO 5 i= 1,minwsize
         work( i ) = zero
 5    CONTINUE
 
*     IWORK(IINDR+1:IINDR+N) hold the twist indices R for the
*     factorization used to compute the FP vector
      iindr = 0
*     IWORK(IINDC1+1:IINC2+N) are used to store the clusters of the current
*     layer and the one above.
      iindc1 = n
      iindc2 = 2*n
      iindwk = 3*n + 1
 
      miniwsize = 7 * n
      DO 10 i= 1,miniwsize
         iwork( i ) = 0
 10   CONTINUE
 
      zusedl = 1
      IF(dol.GT.1) THEN
*        Set lower bound for use of Z
         zusedl = dol-1
      ENDIF
      zusedu = m
      IF(dou.LT.m) THEN
*        Set lower bound for use of Z
         zusedu = dou+1
      ENDIF
*     The width of the part of Z that is used
      zusedw = zusedu - zusedl + 1
 
 
      CALL dlaset( 'Full', n, zusedw, zero, zero,
     $                    z(1,zusedl), ldz )
 
      eps = dlamch( 'Precision' )
      rqtol = two * eps
*
*     Set expert flags for standard code.
      tryrqc = .true.
 
      IF((dol.EQ.1).AND.(dou.EQ.m)) THEN
      ELSE
*        Only selected eigenpairs are computed. Since the other evalues
*        are not refined by RQ iteration, bisection has to compute to full
*        accuracy.
         rtol1 = four * eps
         rtol2 = four * eps
      ENDIF
 
*     The entries WBEGIN:WEND in W, WERR, WGAP correspond to the
*     desired eigenvalues. The support of the nonzero eigenvector
*     entries is contained in the interval IBEGIN:IEND.
*     Remark that if k eigenpairs are desired, then the eigenvectors
*     are stored in k contiguous columns of Z.
 
*     DONE is the number of eigenvectors already computed
      done = 0
      ibegin = 1
      wbegin = 1
      DO 170 jblk = 1, iblock( m )
         iend = isplit( jblk )
         sigma = l( iend )
*        Find the eigenvectors of the submatrix indexed IBEGIN
*        through IEND.
         wend = wbegin - 1
 15      CONTINUE
         IF( wend.LT.m ) THEN
            IF( iblock( wend+1 ).EQ.jblk ) THEN
               wend = wend + 1
               GO TO 15
            END IF
         END IF
         IF( wend.LT.wbegin ) THEN
            ibegin = iend + 1
            GO TO 170
         ELSEIF( (wend.LT.dol).OR.(wbegin.GT.dou) ) THEN
            ibegin = iend + 1
            wbegin = wend + 1
            GO TO 170
         END IF
 
*        Find local spectral diameter of the block
         gl = gers( 2*ibegin-1 )
         gu = gers( 2*ibegin )
         DO 20 i = ibegin+1 , iend
            gl = min( gers( 2*i-1 ), gl )
            gu = max( gers( 2*i ), gu )
 20      CONTINUE
         spdiam = gu - gl
 
*        OLDIEN is the last index of the previous block
         oldien = ibegin - 1
*        Calculate the size of the current block
         in = iend - ibegin + 1
*        The number of eigenvalues in the current block
         im = wend - wbegin + 1
 
*        This is for a 1x1 block
         IF( ibegin.EQ.iend ) THEN
            done = done+1
            z( ibegin, wbegin ) = one
            isuppz( 2*wbegin-1 ) = ibegin
            isuppz( 2*wbegin ) = ibegin
            w( wbegin ) = w( wbegin ) + sigma
            work( wbegin ) = w( wbegin )
            ibegin = iend + 1
            wbegin = wbegin + 1
            GO TO 170
         END IF
 
*        The desired (shifted) eigenvalues are stored in W(WBEGIN:WEND)
*        Note that these can be approximations, in this case, the corresp.
*        entries of WERR give the size of the uncertainty interval.
*        The eigenvalue approximations will be refined when necessary as
*        high relative accuracy is required for the computation of the
*        corresponding eigenvectors.
         CALL dcopy( im, w( wbegin ), 1,
     $                   work( wbegin ), 1 )
 
*        We store in W the eigenvalue approximations w.r.t. the original
*        matrix T.
         DO 30 i=1,im
            w(wbegin+i-1) = w(wbegin+i-1)+sigma
 30      CONTINUE
 
 
*        NDEPTH is the current depth of the representation tree
         ndepth = 0
*        PARITY is either 1 or 0
         parity = 1
*        NCLUS is the number of clusters for the next level of the
*        representation tree, we start with NCLUS = 1 for the root
         nclus = 1
         iwork( iindc1+1 ) = 1
         iwork( iindc1+2 ) = im
 
*        IDONE is the number of eigenvectors already computed in the current
*        block
         idone = 0
*        loop while( IDONE.LT.IM )
*        generate the representation tree for the current block and
*        compute the eigenvectors
   40    CONTINUE
         IF( idone.LT.im ) THEN
*           This is a crude protection against infinitely deep trees
            IF( ndepth.GT.m ) THEN
               info = -2
               RETURN
            ENDIF
*           breadth first processing of the current level of the representation
*           tree: OLDNCL = number of clusters on current level
            oldncl = nclus
*           reset NCLUS to count the number of child clusters
            nclus = 0
*
            parity = 1 - parity
            IF( parity.EQ.0 ) THEN
               oldcls = iindc1
               newcls = iindc2
            ELSE
               oldcls = iindc2
               newcls = iindc1
            END IF
*           Process the clusters on the current level
            DO 150 i = 1, oldncl
               j = oldcls + 2*i
*              OLDFST, OLDLST = first, last index of current cluster.
*                               cluster indices start with 1 and are relative
*                               to WBEGIN when accessing W, WGAP, WERR, Z
               oldfst = iwork( j-1 )
               oldlst = iwork( j )
               IF( ndepth.GT.0 ) THEN
*                 Retrieve relatively robust representation (RRR) of cluster
*                 that has been computed at the previous level
*                 The RRR is stored in Z and overwritten once the eigenvectors
*                 have been computed or when the cluster is refined
 
                  IF((dol.EQ.1).AND.(dou.EQ.m)) THEN
*                    Get representation from location of the leftmost evalue
*                    of the cluster
                     j = wbegin + oldfst - 1
                  ELSE
                     IF(wbegin+oldfst-1.LT.dol) THEN
*                       Get representation from the left end of Z array
                        j = dol - 1
                     ELSEIF(wbegin+oldfst-1.GT.dou) THEN
*                       Get representation from the right end of Z array
                        j = dou
                     ELSE
                        j = wbegin + oldfst - 1
                     ENDIF
                  ENDIF
                  CALL dcopy( in, z( ibegin, j ), 1, d( ibegin ), 1 )
                  CALL dcopy( in-1, z( ibegin, j+1 ), 1, l( ibegin ),
     $               1 )
                  sigma = z( iend, j+1 )
 
*                 Set the corresponding entries in Z to zero
                  CALL dlaset( 'Full', in, 2, zero, zero,
     $                         z( ibegin, j), ldz )
               END IF
 
*              Compute DL and DLL of current RRR
               DO 50 j = ibegin, iend-1
                  tmp = d( j )*l( j )
                  work( indld-1+j ) = tmp
                  work( indlld-1+j ) = tmp*l( j )
   50          CONTINUE
 
               IF( ndepth.GT.0 ) THEN
*                 P and Q are index of the first and last eigenvalue to compute
*                 within the current block
                  p = indexw( wbegin-1+oldfst )
                  q = indexw( wbegin-1+oldlst )
*                 Offset for the arrays WORK, WGAP and WERR, i.e., the P-OFFSET
*                 through the Q-OFFSET elements of these arrays are to be used.
*                  OFFSET = P-OLDFST
                  offset = indexw( wbegin ) - 1
*                 perform limited bisection (if necessary) to get approximate
*                 eigenvalues to the precision needed.
                  CALL dlarrb( in, d( ibegin ),
     $                         work(indlld+ibegin-1),
     $                         p, q, rtol1, rtol2, offset,
     $                         work(wbegin),wgap(wbegin),werr(wbegin),
     $                         work( indwrk ), iwork( iindwk ),
     $                         pivmin, spdiam, in, iinfo )
                  IF( iinfo.NE.0 ) THEN
                     info = -1
                     RETURN
                  ENDIF
*                 We also recompute the extremal gaps. W holds all eigenvalues
*                 of the unshifted matrix and must be used for computation
*                 of WGAP, the entries of WORK might stem from RRRs with
*                 different shifts. The gaps from WBEGIN-1+OLDFST to
*                 WBEGIN-1+OLDLST are correctly computed in DLARRB.
*                 However, we only allow the gaps to become greater since
*                 this is what should happen when we decrease WERR
                  IF( oldfst.GT.1) THEN
                     wgap( wbegin+oldfst-2 ) =
     $             max(wgap(wbegin+oldfst-2),
     $                 w(wbegin+oldfst-1)-werr(wbegin+oldfst-1)
     $                 - w(wbegin+oldfst-2)-werr(wbegin+oldfst-2) )
                  ENDIF
                  IF( wbegin + oldlst -1 .LT. wend ) THEN
                     wgap( wbegin+oldlst-1 ) =
     $               max(wgap(wbegin+oldlst-1),
     $                   w(wbegin+oldlst)-werr(wbegin+oldlst)
     $                   - w(wbegin+oldlst-1)-werr(wbegin+oldlst-1) )
                  ENDIF
*                 Each time the eigenvalues in WORK get refined, we store
*                 the newly found approximation with all shifts applied in W
                  DO 53 j=oldfst,oldlst
                     w(wbegin+j-1) = work(wbegin+j-1)+sigma
 53               CONTINUE
               END IF
 
*              Process the current node.
               newfst = oldfst
               DO 140 j = oldfst, oldlst
                  IF( j.EQ.oldlst ) THEN
*                    we are at the right end of the cluster, this is also the
*                    boundary of the child cluster
                     newlst = j
                  ELSE IF ( wgap( wbegin + j -1).GE.
     $                    minrgp* abs( work(wbegin + j -1) ) ) THEN
*                    the right relative gap is big enough, the child cluster
*                    (NEWFST,..,NEWLST) is well separated from the following
                     newlst = j
                   ELSE
*                    inside a child cluster, the relative gap is not
*                    big enough.
                     GOTO 140
                  END IF
 
*                 Compute size of child cluster found
                  newsiz = newlst - newfst + 1
 
*                 NEWFTT is the place in Z where the new RRR or the computed
*                 eigenvector is to be stored
                  IF((dol.EQ.1).AND.(dou.EQ.m)) THEN
*                    Store representation at location of the leftmost evalue
*                    of the cluster
                     newftt = wbegin + newfst - 1
                  ELSE
                     IF(wbegin+newfst-1.LT.dol) THEN
*                       Store representation at the left end of Z array
                        newftt = dol - 1
                     ELSEIF(wbegin+newfst-1.GT.dou) THEN
*                       Store representation at the right end of Z array
                        newftt = dou
                     ELSE
                        newftt = wbegin + newfst - 1
                     ENDIF
                  ENDIF
 
                  IF( newsiz.GT.1) THEN
*
*                    Current child is not a singleton but a cluster.
*                    Compute and store new representation of child.
*
*
*                    Compute left and right cluster gap.
*
*                    LGAP and RGAP are not computed from WORK because
*                    the eigenvalue approximations may stem from RRRs
*                    different shifts. However, W hold all eigenvalues
*                    of the unshifted matrix. Still, the entries in WGAP
*                    have to be computed from WORK since the entries
*                    in W might be of the same order so that gaps are not
*                    exhibited correctly for very close eigenvalues.
                     IF( newfst.EQ.1 ) THEN
                        lgap = max( zero,
     $                       w(wbegin)-werr(wbegin) - vl )
                    ELSE
                        lgap = wgap( wbegin+newfst-2 )
                     ENDIF
                     rgap = wgap( wbegin+newlst-1 )
*
*                    Compute left- and rightmost eigenvalue of child
*                    to high precision in order to shift as close
*                    as possible and obtain as large relative gaps
*                    as possible
*
                     DO 55 k =1,2
                        IF(k.EQ.1) THEN
                           p = indexw( wbegin-1+newfst )
                        ELSE
                           p = indexw( wbegin-1+newlst )
                        ENDIF
                        offset = indexw( wbegin ) - 1
                        CALL dlarrb( in, d(ibegin),
     $                       work( indlld+ibegin-1 ),p,p,
     $                       rqtol, rqtol, offset,
     $                       work(wbegin),wgap(wbegin),
     $                       werr(wbegin),work( indwrk ),
     $                       iwork( iindwk ), pivmin, spdiam,
     $                       in, iinfo )
 55                  CONTINUE
*
                     IF((wbegin+newlst-1.LT.dol).OR.
     $                  (wbegin+newfst-1.GT.dou)) THEN
*                       if the cluster contains no desired eigenvalues
*                       skip the computation of that branch of the rep. tree
*
*                       We could skip before the refinement of the extremal
*                       eigenvalues of the child, but then the representation
*                       tree could be different from the one when nothing is
*                       skipped. For this reason we skip at this place.
                        idone = idone + newlst - newfst + 1
                        GOTO 139
                     ENDIF
*
*                    Compute RRR of child cluster.
*                    Note that the new RRR is stored in Z
*
*                    DLARRF needs LWORK = 2*N
                     CALL dlarrf( in, d( ibegin ), l( ibegin ),
     $                         work(indld+ibegin-1),
     $                         newfst, newlst, work(wbegin),
     $                         wgap(wbegin), werr(wbegin),
     $                         spdiam, lgap, rgap, pivmin, tau,
     $                         z(ibegin, newftt),z(ibegin, newftt+1),
     $                         work( indwrk ), iinfo )
                     IF( iinfo.EQ.0 ) THEN
*                       a new RRR for the cluster was found by DLARRF
*                       update shift and store it
                        ssigma = sigma + tau
                        z( iend, newftt+1 ) = ssigma
*                       WORK() are the midpoints and WERR() the semi-width
*                       Note that the entries in W are unchanged.
                        DO 116 k = newfst, newlst
                           fudge =
     $                          three*eps*abs(work(wbegin+k-1))
                           work( wbegin + k - 1 ) =
     $                          work( wbegin + k - 1) - tau
                           fudge = fudge +
     $                          four*eps*abs(work(wbegin+k-1))
*                          Fudge errors
                           werr( wbegin + k - 1 ) =
     $                          werr( wbegin + k - 1 ) + fudge
*                          Gaps are not fudged. Provided that WERR is small
*                          when eigenvalues are close, a zero gap indicates
*                          that a new representation is needed for resolving
*                          the cluster. A fudge could lead to a wrong decision
*                          of judging eigenvalues 'separated' which in
*                          reality are not. This could have a negative impact
*                          on the orthogonality of the computed eigenvectors.
 116                    CONTINUE
 
                        nclus = nclus + 1
                        k = newcls + 2*nclus
                        iwork( k-1 ) = newfst
                        iwork( k ) = newlst
                     ELSE
                        info = -2
                        RETURN
                     ENDIF
                  ELSE
*
*                    Compute eigenvector of singleton
*
                     iter = 0
*
                     tol = four * log(dble(in)) * eps
*
                     k = newfst
                     windex = wbegin + k - 1
                     windmn = max(windex - 1,1)
                     windpl = min(windex + 1,m)
                     lambda = work( windex )
                     done = done + 1
*                    Check if eigenvector computation is to be skipped
                     IF((windex.LT.dol).OR.
     $                  (windex.GT.dou)) THEN
                        eskip = .true.
                        GOTO 125
                     ELSE
                        eskip = .false.
                     ENDIF
                     left = work( windex ) - werr( windex )
                     right = work( windex ) + werr( windex )
                     indeig = indexw( windex )
*                    Note that since we compute the eigenpairs for a child,
*                    all eigenvalue approximations are w.r.t the same shift.
*                    In this case, the entries in WORK should be used for
*                    computing the gaps since they exhibit even very small
*                    differences in the eigenvalues, as opposed to the
*                    entries in W which might "look" the same.
 
                     IF( k .EQ. 1) THEN
*                       In the case RANGE='I' and with not much initial
*                       accuracy in LAMBDA and VL, the formula
*                       LGAP = MAX( ZERO, (SIGMA - VL) + LAMBDA )
*                       can lead to an overestimation of the left gap and
*                       thus to inadequately early RQI 'convergence'.
*                       Prevent this by forcing a small left gap.
                        lgap = eps*max(abs(left),abs(right))
                     ELSE
                        lgap = wgap(windmn)
                     ENDIF
                     IF( k .EQ. im) THEN
*                       In the case RANGE='I' and with not much initial
*                       accuracy in LAMBDA and VU, the formula
*                       can lead to an overestimation of the right gap and
*                       thus to inadequately early RQI 'convergence'.
*                       Prevent this by forcing a small right gap.
                        rgap = eps*max(abs(left),abs(right))
                     ELSE
                        rgap = wgap(windex)
                     ENDIF
                     gap = min( lgap, rgap )
                     IF(( k .EQ. 1).OR.(k .EQ. im)) THEN
*                       The eigenvector support can become wrong
*                       because significant entries could be cut off due to a
*                       large GAPTOL parameter in LAR1V. Prevent this.
                        gaptol = zero
                     ELSE
                        gaptol = gap * eps
                     ENDIF
                     isupmn = in
                     isupmx = 1
*                    Update WGAP so that it holds the minimum gap
*                    to the left or the right. This is crucial in the
*                    case where bisection is used to ensure that the
*                    eigenvalue is refined up to the required precision.
*                    The correct value is restored afterwards.
                     savgap = wgap(windex)
                     wgap(windex) = gap
*                    We want to use the Rayleigh Quotient Correction
*                    as often as possible since it converges quadratically
*                    when we are close enough to the desired eigenvalue.
*                    However, the Rayleigh Quotient can have the wrong sign
*                    and lead us away from the desired eigenvalue. In this
*                    case, the best we can do is to use bisection.
                     usedbs = .false.
                     usedrq = .false.
*                    Bisection is initially turned off unless it is forced
                     needbs =  .NOT.tryrqc
 120                 CONTINUE
*                    Check if bisection should be used to refine eigenvalue
                     IF(needbs) THEN
*                       Take the bisection as new iterate
                        usedbs = .true.
                        itmp1 = iwork( iindr+windex )
                        offset = indexw( wbegin ) - 1
                        CALL dlarrb( in, d(ibegin),
     $                       work(indlld+ibegin-1),indeig,indeig,
     $                       zero, two*eps, offset,
     $                       work(wbegin),wgap(wbegin),
     $                       werr(wbegin),work( indwrk ),
     $                       iwork( iindwk ), pivmin, spdiam,
     $                       itmp1, iinfo )
                        IF( iinfo.NE.0 ) THEN
                           info = -3
                           RETURN
                        ENDIF
                        lambda = work( windex )
*                       Reset twist index from inaccurate LAMBDA to
*                       force computation of true MINGMA
                        iwork( iindr+windex ) = 0
                     ENDIF
*                    Given LAMBDA, compute the eigenvector.
                     CALL dlar1v( in, 1, in, lambda, d( ibegin ),
     $                    l( ibegin ), work(indld+ibegin-1),
     $                    work(indlld+ibegin-1),
     $                    pivmin, gaptol, z( ibegin, windex ),
     $                    .NOT.usedbs, negcnt, ztz, mingma,
     $                    iwork( iindr+windex ), isuppz( 2*windex-1 ),
     $                    nrminv, resid, rqcorr, work( indwrk ) )
                     IF(iter .EQ. 0) THEN
                        bstres = resid
                        bstw = lambda
                     ELSEIF(resid.LT.bstres) THEN
                        bstres = resid
                        bstw = lambda
                     ENDIF
                     isupmn = min(isupmn,isuppz( 2*windex-1 ))
                     isupmx = max(isupmx,isuppz( 2*windex ))
                     iter = iter + 1
 
*                    sin alpha <= |resid|/gap
*                    Note that both the residual and the gap are
*                    proportional to the matrix, so ||T|| doesn't play
*                    a role in the quotient
 
*
*                    Convergence test for Rayleigh-Quotient iteration
*                    (omitted when Bisection has been used)
*
                     IF( resid.GT.tol*gap .AND. abs( rqcorr ).GT.
     $                    rqtol*abs( lambda ) .AND. .NOT. usedbs)
     $                    THEN
*                       We need to check that the RQCORR update doesn't
*                       move the eigenvalue away from the desired one and
*                       towards a neighbor. -> protection with bisection
                        IF(indeig.LE.negcnt) THEN
*                          The wanted eigenvalue lies to the left
                           sgndef = -one
                        ELSE
*                          The wanted eigenvalue lies to the right
                           sgndef = one
                        ENDIF
*                       We only use the RQCORR if it improves the
*                       the iterate reasonably.
                        IF( ( rqcorr*sgndef.GE.zero )
     $                       .AND.( lambda + rqcorr.LE. right)
     $                       .AND.( lambda + rqcorr.GE. left)
     $                       ) THEN
                           usedrq = .true.
*                          Store new midpoint of bisection interval in WORK
                           IF(sgndef.EQ.one) THEN
*                             The current LAMBDA is on the left of the true
*                             eigenvalue
                              left = lambda
*                             We prefer to assume that the error estimate
*                             is correct. We could make the interval not
*                             as a bracket but to be modified if the RQCORR
*                             chooses to. In this case, the RIGHT side should
*                             be modified as follows:
*                              RIGHT = MAX(RIGHT, LAMBDA + RQCORR)
                           ELSE
*                             The current LAMBDA is on the right of the true
*                             eigenvalue
                              right = lambda
*                             See comment about assuming the error estimate is
*                             correct above.
*                              LEFT = MIN(LEFT, LAMBDA + RQCORR)
                           ENDIF
                           work( windex ) =
     $                       half * (right + left)
*                          Take RQCORR since it has the correct sign and
*                          improves the iterate reasonably
                           lambda = lambda + rqcorr
*                          Update width of error interval
                           werr( windex ) =
     $                             half * (right-left)
                        ELSE
                           needbs = .true.
                        ENDIF
                        IF(right-left.LT.rqtol*abs(lambda)) THEN
*                             The eigenvalue is computed to bisection accuracy
*                             compute eigenvector and stop
                           usedbs = .true.
                           GOTO 120
                        ELSEIF( iter.LT.maxitr ) THEN
                           GOTO 120
                        ELSEIF( iter.EQ.maxitr ) THEN
                           needbs = .true.
                           GOTO 120
                        ELSE
                           info = 5
                           RETURN
                        END IF
                     ELSE
                        stp2ii = .false.
        IF(usedrq .AND. usedbs .AND.
     $                     bstres.LE.resid) THEN
                           lambda = bstw
                           stp2ii = .true.
                        ENDIF
                        IF (stp2ii) THEN
*                          improve error angle by second step
                           CALL dlar1v( in, 1, in, lambda,
     $                          d( ibegin ), l( ibegin ),
     $                          work(indld+ibegin-1),
     $                          work(indlld+ibegin-1),
     $                          pivmin, gaptol, z( ibegin, windex ),
     $                          .NOT.usedbs, negcnt, ztz, mingma,
     $                          iwork( iindr+windex ),
     $                          isuppz( 2*windex-1 ),
     $                          nrminv, resid, rqcorr, work( indwrk ) )
                        ENDIF
                        work( windex ) = lambda
                     END IF
*
*                    Compute FP-vector support w.r.t. whole matrix
*
                     isuppz( 2*windex-1 ) = isuppz( 2*windex-1 )+oldien
                     isuppz( 2*windex ) = isuppz( 2*windex )+oldien
                     zfrom = isuppz( 2*windex-1 )
                     zto = isuppz( 2*windex )
                     isupmn = isupmn + oldien
                     isupmx = isupmx + oldien
*                    Ensure vector is ok if support in the RQI has changed
                     IF(isupmn.LT.zfrom) THEN
                        DO 122 ii = isupmn,zfrom-1
                           z( ii, windex ) = zero
 122                    CONTINUE
                     ENDIF
                     IF(isupmx.GT.zto) THEN
                        DO 123 ii = zto+1,isupmx
                           z( ii, windex ) = zero
 123                    CONTINUE
                     ENDIF
                     CALL dscal( zto-zfrom+1, nrminv,
     $                       z( zfrom, windex ), 1 )
 125                 CONTINUE
*                    Update W
                     w( windex ) = lambda+sigma
*                    Recompute the gaps on the left and right
*                    But only allow them to become larger and not
*                    smaller (which can only happen through "bad"
*                    cancellation and doesn't reflect the theory
*                    where the initial gaps are underestimated due
*                    to WERR being too crude.)
                     IF(.NOT.eskip) THEN
                        IF( k.GT.1) THEN
                           wgap( windmn ) = max( wgap(windmn),
     $                          w(windex)-werr(windex)
     $                          - w(windmn)-werr(windmn) )
                        ENDIF
                        IF( windex.LT.wend ) THEN
                           wgap( windex ) = max( savgap,
     $                          w( windpl )-werr( windpl )
     $                          - w( windex )-werr( windex) )
                        ENDIF
                     ENDIF
                     idone = idone + 1
                  ENDIF
*                 here ends the code for the current child
*
 139              CONTINUE
*                 Proceed to any remaining child nodes
                  newfst = j + 1
 140           CONTINUE
 150        CONTINUE
            ndepth = ndepth + 1
            GO TO 40
         END IF
         ibegin = iend + 1
         wbegin = wend + 1
 170  CONTINUE
*
 
      RETURN
*
*     End of DLARRV
*

◆ dlartv()

subroutine dlartv	(	integer	n,
		double precision, dimension( * )	x,
		integer	incx,
		double precision, dimension( * )	y,
		integer	incy,
		double precision, dimension( * )	c,
		double precision, dimension( * )	s,
		integer	incc )

DLARTV applies a vector of plane rotations with real cosines and real sines to the elements of a pair of vectors.

Download DLARTV + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLARTV applies a vector of real plane rotations to elements of the
!> real vectors x and y. For i = 1,2,...,n
!>
!>    ( x(i) ) := (  c(i)  s(i) ) ( x(i) )
!>    ( y(i) )    ( -s(i)  c(i) ) ( y(i) )
!>

Parameters

[in]	N	!> N is INTEGER !> The number of plane rotations to be applied. !>
[in,out]	X	!> X is DOUBLE PRECISION array, !> dimension (1+(N-1)*INCX) !> The vector x. !>
[in]	INCX	!> INCX is INTEGER !> The increment between elements of X. INCX > 0. !>
[in,out]	Y	!> Y is DOUBLE PRECISION array, !> dimension (1+(N-1)*INCY) !> The vector y. !>
[in]	INCY	!> INCY is INTEGER !> The increment between elements of Y. INCY > 0. !>
[in]	C	!> C is DOUBLE PRECISION array, dimension (1+(N-1)*INCC) !> The cosines of the plane rotations. !>
[in]	S	!> S is DOUBLE PRECISION array, dimension (1+(N-1)*INCC) !> The sines of the plane rotations. !>
[in]	INCC	!> INCC is INTEGER !> The increment between elements of C and S. INCC > 0. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 107 of file dlartv.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Rotates N pairs ( x, y ) in place.  Pair number K is read from
*     X( 1+(K-1)*INCX ) and Y( 1+(K-1)*INCY ) and is combined with the
*     cosine and sine found at position 1+(K-1)*INCC of C and S.
*
*     .. Scalar Arguments ..
      INTEGER            INCC, INCX, INCY, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   C( * ), S( * ), X( * ), Y( * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            K, KC, KX, KY
      DOUBLE PRECISION   CK, SK, XK, YK
*     ..
*     .. Executable Statements ..
*
      DO k = 1, n
*        Locate the K-th rotation and the pair it acts on.
         kc = 1 + ( k-1 )*incc
         kx = 1 + ( k-1 )*incx
         ky = 1 + ( k-1 )*incy
*        Fetch all four inputs first: both results need the old x and y.
         ck = c( kc )
         sk = s( kc )
         xk = x( kx )
         yk = y( ky )
         x( kx ) = ck*xk + sk*yk
         y( ky ) = ck*yk - sk*xk
      END DO
      RETURN
*
*     End of DLARTV
*

◆ dlaswp()

subroutine dlaswp	(	integer	n,
		double precision, dimension( lda, * )	a,
		integer	lda,
		integer	k1,
		integer	k2,
		integer, dimension( * )	ipiv,
		integer	incx )

DLASWP performs a series of row interchanges on a general rectangular matrix.

Download DLASWP + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLASWP performs a series of row interchanges on the matrix A.
!> One row interchange is initiated for each of rows K1 through K2 of A.
!>

Parameters

[in]	N	!> N is INTEGER !> The number of columns of the matrix A. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> On entry, the matrix of column dimension N to which the row !> interchanges will be applied. !> On exit, the permuted matrix. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. !>
[in]	K1	!> K1 is INTEGER !> The first element of IPIV for which a row interchange will !> be done. !>
[in]	K2	!> K2 is INTEGER !> (K2-K1+1) is the number of elements of IPIV for which a row !> interchange will be done. !>
[in]	IPIV	!> IPIV is INTEGER array, dimension (K1+(K2-K1)*abs(INCX)) !> The vector of pivot indices. Only the elements in positions !> K1 through K1+(K2-K1)*abs(INCX) of IPIV are accessed. !> IPIV(K1+(K-K1)*abs(INCX)) = L implies rows K and L are to be !> interchanged. !>
[in]	INCX	!> INCX is INTEGER !> The increment between successive values of IPIV. If INCX !> is negative, the pivots are applied in reverse order. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  Modified by
!>   R. C. Whaley, Computer Science Dept., Univ. of Tenn., Knoxville, USA
!>

Definition at line 114 of file dlaswp.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Applies the row interchanges recorded in IPIV to columns 1..N
*     of A, working through the columns in strips of 32.
*
*     .. Scalar Arguments ..
      INTEGER            INCX, K1, K2, LDA, N
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * )
      DOUBLE PRECISION   A( LDA, * )
*     ..
*
* =====================================================================
*
*     .. Local Scalars ..
      INTEGER            COL, COL0, IROW, JROW, KP, KP0, NBLK,
     $                   RFIRST, RLAST, RSTEP
      DOUBLE PRECISION   SWP
*     ..
*     .. Executable Statements ..
*
*     INCX = 0 selects no pivots, so there is nothing to interchange.
*
      IF( incx.EQ.0 ) RETURN
*
*     Row I is exchanged with row IPIV( K1+( I-K1 )*abs( INCX ) ) for
*     I = K1..K2.  A negative INCX visits rows K2 down to K1 and reads
*     IPIV backwards, starting from position K1+( K1-K2 )*INCX.
*
      IF( incx.GT.0 ) THEN
         kp0 = k1
         rfirst = k1
         rlast = k2
         rstep = 1
      ELSE
         kp0 = k1 + ( k1-k2 )*incx
         rfirst = k2
         rlast = k1
         rstep = -1
      END IF
*
*     Full strips of 32 columns: every strip receives the complete
*     sequence of row swaps before the next strip is touched.  When
*     NBLK is not positive the outer loop runs zero times.
*
      nblk = ( n / 32 )*32
      DO col0 = 1, nblk, 32
         kp = kp0
         DO irow = rfirst, rlast, rstep
            jrow = ipiv( kp )
            IF( jrow.NE.irow ) THEN
               DO col = col0, col0 + 31
                  swp = a( irow, col )
                  a( irow, col ) = a( jrow, col )
                  a( jrow, col ) = swp
               END DO
            END IF
            kp = kp + incx
         END DO
      END DO
*
*     Remaining columns NBLK+1..N that do not fill a whole strip.
*
      IF( nblk.NE.n ) THEN
         kp = kp0
         DO irow = rfirst, rlast, rstep
            jrow = ipiv( kp )
            IF( jrow.NE.irow ) THEN
               DO col = nblk + 1, n
                  swp = a( irow, col )
                  a( irow, col ) = a( jrow, col )
                  a( jrow, col ) = swp
               END DO
            END IF
            kp = kp + incx
         END DO
      END IF
*
      RETURN
*
*     End of DLASWP
*

◆ dlat2s()

subroutine dlat2s	(	character	uplo,
		integer	n,
		double precision, dimension( lda, * )	a,
		integer	lda,
		real, dimension( ldsa, * )	sa,
		integer	ldsa,
		integer	info )

DLAT2S converts a double-precision triangular matrix to a single-precision triangular matrix.

Download DLAT2S + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAT2S converts a DOUBLE PRECISION triangular matrix, A, to a SINGLE
!> PRECISION triangular matrix, SA.
!>
!> RMAX is the overflow for the SINGLE PRECISION arithmetic
!> DLAT2S checks that all the entries of A are between -RMAX and
!> RMAX. If not the conversion is aborted and a flag is raised.
!>
!> This is an auxiliary routine so there is no argument checking.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> = 'U': A is upper triangular; !> = 'L': A is lower triangular. !>
[in]	N	!> N is INTEGER !> The number of rows and columns of the matrix A. N >= 0. !>
[in]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> On entry, the N-by-N triangular coefficient matrix A. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	SA	!> SA is REAL array, dimension (LDSA,N) !> Only the UPLO part of SA is referenced. On exit, if INFO=0, !> the N-by-N coefficient matrix SA; if INFO>0, the content of !> the UPLO part of SA is unspecified. !>
[in]	LDSA	!> LDSA is INTEGER !> The leading dimension of the array SA. LDSA >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit. !> = 1: an entry of the matrix A is greater than the SINGLE !> PRECISION overflow threshold; in this case, the content !> of the UPLO part of SA on exit is unspecified. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 110 of file dlat2s.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*     Copies the UPLO triangle of the DOUBLE PRECISION matrix A into
*     the REAL matrix SA.  Every entry is first compared against
*     +/- RMAX = SLAMCH( 'O' ); the first entry found outside that
*     range sets INFO = 1 and stops the copy, leaving the entries
*     already written to SA in place.  INFO = 0 is returned otherwise.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDA, LDSA, N
*     ..
*     .. Array Arguments ..
      REAL               SA( LDSA, * )
      DOUBLE PRECISION   A( LDA, * )
*     ..
*
*  =====================================================================
*
*     .. Local Scalars ..
      INTEGER            I, J
      DOUBLE PRECISION   RMAX
      LOGICAL            UPPER
*     ..
*     .. External Functions ..
      REAL               SLAMCH
      LOGICAL            LSAME
      EXTERNAL           slamch, lsame
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          real
*     ..
*     .. Executable Statements ..
*
*     INFO is an output: report success unless an entry is rejected
*     below.  Without this assignment a successful call would hand
*     back whatever value the caller happened to pass in.
*
      info = 0
      rmax = slamch( 'O' )
      upper = lsame( uplo, 'U' )
      IF( upper ) THEN
*
*        Upper triangle: rows 1..J of column J.
*
         DO 20 j = 1, n
            DO 10 i = 1, j
               IF( ( a( i, j ).LT.-rmax ) .OR. ( a( i, j ).GT.rmax ) )
     $             THEN
                  info = 1
                  GO TO 50
               END IF
*              Explicit narrowing from DOUBLE PRECISION to REAL.
               sa( i, j ) = real( a( i, j ) )
   10       CONTINUE
   20    CONTINUE
      ELSE
*
*        Any other UPLO: lower triangle, rows J..N of column J.
*
         DO 40 j = 1, n
            DO 30 i = j, n
               IF( ( a( i, j ).LT.-rmax ) .OR. ( a( i, j ).GT.rmax ) )
     $             THEN
                  info = 1
                  GO TO 50
               END IF
*              Explicit narrowing from DOUBLE PRECISION to REAL.
               sa( i, j ) = real( a( i, j ) )
   30       CONTINUE
   40    CONTINUE
      END IF
   50 CONTINUE
*
      RETURN
*
*     End of DLAT2S
*

◆ dlatbs()

subroutine dlatbs	(	character	uplo,
		character	trans,
		character	diag,
		character	normin,
		integer	n,
		integer	kd,
		double precision, dimension( ldab, * )	ab,
		integer	ldab,
		double precision, dimension( * )	x,
		double precision	scale,
		double precision, dimension( * )	cnorm,
		integer	info )

DLATBS solves a triangular banded system of equations.

Download DLATBS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLATBS solves one of the triangular systems
!>
!>    A *x = s*b  or  A**T*x = s*b
!>
!> with scaling to prevent overflow, where A is an upper or lower
!> triangular band matrix.  Here A**T denotes the transpose of A, x and b
!> are n-element vectors, and s is a scaling factor, usually less than
!> or equal to 1, chosen so that the components of x will be less than
!> the overflow threshold.  If the unscaled problem will not cause
!> overflow, the Level 2 BLAS routine DTBSV is called.  If the matrix A
!> is singular (A(j,j) = 0 for some j), then s is set to 0 and a
!> non-trivial solution to A*x = 0 is returned.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the matrix A is upper or lower triangular. !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> Specifies the operation applied to A. !> = 'N': Solve A * x = s*b (No transpose) !> = 'T': Solve A**T * x = s*b (Transpose) !> = 'C': Solve A**T * x = s*b (Conjugate transpose = Transpose) !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> Specifies whether or not the matrix A is unit triangular. !> = 'N': Non-unit triangular !> = 'U': Unit triangular !>
[in]	NORMIN	!> NORMIN is CHARACTER*1 !> Specifies whether CNORM has been set or not. !> = 'Y': CNORM contains the column norms on entry !> = 'N': CNORM is not set on entry. On exit, the norms will !> be computed and stored in CNORM. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	KD	!> KD is INTEGER !> The number of subdiagonals or superdiagonals in the !> triangular matrix A. KD >= 0. !>
[in]	AB	!> AB is DOUBLE PRECISION array, dimension (LDAB,N) !> The upper or lower triangular band matrix A, stored in the !> first KD+1 rows of the array. The j-th column of A is stored !> in the j-th column of the array AB as follows: !> if UPLO = 'U', AB(kd+1+i-j,j) = A(i,j) for max(1,j-kd)<=i<=j; !> if UPLO = 'L', AB(1+i-j,j) = A(i,j) for j<=i<=min(n,j+kd). !>
[in]	LDAB	!> LDAB is INTEGER !> The leading dimension of the array AB. LDAB >= KD+1. !>
[in,out]	X	!> X is DOUBLE PRECISION array, dimension (N) !> On entry, the right hand side b of the triangular system. !> On exit, X is overwritten by the solution vector x. !>
[out]	SCALE	!> SCALE is DOUBLE PRECISION !> The scaling factor s for the triangular system !> A * x = s*b or A**T * x = s*b. !> If SCALE = 0, the matrix A is singular or badly scaled, and !> the vector x is an exact or approximate solution to A*x = 0. !>
[in,out]	CNORM	!> CNORM is DOUBLE PRECISION array, dimension (N) !> !> If NORMIN = 'Y', CNORM is an input argument and CNORM(j) !> contains the norm of the off-diagonal part of the j-th column !> of A. If TRANS = 'N', CNORM(j) must be greater than or equal !> to the infinity-norm, and if TRANS = 'T' or 'C', CNORM(j) !> must be greater than or equal to the 1-norm. !> !> If NORMIN = 'N', CNORM is an output argument and CNORM(j) !> returns the 1-norm of the offdiagonal part of the j-th column !> of A. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -k, the k-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  A rough bound on x is computed; if that is less than overflow, DTBSV
!>  is called, otherwise, specific code is used which checks for possible
!>  overflow or divide-by-zero at every operation.
!>
!>  A columnwise scheme is used for solving A*x = b.  The basic algorithm
!>  if A is lower triangular is
!>
!>       x[1:n] := b[1:n]
!>       for j = 1, ..., n
!>            x(j) := x(j) / A(j,j)
!>            x[j+1:n] := x[j+1:n] - x(j) * A[j+1:n,j]
!>       end
!>
!>  Define bounds on the components of x after j iterations of the loop:
!>     M(j) = bound on x[1:j]
!>     G(j) = bound on x[j+1:n]
!>  Initially, let M(0) = 0 and G(0) = max{x(i), i=1,...,n}.
!>
!>  Then for iteration j+1 we have
!>     M(j+1) <= G(j) / | A(j+1,j+1) |
!>     G(j+1) <= G(j) + M(j+1) * | A[j+2:n,j+1] |
!>            <= G(j) ( 1 + CNORM(j+1) / | A(j+1,j+1) | )
!>
!>  where CNORM(j+1) is greater than or equal to the infinity-norm of
!>  column j+1 of A, not counting the diagonal.  Hence
!>
!>     G(j) <= G(0) product ( 1 + CNORM(i) / | A(i,i) | )
!>                  1<=i<=j
!>  and
!>
!>     |x(j)| <= ( G(0) / |A(j,j)| ) product ( 1 + CNORM(i) / |A(i,i)| )
!>                                   1<=i< j
!>
!>  Since |x(j)| <= M(j), we use the Level 2 BLAS routine DTBSV if the
!>  reciprocal of the largest M(j), j=1,..,n, is larger than
!>  max(underflow, 1/overflow).
!>
!>  The bound on x(j) is also used to determine when a step in the
!>  columnwise method can be performed without fear of overflow.  If
!>  the computed bound is greater than a large constant, x is scaled to
!>  prevent overflow, but if the bound overflows, x is set to 0, x(j) to
!>  1, and scale to 0, and a non-trivial solution to A*x = 0 is found.
!>
!>  Similarly, a row-wise scheme is used to solve A**T*x = b.  The basic
!>  algorithm for A upper triangular is
!>
!>       for j = 1, ..., n
!>            x(j) := ( b(j) - A[1:j-1,j]**T * x[1:j-1] ) / A(j,j)
!>       end
!>
!>  We simultaneously compute two bounds
!>       G(j) = bound on ( b(i) - A[1:i-1,i]**T * x[1:i-1] ), 1<=i<=j
!>       M(j) = bound on x(i), 1<=i<=j
!>
!>  The initial values are G(0) = 0, M(0) = max{b(i), i=1,..,n}, and we
!>  add the constraint G(j) >= G(j-1) and M(j) >= M(j-1) for j >= 1.
!>  Then the bound on x(j) is
!>
!>       M(j) <= M(j-1) * ( 1 + CNORM(j) ) / | A(j,j) |
!>
!>            <= M(0) * product ( ( 1 + CNORM(i) ) / |A(i,i)| )
!>                      1<=i<=j
!>
!>  and we can safely call DTBSV if 1/M(n) and 1/G(n) are both greater
!>  than max(underflow, 1/overflow).
!>

Definition at line 240 of file dlatbs.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of DLATBS: solves A*x = s*b or A**T*x = s*b for a triangular
*  band matrix held in AB, returning the scale factor s in SCALE.
*  Outline of the code below:
*    1. Validate the arguments; on an illegal value XERBLA is called
*       and the routine returns.  Return immediately if N = 0.
*    2. If NORMIN = 'N', fill CNORM with DASUM of the off-diagonal
*       part of each stored column.
*    3. If the largest CNORM entry exceeds BIGNUM, scale CNORM by
*       TSCAL = 1/(SMLNUM*TMAX); CNORM is scaled back by 1/TSCAL just
*       before returning.
*    4. Compute GROW, a reciprocal bound on the growth of x.  If
*       GROW*TSCAL > SMLNUM the plain DTBSV solve is used; otherwise
*       a Level 1 BLAS solve is run that rescales x (and SCALE)
*       whenever a division or update could overflow.
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, NORMIN, TRANS, UPLO
      INTEGER            INFO, KD, LDAB, N
      DOUBLE PRECISION   SCALE
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   AB( LDAB, * ), CNORM( * ), X( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, HALF, ONE
      parameter( zero = 0.0d+0, half = 0.5d+0, one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            NOTRAN, NOUNIT, UPPER
      INTEGER            I, IMAX, J, JFIRST, JINC, JLAST, JLEN, MAIND
      DOUBLE PRECISION   BIGNUM, GROW, REC, SMLNUM, SUMJ, TJJ, TJJS,
     $                   TMAX, TSCAL, USCAL, XBND, XJ, XMAX
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            IDAMAX
      DOUBLE PRECISION   DASUM, DDOT, DLAMCH
      EXTERNAL           lsame, idamax, dasum, ddot, dlamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           daxpy, dscal, dtbsv, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min
*     ..
*     .. Executable Statements ..
*
      info = 0
      upper = lsame( uplo, 'U' )
      notran = lsame( trans, 'N' )
      nounit = lsame( diag, 'N' )
*
*     Test the input parameters.
*     INFO = -k names the k-th argument; LDAB is the 8th argument
*     (AB, the 7th, is not checked), hence the jump from -6 to -8.
*
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'T' ) .AND. .NOT.
     $         lsame( trans, 'C' ) ) THEN
         info = -2
      ELSE IF( .NOT.nounit .AND. .NOT.lsame( diag, 'U' ) ) THEN
         info = -3
      ELSE IF( .NOT.lsame( normin, 'Y' ) .AND. .NOT.
     $         lsame( normin, 'N' ) ) THEN
         info = -4
      ELSE IF( n.LT.0 ) THEN
         info = -5
      ELSE IF( kd.LT.0 ) THEN
         info = -6
      ELSE IF( ldab.LT.kd+1 ) THEN
         info = -8
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DLATBS', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Determine machine dependent parameters to control overflow.
*
      smlnum = dlamch( 'Safe minimum' ) / dlamch( 'Precision' )
      bignum = one / smlnum
      scale = one
*
      IF( lsame( normin, 'N' ) ) THEN
*
*        Compute the 1-norm of each column, not including the diagonal.
*
         IF( upper ) THEN
*
*           A is upper triangular.
*           The diagonal sits in row KD+1 of AB, so the JLEN entries
*           above it start at row KD+1-JLEN.
*
            DO 10 j = 1, n
               jlen = min( kd, j-1 )
               cnorm( j ) = dasum( jlen, ab( kd+1-jlen, j ), 1 )
   10       CONTINUE
         ELSE
*
*           A is lower triangular.
*           The diagonal sits in row 1 of AB, so the off-diagonal
*           entries start at row 2.
*
            DO 20 j = 1, n
               jlen = min( kd, n-j )
               IF( jlen.GT.0 ) THEN
                  cnorm( j ) = dasum( jlen, ab( 2, j ), 1 )
               ELSE
                  cnorm( j ) = zero
               END IF
   20       CONTINUE
         END IF
      END IF
*
*     Scale the column norms by TSCAL if the maximum element in CNORM is
*     greater than BIGNUM.
*
      imax = idamax( n, cnorm, 1 )
      tmax = cnorm( imax )
      IF( tmax.LE.bignum ) THEN
         tscal = one
      ELSE
         tscal = one / ( smlnum*tmax )
         CALL dscal( n, tscal, cnorm, 1 )
      END IF
*
*     Compute a bound on the computed solution vector to see if the
*     Level 2 BLAS routine DTBSV can be used.
*
      j = idamax( n, x, 1 )
      xmax = abs( x( j ) )
      xbnd = xmax
      IF( notran ) THEN
*
*        Compute the growth in A * x = b.
*        JFIRST/JLAST/JINC give the order in which the columns are
*        processed; MAIND is the row of AB that holds the diagonal.
*
         IF( upper ) THEN
            jfirst = n
            jlast = 1
            jinc = -1
            maind = kd + 1
         ELSE
            jfirst = 1
            jlast = n
            jinc = 1
            maind = 1
         END IF
*
*        If CNORM had to be rescaled, skip the bound computation and
*        set GROW = 0 so that the careful solve below is selected.
*
         IF( tscal.NE.one ) THEN
            grow = zero
            GO TO 50
         END IF
*
         IF( nounit ) THEN
*
*           A is non-unit triangular.
*
*           Compute GROW = 1/G(j) and XBND = 1/M(j).
*           Initially, G(0) = max{x(i), i=1,...,n}.
*
            grow = one / max( xbnd, smlnum )
            xbnd = grow
            DO 30 j = jfirst, jlast, jinc
*
*              Exit the loop if the growth factor is too small.
*
               IF( grow.LE.smlnum )
     $            GO TO 50
*
*              M(j) = G(j-1) / abs(A(j,j))
*
               tjj = abs( ab( maind, j ) )
               xbnd = min( xbnd, min( one, tjj )*grow )
               IF( tjj+cnorm( j ).GE.smlnum ) THEN
*
*                 G(j) = G(j-1)*( 1 + CNORM(j) / abs(A(j,j)) )
*
                  grow = grow*( tjj / ( tjj+cnorm( j ) ) )
               ELSE
*
*                 G(j) could overflow, set GROW to 0.
*
                  grow = zero
               END IF
   30       CONTINUE
            grow = xbnd
         ELSE
*
*           A is unit triangular.
*
*           Compute GROW = 1/G(j), where G(0) = max{x(i), i=1,...,n}.
*
            grow = min( one, one / max( xbnd, smlnum ) )
            DO 40 j = jfirst, jlast, jinc
*
*              Exit the loop if the growth factor is too small.
*
               IF( grow.LE.smlnum )
     $            GO TO 50
*
*              G(j) = G(j-1)*( 1 + CNORM(j) )
*
               grow = grow*( one / ( one+cnorm( j ) ) )
   40       CONTINUE
         END IF
   50    CONTINUE
*
      ELSE
*
*        Compute the growth in A**T * x = b.
*        The traversal order is the reverse of the no-transpose case.
*
         IF( upper ) THEN
            jfirst = 1
            jlast = n
            jinc = 1
            maind = kd + 1
         ELSE
            jfirst = n
            jlast = 1
            jinc = -1
            maind = 1
         END IF
*
*        As above: a rescaled CNORM forces the careful solve.
*
         IF( tscal.NE.one ) THEN
            grow = zero
            GO TO 80
         END IF
*
         IF( nounit ) THEN
*
*           A is non-unit triangular.
*
*           Compute GROW = 1/G(j) and XBND = 1/M(j).
*           Initially, M(0) = max{x(i), i=1,...,n}.
*
            grow = one / max( xbnd, smlnum )
            xbnd = grow
            DO 60 j = jfirst, jlast, jinc
*
*              Exit the loop if the growth factor is too small.
*
               IF( grow.LE.smlnum )
     $            GO TO 80
*
*              G(j) = max( G(j-1), M(j-1)*( 1 + CNORM(j) ) )
*
               xj = one + cnorm( j )
               grow = min( grow, xbnd / xj )
*
*              M(j) = M(j-1)*( 1 + CNORM(j) ) / abs(A(j,j))
*
               tjj = abs( ab( maind, j ) )
               IF( xj.GT.tjj )
     $            xbnd = xbnd*( tjj / xj )
   60       CONTINUE
            grow = min( grow, xbnd )
         ELSE
*
*           A is unit triangular.
*
*           Compute GROW = 1/G(j), where G(0) = max{x(i), i=1,...,n}.
*
            grow = min( one, one / max( xbnd, smlnum ) )
            DO 70 j = jfirst, jlast, jinc
*
*              Exit the loop if the growth factor is too small.
*
               IF( grow.LE.smlnum )
     $            GO TO 80
*
*              G(j) = ( 1 + CNORM(j) )*G(j-1)
*
               xj = one + cnorm( j )
               grow = grow / xj
   70       CONTINUE
         END IF
   80    CONTINUE
      END IF
*
      IF( ( grow*tscal ).GT.smlnum ) THEN
*
*        Use the Level 2 BLAS solve if the reciprocal of the bound on
*        elements of X is not too small.
*
         CALL dtbsv( uplo, trans, diag, n, kd, ab, ldab, x, 1 )
      ELSE
*
*        Use a Level 1 BLAS solve, scaling intermediate results.
*
         IF( xmax.GT.bignum ) THEN
*
*           Scale X so that its components are less than or equal to
*           BIGNUM in absolute value.
*
            scale = bignum / xmax
            CALL dscal( n, scale, x, 1 )
            xmax = bignum
         END IF
*
         IF( notran ) THEN
*
*           Solve A * x = b
*
            DO 110 j = jfirst, jlast, jinc
*
*              Compute x(j) = b(j) / A(j,j), scaling x if necessary.
*
               xj = abs( x( j ) )
               IF( nounit ) THEN
                  tjjs = ab( maind, j )*tscal
               ELSE
*
*                 Unit diagonal: the divisor is TSCAL alone, and when
*                 TSCAL = 1 the division is skipped entirely.
*
                  tjjs = tscal
                  IF( tscal.EQ.one )
     $               GO TO 100
               END IF
               tjj = abs( tjjs )
               IF( tjj.GT.smlnum ) THEN
*
*                    abs(A(j,j)) > SMLNUM:
*
                  IF( tjj.LT.one ) THEN
                     IF( xj.GT.tjj*bignum ) THEN
*
*                          Scale x by 1/b(j).
*
                        rec = one / xj
                        CALL dscal( n, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                  END IF
                  x( j ) = x( j ) / tjjs
                  xj = abs( x( j ) )
               ELSE IF( tjj.GT.zero ) THEN
*
*                    0 < abs(A(j,j)) <= SMLNUM:
*
                  IF( xj.GT.tjj*bignum ) THEN
*
*                       Scale x by (1/abs(x(j)))*abs(A(j,j))*BIGNUM
*                       to avoid overflow when dividing by A(j,j).
*
                     rec = ( tjj*bignum ) / xj
                     IF( cnorm( j ).GT.one ) THEN
*
*                          Scale by 1/CNORM(j) to avoid overflow when
*                          multiplying x(j) times column j.
*
                        rec = rec / cnorm( j )
                     END IF
                     CALL dscal( n, rec, x, 1 )
                     scale = scale*rec
                     xmax = xmax*rec
                  END IF
                  x( j ) = x( j ) / tjjs
                  xj = abs( x( j ) )
               ELSE
*
*                    A(j,j) = 0:  Set x(1:n) = 0, x(j) = 1, and
*                    scale = 0, and compute a solution to A*x = 0.
*
                  DO 90 i = 1, n
                     x( i ) = zero
   90             CONTINUE
                  x( j ) = one
                  xj = one
                  scale = zero
                  xmax = zero
               END IF
  100          CONTINUE
*
*              Scale x if necessary to avoid overflow when adding a
*              multiple of column j of A.
*
               IF( xj.GT.one ) THEN
                  rec = one / xj
                  IF( cnorm( j ).GT.( bignum-xmax )*rec ) THEN
*
*                    Scale x by 1/(2*abs(x(j))).
*
                     rec = rec*half
                     CALL dscal( n, rec, x, 1 )
                     scale = scale*rec
                  END IF
               ELSE IF( xj*cnorm( j ).GT.( bignum-xmax ) ) THEN
*
*                 Scale x by 1/2.
*
                  CALL dscal( n, half, x, 1 )
                  scale = scale*half
               END IF
*
               IF( upper ) THEN
                  IF( j.GT.1 ) THEN
*
*                    Compute the update
*                       x(max(1,j-kd):j-1) := x(max(1,j-kd):j-1) -
*                                             x(j)* A(max(1,j-kd):j-1,j)
*
                     jlen = min( kd, j-1 )
                     CALL daxpy( jlen, -x( j )*tscal,
     $                           ab( kd+1-jlen, j ), 1, x( j-jlen ), 1 )
*
*                    XMAX now tracks the largest remaining right hand
*                    side entry, x(1:j-1).
*
                     i = idamax( j-1, x, 1 )
                     xmax = abs( x( i ) )
                  END IF
               ELSE IF( j.LT.n ) THEN
*
*                 Compute the update
*                    x(j+1:min(j+kd,n)) := x(j+1:min(j+kd,n)) -
*                                          x(j) * A(j+1:min(j+kd,n),j)
*
                  jlen = min( kd, n-j )
                  IF( jlen.GT.0 )
     $               CALL daxpy( jlen, -x( j )*tscal, ab( 2, j ), 1,
     $                           x( j+1 ), 1 )
*
*                 IDAMAX is relative to x(j+1), hence the offset J.
*
                  i = j + idamax( n-j, x( j+1 ), 1 )
                  xmax = abs( x( i ) )
               END IF
  110       CONTINUE
*
         ELSE
*
*           Solve A**T * x = b
*
            DO 160 j = jfirst, jlast, jinc
*
*              Compute x(j) = b(j) - sum A(k,j)*x(k).
*                                    k<>j
*
               xj = abs( x( j ) )
               uscal = tscal
               rec = one / max( xmax, one )
               IF( cnorm( j ).GT.( bignum-xj )*rec ) THEN
*
*                 If x(j) could overflow, scale x by 1/(2*XMAX).
*
                  rec = rec*half
                  IF( nounit ) THEN
                     tjjs = ab( maind, j )*tscal
                  ELSE
                     tjjs = tscal
                  END IF
                  tjj = abs( tjjs )
                  IF( tjj.GT.one ) THEN
*
*                       Divide by A(j,j) when scaling x if A(j,j) > 1.
*
                     rec = min( one, rec*tjj )
                     uscal = uscal / tjjs
                  END IF
                  IF( rec.LT.one ) THEN
                     CALL dscal( n, rec, x, 1 )
                     scale = scale*rec
                     xmax = xmax*rec
                  END IF
               END IF
*
               sumj = zero
               IF( uscal.EQ.one ) THEN
*
*                 If the scaling needed for A in the dot product is 1,
*                 call DDOT to perform the dot product.
*
                  IF( upper ) THEN
                     jlen = min( kd, j-1 )
                     sumj = ddot( jlen, ab( kd+1-jlen, j ), 1,
     $                      x( j-jlen ), 1 )
                  ELSE
                     jlen = min( kd, n-j )
                     IF( jlen.GT.0 )
     $                  sumj = ddot( jlen, ab( 2, j ), 1, x( j+1 ), 1 )
                  END IF
               ELSE
*
*                 Otherwise, use in-line code for the dot product.
*
                  IF( upper ) THEN
                     jlen = min( kd, j-1 )
                     DO 120 i = 1, jlen
                        sumj = sumj + ( ab( kd+i-jlen, j )*uscal )*
     $                         x( j-jlen-1+i )
  120                CONTINUE
                  ELSE
                     jlen = min( kd, n-j )
                     DO 130 i = 1, jlen
                        sumj = sumj + ( ab( i+1, j )*uscal )*x( j+i )
  130                CONTINUE
                  END IF
               END IF
*
*              USCAL still equals TSCAL unless it was divided by TJJS
*              in the overflow branch above.
*
               IF( uscal.EQ.tscal ) THEN
*
*                 Compute x(j) := ( x(j) - sumj ) / A(j,j) if 1/A(j,j)
*                 was not used to scale the dotproduct.
*
                  x( j ) = x( j ) - sumj
                  xj = abs( x( j ) )
                  IF( nounit ) THEN
*
*                    Compute x(j) = x(j) / A(j,j), scaling if necessary.
*
                     tjjs = ab( maind, j )*tscal
                  ELSE
                     tjjs = tscal
                     IF( tscal.EQ.one )
     $                  GO TO 150
                  END IF
                  tjj = abs( tjjs )
                  IF( tjj.GT.smlnum ) THEN
*
*                       abs(A(j,j)) > SMLNUM:
*
                     IF( tjj.LT.one ) THEN
                        IF( xj.GT.tjj*bignum ) THEN
*
*                             Scale X by 1/abs(x(j)).
*
                           rec = one / xj
                           CALL dscal( n, rec, x, 1 )
                           scale = scale*rec
                           xmax = xmax*rec
                        END IF
                     END IF
                     x( j ) = x( j ) / tjjs
                  ELSE IF( tjj.GT.zero ) THEN
*
*                       0 < abs(A(j,j)) <= SMLNUM:
*
                     IF( xj.GT.tjj*bignum ) THEN
*
*                          Scale x by (1/abs(x(j)))*abs(A(j,j))*BIGNUM.
*
                        rec = ( tjj*bignum ) / xj
                        CALL dscal( n, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                     x( j ) = x( j ) / tjjs
                  ELSE
*
*                       A(j,j) = 0:  Set x(1:n) = 0, x(j) = 1, and
*                       scale = 0, and compute a solution to A**T*x = 0.
*
                     DO 140 i = 1, n
                        x( i ) = zero
  140                CONTINUE
                     x( j ) = one
                     scale = zero
                     xmax = zero
                  END IF
  150             CONTINUE
               ELSE
*
*                 Compute x(j) := x(j) / A(j,j) - sumj if the dot
*                 product has already been divided by 1/A(j,j).
*
                  x( j ) = x( j ) / tjjs - sumj
               END IF
               xmax = max( xmax, abs( x( j ) ) )
  160       CONTINUE
         END IF
*
*        The careful solve multiplied the entries of A by TSCAL
*        (see TJJS and the DAXPY / dot-product multipliers), so
*        1/TSCAL is folded into the returned SCALE.
*
         scale = scale / tscal
      END IF
*
*     Scale the column norms by 1/TSCAL for return.
*
      IF( tscal.NE.one ) THEN
         CALL dscal( n, one / tscal, cnorm, 1 )
      END IF
*
      RETURN
*
*     End of DLATBS
*

◆ dlatdf()

subroutine dlatdf	(	integer	ijob,
		integer	n,
		double precision, dimension( ldz, * )	z,
		integer	ldz,
		double precision, dimension( * )	rhs,
		double precision	rdsum,
		double precision	rdscal,
		integer, dimension( * )	ipiv,
		integer, dimension( * )	jpiv )

DLATDF uses the LU factorization of the n-by-n matrix computed by DGETC2 and computes a contribution to the reciprocal Dif-estimate.

Download DLATDF + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLATDF uses the LU factorization of the n-by-n matrix Z computed by
!> DGETC2 and computes a contribution to the reciprocal Dif-estimate
!> by solving Z * x = b for x, and choosing the r.h.s. b such that
!> the norm of x is as large as possible. On entry RHS = b holds the
!> contribution from earlier solved sub-systems, and on return RHS = x.
!>
!> The factorization of Z returned by DGETC2 has the form Z = P*L*U*Q,
!> where P and Q are permutation matrices. L is lower triangular with
!> unit diagonal elements and U is upper triangular.
!>

Parameters

[in]	IJOB	!> IJOB is INTEGER !> IJOB = 2: First compute an approximative null-vector e !> of Z using DGECON, e is normalized and solve for !> Z*x = +-e - f with the sign giving the greater value !> of 2-norm(x). About 5 times as expensive as Default. !> IJOB .ne. 2: Local look ahead strategy where all entries of !> the r.h.s. b is chosen as either +1 or -1 (Default). !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix Z. !>
[in]	Z	!> Z is DOUBLE PRECISION array, dimension (LDZ, N) !> On entry, the LU part of the factorization of the n-by-n !> matrix Z computed by DGETC2: Z = P * L * U * Q !>
[in]	LDZ	!> LDZ is INTEGER !> The leading dimension of the array Z. LDZ >= max(1, N). !>
[in,out]	RHS	!> RHS is DOUBLE PRECISION array, dimension (N) !> On entry, RHS contains contributions from other subsystems. !> On exit, RHS contains the solution of the subsystem with !> entries according to the value of IJOB (see above). !>
[in,out]	RDSUM	!> RDSUM is DOUBLE PRECISION !> On entry, the sum of squares of computed contributions to !> the Dif-estimate under computation by DTGSYL, where the !> scaling factor RDSCAL (see below) has been factored out. !> On exit, the corresponding sum of squares updated with the !> contributions from the current sub-system. !> If TRANS = 'T' RDSUM is not touched. !> NOTE: RDSUM only makes sense when DTGSY2 is called by DTGSYL. !>
[in,out]	RDSCAL	!> RDSCAL is DOUBLE PRECISION !> On entry, scaling factor used to prevent overflow in RDSUM. !> On exit, RDSCAL is updated w.r.t. the current contributions !> in RDSUM. !> If TRANS = 'T', RDSCAL is not touched. !> NOTE: RDSCAL only makes sense when DTGSY2 is called by !> DTGSYL. !>
[in]	IPIV	!> IPIV is INTEGER array, dimension (N). !> The pivot indices; for 1 <= i <= N, row i of the !> matrix has been interchanged with row IPIV(i). !>
[in]	JPIV	!> JPIV is INTEGER array, dimension (N). !> The pivot indices; for 1 <= j <= N, column j of the !> matrix has been interchanged with column JPIV(j). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:: This routine is a further developed implementation of algorithm BSOLVE in [1] using complete pivoting in the LU factorization.

Contributors:: Bo Kagstrom and Peter Poromaa, Department of Computing Science, Umea University, S-901 87 Umea, Sweden.

References:

!>
!>
!>  [1] Bo Kagstrom and Lars Westin,
!>      Generalized Schur Methods with Condition Estimators for
!>      Solving the Generalized Sylvester Equation, IEEE Transactions
!>      on Automatic Control, Vol. 34, No. 7, July 1989, pp 745-751.
!>
!>  [2] Peter Poromaa,
!>      On Efficient and Robust Estimators for the Separation
!>      between two Regular Matrix Pairs with Applications in
!>      Condition Estimation. Report IMINF-95.05, Departement of
!>      Computing Science, Umea University, S-901 87 Umea, Sweden, 1995.
!>

Definition at line 169 of file dlatdf.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of DLATDF: given the LU factors of Z (with pivot vectors IPIV
*  and JPIV), overwrite RHS with a solution x of Z*x = b, where b is
*  built from the incoming RHS so as to make x large, and accumulate
*  the sum of squares of x into (RDSCAL, RDSUM) with DLASSQ.
*
*    IJOB .ne. 2 : look-ahead strategy; each entry of the incoming RHS
*                  is shifted by +1 or -1 during the forward solve
*                  with L, and both choices are carried through the
*                  back solve with U for the last entry.
*    IJOB  =  2  : an approximate null vector obtained from DGECON is
*                  normalized and both RHS + e and RHS - e are solved
*                  with DGESC2; the solution with the larger 1-norm
*                  is kept.
*
*  The work arrays XM, XP, WORK and IWORK are fixed-size locals, so
*  only 0 <= N <= MAXDIM can be handled.  An N outside that range is
*  reported through XERBLA as an illegal second argument instead of
*  indexing outside those arrays.
*
*     .. Scalar Arguments ..
      INTEGER            IJOB, LDZ, N
      DOUBLE PRECISION   RDSCAL, RDSUM
*     ..
*     .. Array Arguments ..
      INTEGER            IPIV( * ), JPIV( * )
      DOUBLE PRECISION   RHS( * ), Z( LDZ, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      INTEGER            MAXDIM
      parameter( maxdim = 8 )
      DOUBLE PRECISION   ZERO, ONE
      parameter( zero = 0.0d+0, one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            I, INFO, J, K
      DOUBLE PRECISION   BM, BP, PMONE, SMINU, SPLUS, TEMP
*     ..
*     .. Local Arrays ..
      INTEGER            IWORK( MAXDIM )
      DOUBLE PRECISION   WORK( 4*MAXDIM ), XM( MAXDIM ), XP( MAXDIM )
*     ..
*     .. External Subroutines ..
      EXTERNAL           daxpy, dcopy, dgecon, dgesc2, dlassq, dlaswp,
     $                   dscal, xerbla
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DASUM, DDOT
      EXTERNAL           dasum, ddot
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, sqrt
*     ..
*     .. Executable Statements ..
*
*     Test the order N.  The local arrays hold MAXDIM entries (WORK
*     holds 4*MAXDIM), so a larger N would overrun them, and a
*     negative N would index before their start.  N is argument 2.
*
      IF( n.LT.0 .OR. n.GT.maxdim ) THEN
         CALL xerbla( 'DLATDF', 2 )
         RETURN
      END IF
*
*     Quick return if possible.  Without it, N = 0 would reach the
*     references to XP( N ) and RHS( N ) below, i.e. element 0.
*
      IF( n.EQ.0 )
     $   RETURN
*
      IF( ijob.NE.2 ) THEN
*
*        Apply permutations IPIV to RHS
*
         CALL dlaswp( 1, rhs, ldz, 1, n-1, ipiv, 1 )
*
*        Solve for L-part choosing RHS either to +1 or -1.
*
         pmone = -one
*
         DO 10 j = 1, n - 1
            bp = rhs( j ) + one
            bm = rhs( j ) - one
            splus = one
*
*           Look-ahead for L-part RHS(1:N-1) = + or -1, SPLUS and
*           SMINU computed more efficiently than in BSOLVE [1].
*
            splus = splus + ddot( n-j, z( j+1, j ), 1, z( j+1, j ), 1 )
            sminu = ddot( n-j, z( j+1, j ), 1, rhs( j+1 ), 1 )
            splus = splus*rhs( j )
            IF( splus.GT.sminu ) THEN
               rhs( j ) = bp
            ELSE IF( sminu.GT.splus ) THEN
               rhs( j ) = bm
            ELSE
*
*              In this case the updating sums are equal and we can
*              choose RHS(J) +1 or -1. The first time this happens
*              we choose -1, thereafter +1. This is a simple way to
*              get good estimates of matrices like Byers well-known
*              example (see [1]). (Not done in BSOLVE.)
*
               rhs( j ) = rhs( j ) + pmone
               pmone = one
            END IF
*
*           Compute the remaining r.h.s.
*
            temp = -rhs( j )
            CALL daxpy( n-j, temp, z( j+1, j ), 1, rhs( j+1 ), 1 )
*
   10    CONTINUE
*
*        Solve for U-part, look-ahead for RHS(N) = +-1. This is not done
*        in BSOLVE and will hopefully give us a better estimate because
*        any ill-conditioning of the original matrix is transferred to U
*        and not to L. U(N, N) is an approximation to sigma_min(LU).
*
*        XP carries the "+1" candidate and RHS the "-1" candidate;
*        both are back-substituted together in loop 30.
*
         CALL dcopy( n-1, rhs, 1, xp, 1 )
         xp( n ) = rhs( n ) + one
         rhs( n ) = rhs( n ) - one
         splus = zero
         sminu = zero
         DO 30 i = n, 1, -1
            temp = one / z( i, i )
            xp( i ) = xp( i )*temp
            rhs( i ) = rhs( i )*temp
            DO 20 k = i + 1, n
               xp( i ) = xp( i ) - xp( k )*( z( i, k )*temp )
               rhs( i ) = rhs( i ) - rhs( k )*( z( i, k )*temp )
   20       CONTINUE
            splus = splus + abs( xp( i ) )
            sminu = sminu + abs( rhs( i ) )
   30    CONTINUE
*
*        Keep whichever candidate has the larger sum of absolute
*        values; RHS is kept on a tie.
*
         IF( splus.GT.sminu )
     $      CALL dcopy( n, xp, 1, rhs, 1 )
*
*        Apply the permutations JPIV to the computed solution (RHS)
*
         CALL dlaswp( 1, rhs, ldz, 1, n-1, jpiv, -1 )
*
*        Compute the sum of squares
*
         CALL dlassq( n, rhs, 1, rdscal, rdsum )
*
      ELSE
*
*        IJOB = 2, Compute approximate nullvector XM of Z
*        The vector is taken from WORK( N+1 : 2*N ) as left there by
*        DGECON; the condition estimate TEMP and the status INFO
*        returned by DGECON are not examined.
*
         CALL dgecon( 'I', n, z, ldz, one, temp, work, iwork, info )
         CALL dcopy( n, work( n+1 ), 1, xm, 1 )
*
*        Compute RHS
*        XM is normalized to unit 2-norm, then XP = RHS + XM and
*        RHS = RHS - XM are both solved with the LU factors.
*
         CALL dlaswp( 1, xm, ldz, 1, n-1, ipiv, -1 )
         temp = one / sqrt( ddot( n, xm, 1, xm, 1 ) )
         CALL dscal( n, temp, xm, 1 )
         CALL dcopy( n, xm, 1, xp, 1 )
         CALL daxpy( n, one, rhs, 1, xp, 1 )
         CALL daxpy( n, -one, xm, 1, rhs, 1 )
*
*        TEMP receives the last argument of DGESC2 and is not used
*        afterwards.
*
         CALL dgesc2( n, z, ldz, rhs, ipiv, jpiv, temp )
         CALL dgesc2( n, z, ldz, xp, ipiv, jpiv, temp )
         IF( dasum( n, xp, 1 ).GT.dasum( n, rhs, 1 ) )
     $      CALL dcopy( n, xp, 1, rhs, 1 )
*
*        Compute the sum of squares
*
         CALL dlassq( n, rhs, 1, rdscal, rdsum )
*
      END IF
*
      RETURN
*
*     End of DLATDF
*

◆ dlatps()

subroutine dlatps	(	character	uplo,
		character	trans,
		character	diag,
		character	normin,
		integer	n,
		double precision, dimension( * )	ap,
		double precision, dimension( * )	x,
		double precision	scale,
		double precision, dimension( * )	cnorm,
		integer	info )

DLATPS solves a triangular system of equations with the matrix held in packed storage.

Download DLATPS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLATPS solves one of the triangular systems
!>
!>    A *x = s*b  or  A**T*x = s*b
!>
!> with scaling to prevent overflow, where A is an upper or lower
!> triangular matrix stored in packed form.  Here A**T denotes the
!> transpose of A, x and b are n-element vectors, and s is a scaling
!> factor, usually less than or equal to 1, chosen so that the
!> components of x will be less than the overflow threshold.  If the
!> unscaled problem will not cause overflow, the Level 2 BLAS routine
!> DTPSV is called. If the matrix A is singular (A(j,j) = 0 for some j),
!> then s is set to 0 and a non-trivial solution to A*x = 0 is returned.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the matrix A is upper or lower triangular. !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> Specifies the operation applied to A. !> = 'N': Solve A * x = s*b (No transpose) !> = 'T': Solve A**T * x = s*b (Transpose) !> = 'C': Solve A**T * x = s*b (Conjugate transpose = Transpose) !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> Specifies whether or not the matrix A is unit triangular. !> = 'N': Non-unit triangular !> = 'U': Unit triangular !>
[in]	NORMIN	!> NORMIN is CHARACTER*1 !> Specifies whether CNORM has been set or not. !> = 'Y': CNORM contains the column norms on entry !> = 'N': CNORM is not set on entry. On exit, the norms will !> be computed and stored in CNORM. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	AP	!> AP is DOUBLE PRECISION array, dimension (N*(N+1)/2) !> The upper or lower triangular matrix A, packed columnwise in !> a linear array. The j-th column of A is stored in the array !> AP as follows: !> if UPLO = 'U', AP(i + (j-1)*j/2) = A(i,j) for 1<=i<=j; !> if UPLO = 'L', AP(i + (j-1)*(2n-j)/2) = A(i,j) for j<=i<=n. !>
[in,out]	X	!> X is DOUBLE PRECISION array, dimension (N) !> On entry, the right hand side b of the triangular system. !> On exit, X is overwritten by the solution vector x. !>
[out]	SCALE	!> SCALE is DOUBLE PRECISION !> The scaling factor s for the triangular system !> A * x = s*b or A**T * x = s*b. !> If SCALE = 0, the matrix A is singular or badly scaled, and !> the vector x is an exact or approximate solution to A*x = 0. !>
[in,out]	CNORM	!> CNORM is DOUBLE PRECISION array, dimension (N) !> !> If NORMIN = 'Y', CNORM is an input argument and CNORM(j) !> contains the norm of the off-diagonal part of the j-th column !> of A. If TRANS = 'N', CNORM(j) must be greater than or equal !> to the infinity-norm, and if TRANS = 'T' or 'C', CNORM(j) !> must be greater than or equal to the 1-norm. !> !> If NORMIN = 'N', CNORM is an output argument and CNORM(j) !> returns the 1-norm of the offdiagonal part of the j-th column !> of A. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -k, the k-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  A rough bound on x is computed; if that is less than overflow, DTPSV
!>  is called, otherwise, specific code is used which checks for possible
!>  overflow or divide-by-zero at every operation.
!>
!>  A columnwise scheme is used for solving A*x = b.  The basic algorithm
!>  if A is lower triangular is
!>
!>       x[1:n] := b[1:n]
!>       for j = 1, ..., n
!>            x(j) := x(j) / A(j,j)
!>            x[j+1:n] := x[j+1:n] - x(j) * A[j+1:n,j]
!>       end
!>
!>  Define bounds on the components of x after j iterations of the loop:
!>     M(j) = bound on x[1:j]
!>     G(j) = bound on x[j+1:n]
!>  Initially, let M(0) = 0 and G(0) = max{x(i), i=1,...,n}.
!>
!>  Then for iteration j+1 we have
!>     M(j+1) <= G(j) / | A(j+1,j+1) |
!>     G(j+1) <= G(j) + M(j+1) * | A[j+2:n,j+1] |
!>            <= G(j) ( 1 + CNORM(j+1) / | A(j+1,j+1) | )
!>
!>  where CNORM(j+1) is greater than or equal to the infinity-norm of
!>  column j+1 of A, not counting the diagonal.  Hence
!>
!>     G(j) <= G(0) product ( 1 + CNORM(i) / | A(i,i) | )
!>                  1<=i<=j
!>  and
!>
!>     |x(j)| <= ( G(0) / |A(j,j)| ) product ( 1 + CNORM(i) / |A(i,i)| )
!>                                   1<=i< j
!>
!>  Since |x(j)| <= M(j), we use the Level 2 BLAS routine DTPSV if the
!>  reciprocal of the largest M(j), j=1,..,n, is larger than
!>  max(underflow, 1/overflow).
!>
!>  The bound on x(j) is also used to determine when a step in the
!>  columnwise method can be performed without fear of overflow.  If
!>  the computed bound is greater than a large constant, x is scaled to
!>  prevent overflow, but if the bound overflows, x is set to 0, x(j) to
!>  1, and scale to 0, and a non-trivial solution to A*x = 0 is found.
!>
!>  Similarly, a row-wise scheme is used to solve A**T*x = b.  The basic
!>  algorithm for A upper triangular is
!>
!>       for j = 1, ..., n
!>            x(j) := ( b(j) - A[1:j-1,j]**T * x[1:j-1] ) / A(j,j)
!>       end
!>
!>  We simultaneously compute two bounds
!>       G(j) = bound on ( b(i) - A[1:i-1,i]**T * x[1:i-1] ), 1<=i<=j
!>       M(j) = bound on x(i), 1<=i<=j
!>
!>  The initial values are G(0) = 0, M(0) = max{b(i), i=1,..,n}, and we
!>  add the constraint G(j) >= G(j-1) and M(j) >= M(j-1) for j >= 1.
!>  Then the bound on x(j) is
!>
!>       M(j) <= M(j-1) * ( 1 + CNORM(j) ) / | A(j,j) |
!>
!>            <= M(0) * product ( ( 1 + CNORM(i) ) / |A(i,i)| )
!>                      1<=i<=j
!>
!>  and we can safely call DTPSV if 1/M(n) and 1/G(n) are both greater
!>  than max(underflow, 1/overflow).
!>

Definition at line 227 of file dlatps.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of DLATPS: solves A*x = s*b or A**T*x = s*b for a triangular
*  matrix A held in packed storage (AP), accumulating the scale
*  factor s in SCALE while the right hand side in X is overwritten
*  by the solution.
*
*  Outline of the code below:
*    1. Validate UPLO, TRANS, DIAG, NORMIN and N; on a bad argument
*       set INFO = -k, call XERBLA and return.
*    2. If NORMIN = 'N', fill CNORM with the 1-norm of the
*       off-diagonal part of each packed column.
*    3. If the largest CNORM entry exceeds BIGNUM, scale CNORM by
*       TSCAL.
*    4. Compute GROW, a reciprocal bound on the growth of the solve.
*    5. If GROW*TSCAL > SMLNUM call DTPSV; otherwise run the guarded
*       Level 1 BLAS solve, which rescales X (and updates SCALE)
*       before any step that could overflow.
*    6. Undo the TSCAL scaling of CNORM before returning.
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, NORMIN, TRANS, UPLO
      INTEGER            INFO, N
      DOUBLE PRECISION   SCALE
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   AP( * ), CNORM( * ), X( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, HALF, ONE
      parameter( zero = 0.0d+0, half = 0.5d+0, one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            NOTRAN, NOUNIT, UPPER
      INTEGER            I, IMAX, IP, J, JFIRST, JINC, JLAST, JLEN
      DOUBLE PRECISION   BIGNUM, GROW, REC, SMLNUM, SUMJ, TJJ, TJJS,
     $                   TMAX, TSCAL, USCAL, XBND, XJ, XMAX
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            IDAMAX
      DOUBLE PRECISION   DASUM, DDOT, DLAMCH
      EXTERNAL           lsame, idamax, dasum, ddot, dlamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           daxpy, dscal, dtpsv, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min
*     ..
*     .. Executable Statements ..
*
      info = 0
      upper = lsame( uplo, 'U' )
      notran = lsame( trans, 'N' )
      nounit = lsame( diag, 'N' )
*
*     Test the input parameters.
*     The INFO value is minus the position of the first bad argument.
*
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'T' ) .AND. .NOT.
     $         lsame( trans, 'C' ) ) THEN
         info = -2
      ELSE IF( .NOT.nounit .AND. .NOT.lsame( diag, 'U' ) ) THEN
         info = -3
      ELSE IF( .NOT.lsame( normin, 'Y' ) .AND. .NOT.
     $         lsame( normin, 'N' ) ) THEN
         info = -4
      ELSE IF( n.LT.0 ) THEN
         info = -5
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DLATPS', -info )
         RETURN
      END IF
*
*     Quick return if possible
*     (SCALE and CNORM are left untouched when N = 0.)
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Determine machine dependent parameters to control overflow.
*
      smlnum = dlamch( 'Safe minimum' ) / dlamch( 'Precision' )
      bignum = one / smlnum
      scale = one
*
      IF( lsame( normin, 'N' ) ) THEN
*
*        Compute the 1-norm of each column, not including the diagonal.
*
         IF( upper ) THEN
*
*           A is upper triangular.
*           IP is the position in AP of the first entry of column j;
*           the j-1 entries above the diagonal are summed.
*
            ip = 1
            DO 10 j = 1, n
               cnorm( j ) = dasum( j-1, ap( ip ), 1 )
               ip = ip + j
   10       CONTINUE
         ELSE
*
*           A is lower triangular.
*           IP is the position in AP of the diagonal entry of column
*           j; the n-j entries below it are summed.
*
            ip = 1
            DO 20 j = 1, n - 1
               cnorm( j ) = dasum( n-j, ap( ip+1 ), 1 )
               ip = ip + n - j + 1
   20       CONTINUE
            cnorm( n ) = zero
         END IF
      END IF
*
*     Scale the column norms by TSCAL if the maximum element in CNORM is
*     greater than BIGNUM.
*     With TSCAL = 1/(SMLNUM*TMAX) the largest scaled norm becomes
*     1/SMLNUM = BIGNUM.
*
      imax = idamax( n, cnorm, 1 )
      tmax = cnorm( imax )
      IF( tmax.LE.bignum ) THEN
         tscal = one
      ELSE
         tscal = one / ( smlnum*tmax )
         CALL dscal( n, tscal, cnorm, 1 )
      END IF
*
*     Compute a bound on the computed solution vector to see if the
*     Level 2 BLAS routine DTPSV can be used.
*
      j = idamax( n, x, 1 )
      xmax = abs( x( j ) )
      xbnd = xmax
      IF( notran ) THEN
*
*        Compute the growth in A * x = b.
*        JFIRST, JLAST and JINC give the order in which the columns
*        are visited: n down to 1 for upper, 1 up to n for lower.
*
         IF( upper ) THEN
            jfirst = n
            jlast = 1
            jinc = -1
         ELSE
            jfirst = 1
            jlast = n
            jinc = 1
         END IF
*
*        If CNORM was rescaled the bound is not computed; GROW = 0
*        makes the test GROW*TSCAL > SMLNUM below fail, so the guarded
*        solve is used.
*
         IF( tscal.NE.one ) THEN
            grow = zero
            GO TO 50
         END IF
*
         IF( nounit ) THEN
*
*           A is non-unit triangular.
*
*           Compute GROW = 1/G(j) and XBND = 1/M(j).
*           Initially, G(0) = max{x(i), i=1,...,n}.
*
*           IP starts at the position in AP of the diagonal entry
*           A(jfirst,jfirst) and is stepped from diagonal to diagonal.
*
            grow = one / max( xbnd, smlnum )
            xbnd = grow
            ip = jfirst*( jfirst+1 ) / 2
            jlen = n
            DO 30 j = jfirst, jlast, jinc
*
*              Exit the loop if the growth factor is too small.
*
               IF( grow.LE.smlnum )
     $            GO TO 50
*
*              M(j) = G(j-1) / abs(A(j,j))
*
               tjj = abs( ap( ip ) )
               xbnd = min( xbnd, min( one, tjj )*grow )
               IF( tjj+cnorm( j ).GE.smlnum ) THEN
*
*                 G(j) = G(j-1)*( 1 + CNORM(j) / abs(A(j,j)) )
*
                  grow = grow*( tjj / ( tjj+cnorm( j ) ) )
               ELSE
*
*                 G(j) could overflow, set GROW to 0.
*
                  grow = zero
               END IF
               ip = ip + jinc*jlen
               jlen = jlen - 1
   30       CONTINUE
            grow = xbnd
         ELSE
*
*           A is unit triangular.
*
*           Compute GROW = 1/G(j), where G(0) = max{x(i), i=1,...,n}.
*
            grow = min( one, one / max( xbnd, smlnum ) )
            DO 40 j = jfirst, jlast, jinc
*
*              Exit the loop if the growth factor is too small.
*
               IF( grow.LE.smlnum )
     $            GO TO 50
*
*              G(j) = G(j-1)*( 1 + CNORM(j) )
*
               grow = grow*( one / ( one+cnorm( j ) ) )
   40       CONTINUE
         END IF
   50    CONTINUE
*
      ELSE
*
*        Compute the growth in A**T * x = b.
*        The visiting order is the reverse of the no-transpose case:
*        1 up to n for upper, n down to 1 for lower.
*
         IF( upper ) THEN
            jfirst = 1
            jlast = n
            jinc = 1
         ELSE
            jfirst = n
            jlast = 1
            jinc = -1
         END IF
*
*        As above, GROW = 0 selects the guarded solve when CNORM was
*        rescaled.
*
         IF( tscal.NE.one ) THEN
            grow = zero
            GO TO 80
         END IF
*
         IF( nounit ) THEN
*
*           A is non-unit triangular.
*
*           Compute GROW = 1/G(j) and XBND = 1/M(j).
*           Initially, M(0) = max{x(i), i=1,...,n}.
*
            grow = one / max( xbnd, smlnum )
            xbnd = grow
            ip = jfirst*( jfirst+1 ) / 2
            jlen = 1
            DO 60 j = jfirst, jlast, jinc
*
*              Exit the loop if the growth factor is too small.
*
               IF( grow.LE.smlnum )
     $            GO TO 80
*
*              G(j) = max( G(j-1), M(j-1)*( 1 + CNORM(j) ) )
*
               xj = one + cnorm( j )
               grow = min( grow, xbnd / xj )
*
*              M(j) = M(j-1)*( 1 + CNORM(j) ) / abs(A(j,j))
*
               tjj = abs( ap( ip ) )
               IF( xj.GT.tjj )
     $            xbnd = xbnd*( tjj / xj )
*
*              Step IP to the diagonal entry of the next column
*              visited.
*
               jlen = jlen + 1
               ip = ip + jinc*jlen
   60       CONTINUE
            grow = min( grow, xbnd )
         ELSE
*
*           A is unit triangular.
*
*           Compute GROW = 1/G(j), where G(0) = max{x(i), i=1,...,n}.
*
            grow = min( one, one / max( xbnd, smlnum ) )
            DO 70 j = jfirst, jlast, jinc
*
*              Exit the loop if the growth factor is too small.
*
               IF( grow.LE.smlnum )
     $            GO TO 80
*
*              G(j) = ( 1 + CNORM(j) )*G(j-1)
*
               xj = one + cnorm( j )
               grow = grow / xj
   70       CONTINUE
         END IF
   80    CONTINUE
      END IF
*
      IF( ( grow*tscal ).GT.smlnum ) THEN
*
*        Use the Level 2 BLAS solve if the reciprocal of the bound on
*        elements of X is not too small.
*
         CALL dtpsv( uplo, trans, diag, n, ap, x, 1 )
      ELSE
*
*        Use a Level 1 BLAS solve, scaling intermediate results.
*
         IF( xmax.GT.bignum ) THEN
*
*           Scale X so that its components are less than or equal to
*           BIGNUM in absolute value.
*
            scale = bignum / xmax
            CALL dscal( n, scale, x, 1 )
            xmax = bignum
         END IF
*
         IF( notran ) THEN
*
*           Solve A * x = b
*
*           IP is the position in AP of the diagonal entry of the
*           current column j.
*
            ip = jfirst*( jfirst+1 ) / 2
            DO 110 j = jfirst, jlast, jinc
*
*              Compute x(j) = b(j) / A(j,j), scaling x if necessary.
*
               xj = abs( x( j ) )
               IF( nounit ) THEN
                  tjjs = ap( ip )*tscal
               ELSE
*
*                 Unit diagonal: the divisor is TSCAL, and when that
*                 is 1 the division is skipped altogether.
*
                  tjjs = tscal
                  IF( tscal.EQ.one )
     $               GO TO 100
               END IF
               tjj = abs( tjjs )
               IF( tjj.GT.smlnum ) THEN
*
*                    abs(A(j,j)) > SMLNUM:
*
                  IF( tjj.LT.one ) THEN
                     IF( xj.GT.tjj*bignum ) THEN
*
*                          Scale x by 1/b(j).
*
                        rec = one / xj
                        CALL dscal( n, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                  END IF
                  x( j ) = x( j ) / tjjs
                  xj = abs( x( j ) )
               ELSE IF( tjj.GT.zero ) THEN
*
*                    0 < abs(A(j,j)) <= SMLNUM:
*
                  IF( xj.GT.tjj*bignum ) THEN
*
*                       Scale x by (1/abs(x(j)))*abs(A(j,j))*BIGNUM
*                       to avoid overflow when dividing by A(j,j).
*
                     rec = ( tjj*bignum ) / xj
                     IF( cnorm( j ).GT.one ) THEN
*
*                          Scale by 1/CNORM(j) to avoid overflow when
*                          multiplying x(j) times column j.
*
                        rec = rec / cnorm( j )
                     END IF
                     CALL dscal( n, rec, x, 1 )
                     scale = scale*rec
                     xmax = xmax*rec
                  END IF
                  x( j ) = x( j ) / tjjs
                  xj = abs( x( j ) )
               ELSE
*
*                    A(j,j) = 0:  Set x(1:n) = 0, x(j) = 1, and
*                    scale = 0, and compute a solution to A*x = 0.
*
                  DO 90 i = 1, n
                     x( i ) = zero
   90             CONTINUE
                  x( j ) = one
                  xj = one
                  scale = zero
                  xmax = zero
               END IF
  100          CONTINUE
*
*              Scale x if necessary to avoid overflow when adding a
*              multiple of column j of A.
*
               IF( xj.GT.one ) THEN
                  rec = one / xj
                  IF( cnorm( j ).GT.( bignum-xmax )*rec ) THEN
*
*                    Scale x by 1/(2*abs(x(j))).
*
                     rec = rec*half
                     CALL dscal( n, rec, x, 1 )
                     scale = scale*rec
                  END IF
               ELSE IF( xj*cnorm( j ).GT.( bignum-xmax ) ) THEN
*
*                 Scale x by 1/2.
*
                  CALL dscal( n, half, x, 1 )
                  scale = scale*half
               END IF
*
               IF( upper ) THEN
                  IF( j.GT.1 ) THEN
*
*                    Compute the update
*                       x(1:j-1) := x(1:j-1) - x(j) * A(1:j-1,j)
*
*                    AP( IP-J+1 ) is the first entry of column j.
*                    XMAX is refreshed from the entries still to be
*                    solved for.
*
                     CALL daxpy( j-1, -x( j )*tscal, ap( ip-j+1 ), 1, x,
     $                           1 )
                     i = idamax( j-1, x, 1 )
                     xmax = abs( x( i ) )
                  END IF
*
*                 Move IP to the diagonal entry of column j-1.
*
                  ip = ip - j
               ELSE
                  IF( j.LT.n ) THEN
*
*                    Compute the update
*                       x(j+1:n) := x(j+1:n) - x(j) * A(j+1:n,j)
*
*                    AP( IP+1 ) is the first entry below the diagonal
*                    of column j.
*
                     CALL daxpy( n-j, -x( j )*tscal, ap( ip+1 ), 1,
     $                           x( j+1 ), 1 )
                     i = j + idamax( n-j, x( j+1 ), 1 )
                     xmax = abs( x( i ) )
                  END IF
*
*                 Move IP to the diagonal entry of column j+1.
*
                  ip = ip + n - j + 1
               END IF
  110       CONTINUE
*
         ELSE
*
*           Solve A**T * x = b
*
            ip = jfirst*( jfirst+1 ) / 2
            jlen = 1
            DO 160 j = jfirst, jlast, jinc
*
*              Compute x(j) = b(j) - sum A(k,j)*x(k).
*                                    k<>j
*
*              USCAL is the factor applied to the entries of A in the
*              dot product; it starts as TSCAL and is divided by
*              A(j,j) below when that division is folded into the
*              dot product.
*
               xj = abs( x( j ) )
               uscal = tscal
               rec = one / max( xmax, one )
               IF( cnorm( j ).GT.( bignum-xj )*rec ) THEN
*
*                 If x(j) could overflow, scale x by 1/(2*XMAX).
*
                  rec = rec*half
                  IF( nounit ) THEN
                     tjjs = ap( ip )*tscal
                  ELSE
                     tjjs = tscal
                  END IF
                  tjj = abs( tjjs )
                  IF( tjj.GT.one ) THEN
*
*                       Divide by A(j,j) when scaling x if A(j,j) > 1.
*
                     rec = min( one, rec*tjj )
                     uscal = uscal / tjjs
                  END IF
                  IF( rec.LT.one ) THEN
                     CALL dscal( n, rec, x, 1 )
                     scale = scale*rec
                     xmax = xmax*rec
                  END IF
               END IF
*
               sumj = zero
               IF( uscal.EQ.one ) THEN
*
*                 If the scaling needed for A in the dot product is 1,
*                 call DDOT to perform the dot product.
*
                  IF( upper ) THEN
                     sumj = ddot( j-1, ap( ip-j+1 ), 1, x, 1 )
                  ELSE IF( j.LT.n ) THEN
                     sumj = ddot( n-j, ap( ip+1 ), 1, x( j+1 ), 1 )
                  END IF
               ELSE
*
*                 Otherwise, use in-line code for the dot product.
*
                  IF( upper ) THEN
                     DO 120 i = 1, j - 1
                        sumj = sumj + ( ap( ip-j+i )*uscal )*x( i )
  120                CONTINUE
                  ELSE IF( j.LT.n ) THEN
                     DO 130 i = 1, n - j
                        sumj = sumj + ( ap( ip+i )*uscal )*x( j+i )
  130                CONTINUE
                  END IF
               END IF
*
               IF( uscal.EQ.tscal ) THEN
*
*                 Compute x(j) := ( x(j) - sumj ) / A(j,j) if 1/A(j,j)
*                 was not used to scale the dotproduct.
*
                  x( j ) = x( j ) - sumj
                  xj = abs( x( j ) )
                  IF( nounit ) THEN
*
*                    Compute x(j) = x(j) / A(j,j), scaling if necessary.
*
                     tjjs = ap( ip )*tscal
                  ELSE
*
*                    Unit diagonal: skip the division when TSCAL = 1.
*
                     tjjs = tscal
                     IF( tscal.EQ.one )
     $                  GO TO 150
                  END IF
                  tjj = abs( tjjs )
                  IF( tjj.GT.smlnum ) THEN
*
*                       abs(A(j,j)) > SMLNUM:
*
                     IF( tjj.LT.one ) THEN
                        IF( xj.GT.tjj*bignum ) THEN
*
*                             Scale X by 1/abs(x(j)).
*
                           rec = one / xj
                           CALL dscal( n, rec, x, 1 )
                           scale = scale*rec
                           xmax = xmax*rec
                        END IF
                     END IF
                     x( j ) = x( j ) / tjjs
                  ELSE IF( tjj.GT.zero ) THEN
*
*                       0 < abs(A(j,j)) <= SMLNUM:
*
                     IF( xj.GT.tjj*bignum ) THEN
*
*                          Scale x by (1/abs(x(j)))*abs(A(j,j))*BIGNUM.
*
                        rec = ( tjj*bignum ) / xj
                        CALL dscal( n, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                     x( j ) = x( j ) / tjjs
                  ELSE
*
*                       A(j,j) = 0:  Set x(1:n) = 0, x(j) = 1, and
*                       scale = 0, and compute a solution to A**T*x = 0.
*
                     DO 140 i = 1, n
                        x( i ) = zero
  140                CONTINUE
                     x( j ) = one
                     scale = zero
                     xmax = zero
                  END IF
  150             CONTINUE
               ELSE
*
*                 Compute x(j) := x(j) / A(j,j)  - sumj if the dot
*                 product has already been divided by 1/A(j,j).
*
*                 TJJS here is the value set in the overflow-scaling
*                 branch above, the only place USCAL is changed.
*
                  x( j ) = x( j ) / tjjs - sumj
               END IF
               xmax = max( xmax, abs( x( j ) ) )
*
*              Step IP to the diagonal entry of the next column
*              visited.
*
               jlen = jlen + 1
               ip = ip + jinc*jlen
  160       CONTINUE
         END IF
*
*        Divide the accumulated scale factor by TSCAL (TSCAL = 1
*        unless CNORM was rescaled above).
*
         scale = scale / tscal
      END IF
*
*     Scale the column norms by 1/TSCAL for return.
*
      IF( tscal.NE.one ) THEN
         CALL dscal( n, one / tscal, cnorm, 1 )
      END IF
*
      RETURN
*
*     End of DLATPS
*

◆ dlatrd()

subroutine dlatrd	(	character	uplo,
		integer	n,
		integer	nb,
		double precision, dimension( lda, * )	a,
		integer	lda,
		double precision, dimension( * )	e,
		double precision, dimension( * )	tau,
		double precision, dimension( ldw, * )	w,
		integer	ldw )

DLATRD reduces the first nb rows and columns of a symmetric/Hermitian matrix A to real tridiagonal form by an orthogonal similarity transformation.

Download DLATRD + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLATRD reduces NB rows and columns of a real symmetric matrix A to
!> symmetric tridiagonal form by an orthogonal similarity
!> transformation Q**T * A * Q, and returns the matrices V and W which are
!> needed to apply the transformation to the unreduced part of A.
!>
!> If UPLO = 'U', DLATRD reduces the last NB rows and columns of a
!> matrix, of which the upper triangle is supplied;
!> if UPLO = 'L', DLATRD reduces the first NB rows and columns of a
!> matrix, of which the lower triangle is supplied.
!>
!> This is an auxiliary routine called by DSYTRD.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the upper or lower triangular part of the !> symmetric matrix A is stored: !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	N	!> N is INTEGER !> The order of the matrix A. !>
[in]	NB	!> NB is INTEGER !> The number of rows and columns to be reduced. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> On entry, the symmetric matrix A. If UPLO = 'U', the leading !> n-by-n upper triangular part of A contains the upper !> triangular part of the matrix A, and the strictly lower !> triangular part of A is not referenced. If UPLO = 'L', the !> leading n-by-n lower triangular part of A contains the lower !> triangular part of the matrix A, and the strictly upper !> triangular part of A is not referenced. !> On exit: !> if UPLO = 'U', the last NB columns have been reduced to !> tridiagonal form, with the diagonal elements overwriting !> the diagonal elements of A; the elements above the diagonal !> with the array TAU, represent the orthogonal matrix Q as a !> product of elementary reflectors; !> if UPLO = 'L', the first NB columns have been reduced to !> tridiagonal form, with the diagonal elements overwriting !> the diagonal elements of A; the elements below the diagonal !> with the array TAU, represent the orthogonal matrix Q as a !> product of elementary reflectors. !> See Further Details. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	E	!> E is DOUBLE PRECISION array, dimension (N-1) !> If UPLO = 'U', E(n-nb:n-1) contains the superdiagonal !> elements of the last NB columns of the reduced matrix; !> if UPLO = 'L', E(1:nb) contains the subdiagonal elements of !> the first NB columns of the reduced matrix. !>
[out]	TAU	!> TAU is DOUBLE PRECISION array, dimension (N-1) !> The scalar factors of the elementary reflectors, stored in !> TAU(n-nb:n-1) if UPLO = 'U', and in TAU(1:nb) if UPLO = 'L'. !> See Further Details. !>
[out]	W	!> W is DOUBLE PRECISION array, dimension (LDW,NB) !> The n-by-nb matrix W required to update the unreduced part !> of A. !>
[in]	LDW	!> LDW is INTEGER !> The leading dimension of the array W. LDW >= max(1,N). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  If UPLO = 'U', the matrix Q is represented as a product of elementary
!>  reflectors
!>
!>     Q = H(n) H(n-1) . . . H(n-nb+1).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - tau * v * v**T
!>
!>  where tau is a real scalar, and v is a real vector with
!>  v(i:n) = 0 and v(i-1) = 1; v(1:i-1) is stored on exit in A(1:i-1,i),
!>  and tau in TAU(i-1).
!>
!>  If UPLO = 'L', the matrix Q is represented as a product of elementary
!>  reflectors
!>
!>     Q = H(1) H(2) . . . H(nb).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - tau * v * v**T
!>
!>  where tau is a real scalar, and v is a real vector with
!>  v(1:i) = 0 and v(i+1) = 1; v(i+1:n) is stored on exit in A(i+1:n,i),
!>  and tau in TAU(i).
!>
!>  The elements of the vectors v together form the n-by-nb matrix V
!>  which is needed, with W, to apply the transformation to the unreduced
!>  part of the matrix, using a symmetric rank-2k update of the form:
!>  A := A - V*W**T - W*V**T.
!>
!>  The contents of A on exit are illustrated by the following examples
!>  with n = 5 and nb = 2:
!>
!>  if UPLO = 'U':                       if UPLO = 'L':
!>
!>    (  a   a   a   v4  v5 )              (  d                  )
!>    (      a   a   v4  v5 )              (  1   d              )
!>    (          a   1   v5 )              (  v1  1   a          )
!>    (              d   1  )              (  v1  v2  a   a      )
!>    (                  d  )              (  v1  v2  a   a   a  )
!>
!>  where d denotes a diagonal element of the reduced matrix, a denotes
!>  an element of the original matrix that is unchanged, and vi denotes
!>  an element of the vector defining H(i).
!>

Definition at line 197 of file dlatrd.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of DLATRD: processes NB columns of the symmetric matrix A one
*  at a time (the last NB columns, from column N backwards, if
*  UPLO = 'U'; otherwise the first NB columns, from column 1
*  forwards).  For each column i it
*    1. applies to that column the updates contributed by the columns
*       already processed (two DGEMV calls using A and W),
*    2. calls DLARFG to generate the reflector for the column and
*       records the resulting off-diagonal element in E and the
*       scalar factor in TAU,
*    3. builds the matching column of W from DSYMV and DGEMV products,
*       then scales and corrects it with DSCAL, DDOT and DAXPY.
*  No argument checking is done here.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            LDA, LDW, N, NB
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * ), E( * ), TAU( * ), W( LDW, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, ONE, HALF
      parameter( zero = 0.0d+0, one = 1.0d+0, half = 0.5d+0 )
*     ..
*     .. Local Scalars ..
      INTEGER            I, IW
      DOUBLE PRECISION   ALPHA
*     ..
*     .. External Subroutines ..
      EXTERNAL           daxpy, dgemv, dlarfg, dscal, dsymv
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      DOUBLE PRECISION   DDOT
      EXTERNAL           lsame, ddot
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          min
*     ..
*     .. Executable Statements ..
*
*     Quick return if possible
*
      IF( n.LE.0 )
     $   RETURN
*
      IF( lsame( uplo, 'U' ) ) THEN
*
*        Reduce last NB columns of upper triangle
*
         DO 10 i = n, n - nb + 1, -1
*
*           IW is the column of W paired with column i of A; it runs
*           from NB down to 1 as i runs from N down to N-NB+1.
*
            iw = i - n + nb
            IF( i.LT.n ) THEN
*
*              Update A(1:i,i)
*
*              A(1:i,i) := A(1:i,i)
*                          - A(1:i,i+1:n) * W(i,iw+1:nb)**T
*                          - W(1:i,iw+1:nb) * A(i,i+1:n)**T
*
               CALL dgemv( 'No transpose', i, n-i, -one, a( 1, i+1 ),
     $                     lda, w( i, iw+1 ), ldw, one, a( 1, i ), 1 )
               CALL dgemv( 'No transpose', i, n-i, -one, w( 1, iw+1 ),
     $                     ldw, a( i, i+1 ), lda, one, a( 1, i ), 1 )
            END IF
            IF( i.GT.1 ) THEN
*
*              Generate elementary reflector H(i) to annihilate
*              A(1:i-2,i)
*
               CALL dlarfg( i-1, a( i-1, i ), a( 1, i ), 1, tau( i-1 ) )
*
*              Save the value DLARFG left in A(i-1,i) as E(i-1), then
*              store 1 there so that A(1:i-1,i) holds the vector v
*              with v(i-1) = 1.
*
               e( i-1 ) = a( i-1, i )
               a( i-1, i ) = one
*
*              Compute W(1:i-1,i)
*
*              Start from W(1:i-1,iw) := A(1:i-1,1:i-1) * v.
*
               CALL dsymv( 'Upper', i-1, one, a, lda, a( 1, i ), 1,
     $                     zero, w( 1, iw ), 1 )
               IF( i.LT.n ) THEN
*
*                 W(i+1:n,iw) is used as scratch for the two
*                 intermediate products W(1:i-1,iw+1:nb)**T * v and
*                 A(1:i-1,i+1:n)**T * v; each is multiplied back and
*                 subtracted from W(1:i-1,iw).
*
                  CALL dgemv( 'Transpose', i-1, n-i, one, w( 1, iw+1 ),
     $                        ldw, a( 1, i ), 1, zero, w( i+1, iw ), 1 )
                  CALL dgemv( 'No transpose', i-1, n-i, -one,
     $                        a( 1, i+1 ), lda, w( i+1, iw ), 1, one,
     $                        w( 1, iw ), 1 )
                  CALL dgemv( 'Transpose', i-1, n-i, one, a( 1, i+1 ),
     $                        lda, a( 1, i ), 1, zero, w( i+1, iw ), 1 )
                  CALL dgemv( 'No transpose', i-1, n-i, -one,
     $                        w( 1, iw+1 ), ldw, w( i+1, iw ), 1, one,
     $                        w( 1, iw ), 1 )
               END IF
*
*              w := tau * w, then w := w - (1/2) * tau * (w**T v) * v
*
               CALL dscal( i-1, tau( i-1 ), w( 1, iw ), 1 )
               alpha = -half*tau( i-1 )*ddot( i-1, w( 1, iw ), 1,
     $                 a( 1, i ), 1 )
               CALL daxpy( i-1, alpha, a( 1, i ), 1, w( 1, iw ), 1 )
            END IF
*
   10    CONTINUE
      ELSE
*
*        Reduce first NB columns of lower triangle
*
         DO 20 i = 1, nb
*
*           Update A(i:n,i)
*
*           A(i:n,i) := A(i:n,i) - A(i:n,1:i-1) * W(i,1:i-1)**T
*                                - W(i:n,1:i-1) * A(i,1:i-1)**T
*
            CALL dgemv( 'No transpose', n-i+1, i-1, -one, a( i, 1 ),
     $                  lda, w( i, 1 ), ldw, one, a( i, i ), 1 )
            CALL dgemv( 'No transpose', n-i+1, i-1, -one, w( i, 1 ),
     $                  ldw, a( i, 1 ), lda, one, a( i, i ), 1 )
            IF( i.LT.n ) THEN
*
*              Generate elementary reflector H(i) to annihilate
*              A(i+2:n,i)
*
*              MIN( i+2, n ) keeps the row index passed to DLARFG
*              within 1..n when i = n-1.
*
               CALL dlarfg( n-i, a( i+1, i ), a( min( i+2, n ), i ), 1,
     $                      tau( i ) )
*
*              Save the value DLARFG left in A(i+1,i) as E(i), then
*              store 1 there so that A(i+1:n,i) holds the vector v
*              with v(i+1) = 1.
*
               e( i ) = a( i+1, i )
               a( i+1, i ) = one
*
*              Compute W(i+1:n,i)
*
*              Start from W(i+1:n,i) := A(i+1:n,i+1:n) * v; then
*              W(1:i-1,i) is used as scratch for the products
*              W(i+1:n,1:i-1)**T * v and A(i+1:n,1:i-1)**T * v, each
*              multiplied back and subtracted from W(i+1:n,i).
*
               CALL dsymv( 'Lower', n-i, one, a( i+1, i+1 ), lda,
     $                     a( i+1, i ), 1, zero, w( i+1, i ), 1 )
               CALL dgemv( 'Transpose', n-i, i-1, one, w( i+1, 1 ), ldw,
     $                     a( i+1, i ), 1, zero, w( 1, i ), 1 )
               CALL dgemv( 'No transpose', n-i, i-1, -one, a( i+1, 1 ),
     $                     lda, w( 1, i ), 1, one, w( i+1, i ), 1 )
               CALL dgemv( 'Transpose', n-i, i-1, one, a( i+1, 1 ), lda,
     $                     a( i+1, i ), 1, zero, w( 1, i ), 1 )
               CALL dgemv( 'No transpose', n-i, i-1, -one, w( i+1, 1 ),
     $                     ldw, w( 1, i ), 1, one, w( i+1, i ), 1 )
*
*              w := tau * w, then w := w - (1/2) * tau * (w**T v) * v
*
               CALL dscal( n-i, tau( i ), w( i+1, i ), 1 )
               alpha = -half*tau( i )*ddot( n-i, w( i+1, i ), 1,
     $                 a( i+1, i ), 1 )
               CALL daxpy( n-i, alpha, a( i+1, i ), 1, w( i+1, i ), 1 )
            END IF
*
   20    CONTINUE
      END IF
*
      RETURN
*
*     End of DLATRD
*

◆ dlatrs()

subroutine dlatrs	(	character	uplo,
		character	trans,
		character	diag,
		character	normin,
		integer	n,
		double precision, dimension( lda, * )	a,
		integer	lda,
		double precision, dimension( * )	x,
		double precision	scale,
		double precision, dimension( * )	cnorm,
		integer	info )

DLATRS solves a triangular system of equations with the scale factor set to prevent overflow.

Download DLATRS + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLATRS solves one of the triangular systems
!>
!>    A *x = s*b  or  A**T *x = s*b
!>
!> with scaling to prevent overflow.  Here A is an upper or lower
!> triangular matrix, A**T denotes the transpose of A, x and b are
!> n-element vectors, and s is a scaling factor, usually less than
!> or equal to 1, chosen so that the components of x will be less than
!> the overflow threshold.  If the unscaled problem will not cause
!> overflow, the Level 2 BLAS routine DTRSV is called.  If the matrix A
!> is singular (A(j,j) = 0 for some j), then s is set to 0 and a
!> non-trivial solution to A*x = 0 is returned.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the matrix A is upper or lower triangular. !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> Specifies the operation applied to A. !> = 'N': Solve A * x = s*b (No transpose) !> = 'T': Solve A**T * x = s*b (Transpose) !> = 'C': Solve A**T * x = s*b (Conjugate transpose = Transpose) !>
[in]	DIAG	!> DIAG is CHARACTER*1 !> Specifies whether or not the matrix A is unit triangular. !> = 'N': Non-unit triangular !> = 'U': Unit triangular !>
[in]	NORMIN	!> NORMIN is CHARACTER*1 !> Specifies whether CNORM has been set or not. !> = 'Y': CNORM contains the column norms on entry !> = 'N': CNORM is not set on entry. On exit, the norms will !> be computed and stored in CNORM. !>
[in]	N	!> N is INTEGER !> The order of the matrix A. N >= 0. !>
[in]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> The triangular matrix A. If UPLO = 'U', the leading n by n !> upper triangular part of the array A contains the upper !> triangular matrix, and the strictly lower triangular part of !> A is not referenced. If UPLO = 'L', the leading n by n lower !> triangular part of the array A contains the lower triangular !> matrix, and the strictly upper triangular part of A is not !> referenced. If DIAG = 'U', the diagonal elements of A are !> also not referenced and are assumed to be 1. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max (1,N). !>
[in,out]	X	!> X is DOUBLE PRECISION array, dimension (N) !> On entry, the right hand side b of the triangular system. !> On exit, X is overwritten by the solution vector x. !>
[out]	SCALE	!> SCALE is DOUBLE PRECISION !> The scaling factor s for the triangular system !> A * x = s*b or A**T * x = s*b. !> If SCALE = 0, the matrix A is singular or badly scaled, and !> the vector x is an exact or approximate solution to A*x = 0. !>
[in,out]	CNORM	!> CNORM is DOUBLE PRECISION array, dimension (N) !> !> If NORMIN = 'Y', CNORM is an input argument and CNORM(j) !> contains the norm of the off-diagonal part of the j-th column !> of A. If TRANS = 'N', CNORM(j) must be greater than or equal !> to the infinity-norm, and if TRANS = 'T' or 'C', CNORM(j) !> must be greater than or equal to the 1-norm. !> !> If NORMIN = 'N', CNORM is an output argument and CNORM(j) !> returns the 1-norm of the offdiagonal part of the j-th column !> of A. !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -k, the k-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  A rough bound on x is computed; if that is less than overflow, DTRSV
!>  is called, otherwise, specific code is used which checks for possible
!>  overflow or divide-by-zero at every operation.
!>
!>  A columnwise scheme is used for solving A*x = b.  The basic algorithm
!>  if A is lower triangular is
!>
!>       x[1:n] := b[1:n]
!>       for j = 1, ..., n
!>            x(j) := x(j) / A(j,j)
!>            x[j+1:n] := x[j+1:n] - x(j) * A[j+1:n,j]
!>       end
!>
!>  Define bounds on the components of x after j iterations of the loop:
!>     M(j) = bound on x[1:j]
!>     G(j) = bound on x[j+1:n]
!>  Initially, let M(0) = 0 and G(0) = max{x(i), i=1,...,n}.
!>
!>  Then for iteration j+1 we have
!>     M(j+1) <= G(j) / | A(j+1,j+1) |
!>     G(j+1) <= G(j) + M(j+1) * | A[j+2:n,j+1] |
!>            <= G(j) ( 1 + CNORM(j+1) / | A(j+1,j+1) | )
!>
!>  where CNORM(j+1) is greater than or equal to the infinity-norm of
!>  column j+1 of A, not counting the diagonal.  Hence
!>
!>     G(j) <= G(0) product ( 1 + CNORM(i) / | A(i,i) | )
!>                  1<=i<=j
!>  and
!>
!>     |x(j)| <= ( G(0) / |A(j,j)| ) product ( 1 + CNORM(i) / |A(i,i)| )
!>                                   1<=i< j
!>
!>  Since |x(j)| <= M(j), we use the Level 2 BLAS routine DTRSV if the
!>  reciprocal of the largest M(j), j=1,..,n, is larger than
!>  max(underflow, 1/overflow).
!>
!>  The bound on x(j) is also used to determine when a step in the
!>  columnwise method can be performed without fear of overflow.  If
!>  the computed bound is greater than a large constant, x is scaled to
!>  prevent overflow, but if the bound overflows, x is set to 0, x(j) to
!>  1, and scale to 0, and a non-trivial solution to A*x = 0 is found.
!>
!>  Similarly, a row-wise scheme is used to solve A**T*x = b.  The basic
!>  algorithm for A upper triangular is
!>
!>       for j = 1, ..., n
!>            x(j) := ( b(j) - A[1:j-1,j]**T * x[1:j-1] ) / A(j,j)
!>       end
!>
!>  We simultaneously compute two bounds
!>       G(j) = bound on ( b(i) - A[1:i-1,i]**T * x[1:i-1] ), 1<=i<=j
!>       M(j) = bound on x(i), 1<=i<=j
!>
!>  The initial values are G(0) = 0, M(0) = max{b(i), i=1,..,n}, and we
!>  add the constraint G(j) >= G(j-1) and M(j) >= M(j-1) for j >= 1.
!>  Then the bound on x(j) is
!>
!>       M(j) <= M(j-1) * ( 1 + CNORM(j) ) / | A(j,j) |
!>
!>            <= M(0) * product ( ( 1 + CNORM(i) ) / |A(i,i)| )
!>                      1<=i<=j
!>
!>  and we can safely call DTRSV if 1/M(n) and 1/G(n) are both greater
!>  than max(underflow, 1/overflow).
!>

Definition at line 236 of file dlatrs.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Purpose: solve the triangular system A*x = s*b or A**T*x = s*b,
*  overwriting X (which holds b on entry) with x and returning the
*  scaling factor s in SCALE.  A cheap bound on the growth of the
*  solution is computed first.  When that bound shows no risk of
*  overflow, DTRSV is called directly; otherwise a Level 1 BLAS solve
*  is used that rescales x (accumulating the factor in SCALE) before
*  every operation that could overflow.  A zero diagonal entry sets
*  SCALE = 0 and yields a non-trivial solution of the homogeneous
*  system.
*
*  INFO = -k reports that the k-th argument is illegal, counting the
*  arguments in their documented order
*  (UPLO, TRANS, DIAG, NORMIN, N, A, LDA, X, SCALE, CNORM, INFO).
*
*     .. Scalar Arguments ..
      CHARACTER          DIAG, NORMIN, TRANS, UPLO
      INTEGER            INFO, LDA, N
      DOUBLE PRECISION   SCALE
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * ), CNORM( * ), X( * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ZERO, HALF, ONE
      parameter( zero = 0.0d+0, half = 0.5d+0, one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            NOTRAN, NOUNIT, UPPER
      INTEGER            I, IMAX, J, JFIRST, JINC, JLAST
      DOUBLE PRECISION   BIGNUM, GROW, REC, SMLNUM, SUMJ, TJJ, TJJS,
     $                   TMAX, TSCAL, USCAL, XBND, XJ, XMAX
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            IDAMAX
      DOUBLE PRECISION   DASUM, DDOT, DLAMCH
      EXTERNAL           lsame, idamax, dasum, ddot, dlamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           daxpy, dscal, dtrsv, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs, max, min
*     ..
*     .. Executable Statements ..
*
      info = 0
      upper = lsame( uplo, 'U' )
      notran = lsame( trans, 'N' )
      nounit = lsame( diag, 'N' )
*
*     Test the input parameters.
*
      IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
         info = -1
      ELSE IF( .NOT.notran .AND. .NOT.lsame( trans, 'T' ) .AND. .NOT.
     $         lsame( trans, 'C' ) ) THEN
         info = -2
      ELSE IF( .NOT.nounit .AND. .NOT.lsame( diag, 'U' ) ) THEN
         info = -3
      ELSE IF( .NOT.lsame( normin, 'Y' ) .AND. .NOT.
     $         lsame( normin, 'N' ) ) THEN
         info = -4
      ELSE IF( n.LT.0 ) THEN
         info = -5
      ELSE IF( lda.LT.max( 1, n ) ) THEN
*
*        Argument 6 (the array A) is not checked; LDA is argument 7.
*
         info = -7
      END IF
      IF( info.NE.0 ) THEN
         CALL xerbla( 'DLATRS', -info )
         RETURN
      END IF
*
*     Quick return if possible
*
      IF( n.EQ.0 )
     $   RETURN
*
*     Determine machine dependent parameters to control overflow.
*     SMLNUM = (safe minimum)/(precision) and BIGNUM = 1/SMLNUM are the
*     thresholds used by every overflow/underflow test below.
*
      smlnum = dlamch( 'Safe minimum' ) / dlamch( 'Precision' )
      bignum = one / smlnum
      scale = one
*
      IF( lsame( normin, 'N' ) ) THEN
*
*        Compute the 1-norm of each column, not including the diagonal.
*
         IF( upper ) THEN
*
*           A is upper triangular.
*
            DO 10 j = 1, n
               cnorm( j ) = dasum( j-1, a( 1, j ), 1 )
   10       CONTINUE
         ELSE
*
*           A is lower triangular.
*
            DO 20 j = 1, n - 1
               cnorm( j ) = dasum( n-j, a( j+1, j ), 1 )
   20       CONTINUE
            cnorm( n ) = zero
         END IF
      END IF
*
*     Scale the column norms by TSCAL if the maximum element in CNORM is
*     greater than BIGNUM.
*
      imax = idamax( n, cnorm, 1 )
      tmax = cnorm( imax )
      IF( tmax.LE.bignum ) THEN
         tscal = one
      ELSE
*
*        TSCAL is chosen so that TSCAL*TMAX = 1/SMLNUM = BIGNUM.
*
         tscal = one / ( smlnum*tmax )
         CALL dscal( n, tscal, cnorm, 1 )
      END IF
*
*     Compute a bound on the computed solution vector to see if the
*     Level 2 BLAS routine DTRSV can be used.
*
      j = idamax( n, x, 1 )
      xmax = abs( x( j ) )
      xbnd = xmax
      IF( notran ) THEN
*
*        Compute the growth in A * x = b.
*
         IF( upper ) THEN
            jfirst = n
            jlast = 1
            jinc = -1
         ELSE
            jfirst = 1
            jlast = n
            jinc = 1
         END IF
*
*        If CNORM had to be rescaled, skip the growth estimate:
*        GROW = 0 makes the test GROW*TSCAL > SMLNUM below fail, which
*        selects the Level 1 BLAS solve.
*
         IF( tscal.NE.one ) THEN
            grow = zero
            GO TO 50
         END IF
*
         IF( nounit ) THEN
*
*           A is non-unit triangular.
*
*           Compute GROW = 1/G(j) and XBND = 1/M(j).
*           Initially, G(0) = max{x(i), i=1,...,n}.
*
            grow = one / max( xbnd, smlnum )
            xbnd = grow
            DO 30 j = jfirst, jlast, jinc
*
*              Exit the loop if the growth factor is too small.
*
               IF( grow.LE.smlnum )
     $            GO TO 50
*
*              M(j) = G(j-1) / abs(A(j,j))
*
               tjj = abs( a( j, j ) )
               xbnd = min( xbnd, min( one, tjj )*grow )
               IF( tjj+cnorm( j ).GE.smlnum ) THEN
*
*                 G(j) = G(j-1)*( 1 + CNORM(j) / abs(A(j,j)) )
*
                  grow = grow*( tjj / ( tjj+cnorm( j ) ) )
               ELSE
*
*                 G(j) could overflow, set GROW to 0.
*
                  grow = zero
               END IF
   30       CONTINUE
*
*           Reached only when the loop ran to completion: the decision
*           below is then based on XBND, the reciprocal bound on x.
*
            grow = xbnd
         ELSE
*
*           A is unit triangular.
*
*           Compute GROW = 1/G(j), where G(0) = max{x(i), i=1,...,n}.
*
            grow = min( one, one / max( xbnd, smlnum ) )
            DO 40 j = jfirst, jlast, jinc
*
*              Exit the loop if the growth factor is too small.
*
               IF( grow.LE.smlnum )
     $            GO TO 50
*
*              G(j) = G(j-1)*( 1 + CNORM(j) )
*
               grow = grow*( one / ( one+cnorm( j ) ) )
   40       CONTINUE
         END IF
   50    CONTINUE
*
      ELSE
*
*        Compute the growth in A**T * x = b.
*
         IF( upper ) THEN
            jfirst = 1
            jlast = n
            jinc = 1
         ELSE
            jfirst = n
            jlast = 1
            jinc = -1
         END IF
*
*        As in the no-transpose case, a rescaled CNORM forces the
*        Level 1 BLAS solve by setting GROW = 0.
*
         IF( tscal.NE.one ) THEN
            grow = zero
            GO TO 80
         END IF
*
         IF( nounit ) THEN
*
*           A is non-unit triangular.
*
*           Compute GROW = 1/G(j) and XBND = 1/M(j).
*           Initially, M(0) = max{x(i), i=1,...,n}.
*
            grow = one / max( xbnd, smlnum )
            xbnd = grow
            DO 60 j = jfirst, jlast, jinc
*
*              Exit the loop if the growth factor is too small.
*
               IF( grow.LE.smlnum )
     $            GO TO 80
*
*              G(j) = max( G(j-1), M(j-1)*( 1 + CNORM(j) ) )
*
               xj = one + cnorm( j )
               grow = min( grow, xbnd / xj )
*
*              M(j) = M(j-1)*( 1 + CNORM(j) ) / abs(A(j,j))
*
               tjj = abs( a( j, j ) )
               IF( xj.GT.tjj )
     $            xbnd = xbnd*( tjj / xj )
   60       CONTINUE
            grow = min( grow, xbnd )
         ELSE
*
*           A is unit triangular.
*
*           Compute GROW = 1/G(j), where G(0) = max{x(i), i=1,...,n}.
*
            grow = min( one, one / max( xbnd, smlnum ) )
            DO 70 j = jfirst, jlast, jinc
*
*              Exit the loop if the growth factor is too small.
*
               IF( grow.LE.smlnum )
     $            GO TO 80
*
*              G(j) = ( 1 + CNORM(j) )*G(j-1)
*
               xj = one + cnorm( j )
               grow = grow / xj
   70       CONTINUE
         END IF
   80    CONTINUE
      END IF
*
      IF( ( grow*tscal ).GT.smlnum ) THEN
*
*        Use the Level 2 BLAS solve if the reciprocal of the bound on
*        elements of X is not too small.
*
         CALL dtrsv( uplo, trans, diag, n, a, lda, x, 1 )
      ELSE
*
*        Use a Level 1 BLAS solve, scaling intermediate results.
*
         IF( xmax.GT.bignum ) THEN
*
*           Scale X so that its components are less than or equal to
*           BIGNUM in absolute value.
*
            scale = bignum / xmax
            CALL dscal( n, scale, x, 1 )
            xmax = bignum
         END IF
*
         IF( notran ) THEN
*
*           Solve A * x = b
*
            DO 110 j = jfirst, jlast, jinc
*
*              Compute x(j) = b(j) / A(j,j), scaling x if necessary.
*
               xj = abs( x( j ) )
               IF( nounit ) THEN
                  tjjs = a( j, j )*tscal
               ELSE
                  tjjs = tscal
                  IF( tscal.EQ.one )
     $               GO TO 100
               END IF
               tjj = abs( tjjs )
               IF( tjj.GT.smlnum ) THEN
*
*                    abs(A(j,j)) > SMLNUM:
*
                  IF( tjj.LT.one ) THEN
                     IF( xj.GT.tjj*bignum ) THEN
*
*                          Scale x by 1/b(j).
*
                        rec = one / xj
                        CALL dscal( n, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                  END IF
                  x( j ) = x( j ) / tjjs
                  xj = abs( x( j ) )
               ELSE IF( tjj.GT.zero ) THEN
*
*                    0 < abs(A(j,j)) <= SMLNUM:
*
                  IF( xj.GT.tjj*bignum ) THEN
*
*                       Scale x by (1/abs(x(j)))*abs(A(j,j))*BIGNUM
*                       to avoid overflow when dividing by A(j,j).
*
                     rec = ( tjj*bignum ) / xj
                     IF( cnorm( j ).GT.one ) THEN
*
*                          Scale by 1/CNORM(j) to avoid overflow when
*                          multiplying x(j) times column j.
*
                        rec = rec / cnorm( j )
                     END IF
                     CALL dscal( n, rec, x, 1 )
                     scale = scale*rec
                     xmax = xmax*rec
                  END IF
                  x( j ) = x( j ) / tjjs
                  xj = abs( x( j ) )
               ELSE
*
*                    A(j,j) = 0:  Set x(1:n) = 0, x(j) = 1, and
*                    scale = 0, and compute a solution to A*x = 0.
*
                  DO 90 i = 1, n
                     x( i ) = zero
   90             CONTINUE
                  x( j ) = one
                  xj = one
                  scale = zero
                  xmax = zero
               END IF
*
*              Label 100 is the jump target for a unit diagonal with
*              TSCAL = 1, where x(j) needs no division.
*
  100          CONTINUE
*
*              Scale x if necessary to avoid overflow when adding a
*              multiple of column j of A.
*
               IF( xj.GT.one ) THEN
                  rec = one / xj
                  IF( cnorm( j ).GT.( bignum-xmax )*rec ) THEN
*
*                    Scale x by 1/(2*abs(x(j))).
*
                     rec = rec*half
                     CALL dscal( n, rec, x, 1 )
                     scale = scale*rec
                  END IF
               ELSE IF( xj*cnorm( j ).GT.( bignum-xmax ) ) THEN
*
*                 Scale x by 1/2.
*
                  CALL dscal( n, half, x, 1 )
                  scale = scale*half
               END IF
*
               IF( upper ) THEN
                  IF( j.GT.1 ) THEN
*
*                    Compute the update
*                       x(1:j-1) := x(1:j-1) - x(j) * A(1:j-1,j)
*
                     CALL daxpy( j-1, -x( j )*tscal, a( 1, j ), 1, x,
     $                           1 )
                     i = idamax( j-1, x, 1 )
                     xmax = abs( x( i ) )
                  END IF
               ELSE
                  IF( j.LT.n ) THEN
*
*                    Compute the update
*                       x(j+1:n) := x(j+1:n) - x(j) * A(j+1:n,j)
*
                     CALL daxpy( n-j, -x( j )*tscal, a( j+1, j ), 1,
     $                           x( j+1 ), 1 )
*
*                    IDAMAX indexes relative to x(j+1), so add j to get
*                    the position in x.
*
                     i = j + idamax( n-j, x( j+1 ), 1 )
                     xmax = abs( x( i ) )
                  END IF
               END IF
  110       CONTINUE
*
         ELSE
*
*           Solve A**T * x = b
*
            DO 160 j = jfirst, jlast, jinc
*
*              Compute x(j) = b(j) - sum A(k,j)*x(k).
*                                    k<>j
*
               xj = abs( x( j ) )
               uscal = tscal
               rec = one / max( xmax, one )
               IF( cnorm( j ).GT.( bignum-xj )*rec ) THEN
*
*                 If x(j) could overflow, scale x by 1/(2*XMAX).
*
                  rec = rec*half
                  IF( nounit ) THEN
                     tjjs = a( j, j )*tscal
                  ELSE
                     tjjs = tscal
                  END IF
                  tjj = abs( tjjs )
                  IF( tjj.GT.one ) THEN
*
*                       Divide by A(j,j) when scaling x if A(j,j) > 1.
*
                     rec = min( one, rec*tjj )
                     uscal = uscal / tjjs
                  END IF
                  IF( rec.LT.one ) THEN
                     CALL dscal( n, rec, x, 1 )
                     scale = scale*rec
                     xmax = xmax*rec
                  END IF
               END IF
*
               sumj = zero
               IF( uscal.EQ.one ) THEN
*
*                 If the scaling needed for A in the dot product is 1,
*                 call DDOT to perform the dot product.
*
                  IF( upper ) THEN
                     sumj = ddot( j-1, a( 1, j ), 1, x, 1 )
                  ELSE IF( j.LT.n ) THEN
                     sumj = ddot( n-j, a( j+1, j ), 1, x( j+1 ), 1 )
                  END IF
               ELSE
*
*                 Otherwise, use in-line code for the dot product.
*
                  IF( upper ) THEN
                     DO 120 i = 1, j - 1
                        sumj = sumj + ( a( i, j )*uscal )*x( i )
  120                CONTINUE
                  ELSE IF( j.LT.n ) THEN
                     DO 130 i = j + 1, n
                        sumj = sumj + ( a( i, j )*uscal )*x( i )
  130                CONTINUE
                  END IF
               END IF
*
               IF( uscal.EQ.tscal ) THEN
*
*                 Compute x(j) := ( x(j) - sumj ) / A(j,j) if 1/A(j,j)
*                 was not used to scale the dotproduct.
*
                  x( j ) = x( j ) - sumj
                  xj = abs( x( j ) )
                  IF( nounit ) THEN
                     tjjs = a( j, j )*tscal
                  ELSE
                     tjjs = tscal
                     IF( tscal.EQ.one )
     $                  GO TO 150
                  END IF
*
*                    Compute x(j) = x(j) / A(j,j), scaling if necessary.
*
                  tjj = abs( tjjs )
                  IF( tjj.GT.smlnum ) THEN
*
*                       abs(A(j,j)) > SMLNUM:
*
                     IF( tjj.LT.one ) THEN
                        IF( xj.GT.tjj*bignum ) THEN
*
*                             Scale X by 1/abs(x(j)).
*
                           rec = one / xj
                           CALL dscal( n, rec, x, 1 )
                           scale = scale*rec
                           xmax = xmax*rec
                        END IF
                     END IF
                     x( j ) = x( j ) / tjjs
                  ELSE IF( tjj.GT.zero ) THEN
*
*                       0 < abs(A(j,j)) <= SMLNUM:
*
                     IF( xj.GT.tjj*bignum ) THEN
*
*                          Scale x by (1/abs(x(j)))*abs(A(j,j))*BIGNUM.
*
                        rec = ( tjj*bignum ) / xj
                        CALL dscal( n, rec, x, 1 )
                        scale = scale*rec
                        xmax = xmax*rec
                     END IF
                     x( j ) = x( j ) / tjjs
                  ELSE
*
*                       A(j,j) = 0:  Set x(1:n) = 0, x(j) = 1, and
*                       scale = 0, and compute a solution to A**T*x = 0.
*
                     DO 140 i = 1, n
                        x( i ) = zero
  140                CONTINUE
                     x( j ) = one
                     scale = zero
                     xmax = zero
                  END IF
*
*                 Label 150 is the jump target for a unit diagonal with
*                 TSCAL = 1, where x(j) needs no division.
*
  150             CONTINUE
               ELSE
*
*                 Compute x(j) := x(j) / A(j,j)  - sumj if the dot
*                 product has already been divided by 1/A(j,j).
*
                  x( j ) = x( j ) / tjjs - sumj
               END IF
               xmax = max( xmax, abs( x( j ) ) )
  160       CONTINUE
         END IF
*
*        The Level 1 solve worked with TSCAL*A (see TJJS and the
*        TSCAL factors in the updates), so divide TSCAL out of the
*        returned scale factor.
*
         scale = scale / tscal
      END IF
*
*     Scale the column norms by 1/TSCAL for return.
*
      IF( tscal.NE.one ) THEN
         CALL dscal( n, one / tscal, cnorm, 1 )
      END IF
*
      RETURN
*
*     End of DLATRS
*

◆ dlauu2()

subroutine dlauu2	(	character	uplo,
		integer	n,
		double precision, dimension( lda, * )	a,
		integer	lda,
		integer	info )

DLAUU2 computes the product U * U**T or L**T * L, where U and L are upper or lower triangular matrices (unblocked algorithm).

Download DLAUU2 + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAUU2 computes the product U * U**T or L**T * L, where the triangular
!> factor U or L is stored in the upper or lower triangular part of
!> the array A.
!>
!> If UPLO = 'U' or 'u' then the upper triangle of the result is stored,
!> overwriting the factor U in A.
!> If UPLO = 'L' or 'l' then the lower triangle of the result is stored,
!> overwriting the factor L in A.
!>
!> This is the unblocked form of the algorithm, calling Level 2 BLAS.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the triangular factor stored in the array A !> is upper or lower triangular: !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	N	!> N is INTEGER !> The order of the triangular factor U or L. N >= 0. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> On entry, the triangular factor U or L. !> On exit, if UPLO = 'U', the upper triangle of A is !> overwritten with the upper triangle of the product U * U**T; !> if UPLO = 'L', the lower triangle of A is overwritten with !> the lower triangle of the product L**T * L. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -k, the k-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 101 of file dlauu2.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Unblocked (Level 2 BLAS) computation of U * U**T or L**T * L, where
*  the triangular factor is held in the triangle of A selected by UPLO
*  and is overwritten by the same triangle of the product.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDA, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE
      parameter( one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            K
      DOUBLE PRECISION   DKK
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      DOUBLE PRECISION   DDOT
      EXTERNAL           lsame, ddot
*     ..
*     .. External Subroutines ..
      EXTERNAL           dgemv, dscal, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  The checks run from the last argument
*     to the first, each overwriting INFO, so the lowest-numbered
*     offending argument is the one that ends up being reported.
*
      upper = lsame( uplo, 'U' )
      info = 0
      IF( lda.LT.max( 1, n ) )
     $   info = -4
      IF( n.LT.0 )
     $   info = -2
      IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) )
     $   info = -1
      IF( info.LT.0 ) THEN
         CALL xerbla( 'DLAUU2', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty matrix.
*
      IF( n.LT.1 )
     $   RETURN
*
      IF( upper ) THEN
*
*        Form U * U**T one column at a time.  The diagonal entry is
*        saved in DKK before it is overwritten because DGEMV still
*        needs the old value as the multiplier of column k.
*
         DO k = 1, n - 1
            dkk = a( k, k )
            a( k, k ) = ddot( n-k+1, a( k, k ), lda, a( k, k ), lda )
            CALL dgemv( 'No transpose', k-1, n-k, one, a( 1, k+1 ),
     $                  lda, a( k, k+1 ), lda, dkk, a( 1, k ), 1 )
         END DO
*
*        The last column has nothing to its right: just scale it by
*        its own diagonal entry.
*
         dkk = a( n, n )
         CALL dscal( n, dkk, a( 1, n ), 1 )
*
      ELSE
*
*        Form L**T * L one row at a time, mirroring the upper case.
*
         DO k = 1, n - 1
            dkk = a( k, k )
            a( k, k ) = ddot( n-k+1, a( k, k ), 1, a( k, k ), 1 )
            CALL dgemv( 'Transpose', n-k, k-1, one, a( k+1, 1 ), lda,
     $                  a( k+1, k ), 1, dkk, a( k, 1 ), lda )
         END DO
*
*        The last row has nothing below it: scale it by its own
*        diagonal entry.
*
         dkk = a( n, n )
         CALL dscal( n, dkk, a( n, 1 ), lda )
      END IF
*
      RETURN
*
*     End of DLAUU2
*

◆ dlauum()

subroutine dlauum	(	character	uplo,
		integer	n,
		double precision, dimension( lda, * )	a,
		integer	lda,
		integer	info )

DLAUUM computes the product U * U**T or L**T * L, where U and L are upper or lower triangular matrices (blocked algorithm).

Download DLAUUM + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DLAUUM computes the product U * U**T or L**T * L, where the triangular
!> factor U or L is stored in the upper or lower triangular part of
!> the array A.
!>
!> If UPLO = 'U' or 'u' then the upper triangle of the result is stored,
!> overwriting the factor U in A.
!> If UPLO = 'L' or 'l' then the lower triangle of the result is stored,
!> overwriting the factor L in A.
!>
!> This is the blocked form of the algorithm, calling Level 3 BLAS.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the triangular factor stored in the array A !> is upper or lower triangular: !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	N	!> N is INTEGER !> The order of the triangular factor U or L. N >= 0. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension (LDA,N) !> On entry, the triangular factor U or L. !> On exit, if UPLO = 'U', the upper triangle of A is !> overwritten with the upper triangle of the product U * U**T; !> if UPLO = 'L', the lower triangle of A is overwritten with !> the lower triangle of the product L**T * L. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	INFO	!> INFO is INTEGER !> = 0: successful exit !> < 0: if INFO = -k, the k-th argument had an illegal value !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 101 of file dlauum.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Blocked (Level 3 BLAS) computation of U * U**T or L**T * L, where
*  the triangular factor is held in the triangle of A selected by UPLO
*  and is overwritten by the same triangle of the product.  Diagonal
*  blocks are handled by the unblocked routine DLAUU2.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            INFO, LDA, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE
      parameter( one = 1.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            UPPER
      INTEGER            JS, JW, NBLK, NTRAIL
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      INTEGER            ILAENV
      EXTERNAL           lsame, ilaenv
*     ..
*     .. External Subroutines ..
      EXTERNAL           dgemm, dlauu2, dsyrk, dtrmm, xerbla
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Executable Statements ..
*
*     Validate the arguments.  The checks run from the last argument
*     to the first, each overwriting INFO, so the lowest-numbered
*     offending argument is the one that ends up being reported.
*
      upper = lsame( uplo, 'U' )
      info = 0
      IF( lda.LT.max( 1, n ) )
     $   info = -4
      IF( n.LT.0 )
     $   info = -2
      IF( .NOT.( upper .OR. lsame( uplo, 'L' ) ) )
     $   info = -1
      IF( info.LT.0 ) THEN
         CALL xerbla( 'DLAUUM', -info )
         RETURN
      END IF
*
*     Nothing to do for an empty matrix.
*
      IF( n.LT.1 )
     $   RETURN
*
*     Ask ILAENV for the block size to use.
*
      nblk = ilaenv( 1, 'DLAUUM', uplo, n, -1, -1, -1 )
*
*     A block size of at most 1, or one that covers the whole matrix,
*     leaves nothing to block: hand the problem to the unblocked code.
*
      IF( nblk.LE.1 .OR. nblk.GE.n ) THEN
         CALL dlauu2( uplo, n, a, lda, info )
         RETURN
      END IF
*
*     Blocked algorithm.  JS is the first row/column of the current
*     diagonal block, JW its order, and NTRAIL the number of
*     rows/columns of A that lie beyond the block.
*
      IF( upper ) THEN
*
*        Compute the product U * U**T.
*
         DO js = 1, n, nblk
            jw = min( nblk, n-js+1 )
            ntrail = n - js - jw + 1
            CALL dtrmm( 'Right', 'Upper', 'Transpose', 'Non-unit',
     $                  js-1, jw, one, a( js, js ), lda, a( 1, js ),
     $                  lda )
            CALL dlauu2( 'Upper', jw, a( js, js ), lda, info )
            IF( ntrail.GT.0 ) THEN
               CALL dgemm( 'No transpose', 'Transpose', js-1, jw,
     $                     ntrail, one, a( 1, js+jw ), lda,
     $                     a( js, js+jw ), lda, one, a( 1, js ), lda )
               CALL dsyrk( 'Upper', 'No transpose', jw, ntrail, one,
     $                     a( js, js+jw ), lda, one, a( js, js ), lda )
            END IF
         END DO
      ELSE
*
*        Compute the product L**T * L.
*
         DO js = 1, n, nblk
            jw = min( nblk, n-js+1 )
            ntrail = n - js - jw + 1
            CALL dtrmm( 'Left', 'Lower', 'Transpose', 'Non-unit', jw,
     $                  js-1, one, a( js, js ), lda, a( js, 1 ), lda )
            CALL dlauu2( 'Lower', jw, a( js, js ), lda, info )
            IF( ntrail.GT.0 ) THEN
               CALL dgemm( 'Transpose', 'No transpose', jw, js-1,
     $                     ntrail, one, a( js+jw, js ), lda,
     $                     a( js+jw, 1 ), lda, one, a( js, 1 ), lda )
               CALL dsyrk( 'Lower', 'Transpose', jw, ntrail, one,
     $                     a( js+jw, js ), lda, one, a( js, js ), lda )
            END IF
         END DO
      END IF
*
      RETURN
*
*     End of DLAUUM
*

◆ drscl()

subroutine drscl	(	integer	n,
		double precision	sa,
		double precision, dimension( * )	sx,
		integer	incx )

DRSCL multiplies a vector by the reciprocal of a real scalar.

Download DRSCL + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DRSCL multiplies an n-element real vector x by the real scalar 1/a.
!> This is done without overflow or underflow as long as
!> the final result x/a does not overflow or underflow.
!>

Parameters

[in]	N	!> N is INTEGER !> The number of components of the vector x. !>
[in]	SA	!> SA is DOUBLE PRECISION !> The scalar a which is used to divide each component of x. !> SA must be nonzero, or the subroutine will divide by zero. !>
[in,out]	SX	!> SX is DOUBLE PRECISION array, dimension !> (1+(N-1)*abs(INCX)) !> The n-element vector x. !>
[in]	INCX	!> INCX is INTEGER !> The increment between successive values of the vector SX. !> > 0: SX(1) = X(1) and SX(1+(i-1)*INCX) = x(i), 1< i<= n !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Definition at line 83 of file drscl.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Multiplies the n-element vector SX (stride INCX) by 1/SA.  The
*  reciprocal is applied as a sequence of DSCAL calls: while the
*  remaining numerator and denominator are too far apart in magnitude,
*  the vector is scaled by SMLNUM or BIGNUM and the corresponding
*  factor is removed from the pending ratio.
*
*     .. Scalar Arguments ..
      INTEGER            INCX, N
      DOUBLE PRECISION   SA
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   SX( * )
*     ..
*
* =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   ONE, ZERO
      parameter( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
      LOGICAL            FINISHED
      DOUBLE PRECISION   BIGNUM, DEN, DENDN, FACTOR, NUM, NUMDN,
     $                   SMLNUM
*     ..
*     .. External Functions ..
      DOUBLE PRECISION   DLAMCH
      EXTERNAL           dlamch
*     ..
*     .. External Subroutines ..
      EXTERNAL           dscal, dlabad
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          abs
*     ..
*     .. Executable Statements ..
*
*     Nothing to scale for a non-positive length.
*
      IF( n.LT.1 )
     $   RETURN
*
*     Machine thresholds.
*
      smlnum = dlamch( 'S' )
      bignum = one / smlnum
      CALL dlabad( smlnum, bignum )
*
*     The factor still to be applied is NUM / DEN, starting as 1 / SA.
*
      den = sa
      num = one
      finished = .false.
*
      DO WHILE( .NOT.finished )
         dendn = den*smlnum
         numdn = num / bignum
         IF( abs( dendn ).GT.abs( num ) .AND. num.NE.zero ) THEN
*
*           DEN is large compared to NUM: apply SMLNUM now and take
*           it out of the denominator.
*
            factor = smlnum
            den = dendn
         ELSE IF( abs( numdn ).GT.abs( den ) ) THEN
*
*           DEN is small compared to NUM: apply BIGNUM now and take
*           it out of the numerator.
*
            factor = bignum
            num = numdn
         ELSE
*
*           The ratio can be formed directly; this is the last pass.
*
            factor = num / den
            finished = .true.
         END IF
*
*        Apply this pass's factor to the vector.
*
         CALL dscal( n, factor, sx, incx )
      END DO
*
      RETURN
*
*     End of DRSCL
*

◆ dtprfb()

subroutine dtprfb	(	character	side,
		character	trans,
		character	direct,
		character	storev,
		integer	m,
		integer	n,
		integer	k,
		integer	l,
		double precision, dimension( ldv, * )	v,
		integer	ldv,
		double precision, dimension( ldt, * )	t,
		integer	ldt,
		double precision, dimension( lda, * )	a,
		integer	lda,
		double precision, dimension( ldb, * )	b,
		integer	ldb,
		double precision, dimension( ldwork, * )	work,
		integer	ldwork )

DTPRFB applies a real or complex "triangular-pentagonal" blocked reflector to a real or complex matrix, which is composed of two blocks.

Download DTPRFB + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> DTPRFB applies a real  block reflector H or its
!> transpose H**T to a real matrix C, which is composed of two
!> blocks A and B, either from the left or right.
!>
!>

Parameters

[in]	SIDE	!> SIDE is CHARACTER*1 !> = 'L': apply H or H**T from the Left !> = 'R': apply H or H**T from the Right !>
[in]	TRANS	!> TRANS is CHARACTER*1 !> = 'N': apply H (No transpose) !> = 'T': apply H**T (Transpose) !>
[in]	DIRECT	!> DIRECT is CHARACTER*1 !> Indicates how H is formed from a product of elementary !> reflectors !> = 'F': H = H(1) H(2) . . . H(k) (Forward) !> = 'B': H = H(k) . . . H(2) H(1) (Backward) !>
[in]	STOREV	!> STOREV is CHARACTER*1 !> Indicates how the vectors which define the elementary !> reflectors are stored: !> = 'C': Columns !> = 'R': Rows !>
[in]	M	!> M is INTEGER !> The number of rows of the matrix B. !> M >= 0. !>
[in]	N	!> N is INTEGER !> The number of columns of the matrix B. !> N >= 0. !>
[in]	K	!> K is INTEGER !> The order of the matrix T, i.e. the number of elementary !> reflectors whose product defines the block reflector. !> K >= 0. !>
[in]	L	!> L is INTEGER !> The order of the trapezoidal part of V. !> K >= L >= 0. See Further Details. !>
[in]	V	!> V is DOUBLE PRECISION array, dimension !> (LDV,K) if STOREV = 'C' !> (LDV,M) if STOREV = 'R' and SIDE = 'L' !> (LDV,N) if STOREV = 'R' and SIDE = 'R' !> The pentagonal matrix V, which contains the elementary reflectors !> H(1), H(2), ..., H(K). See Further Details. !>
[in]	LDV	!> LDV is INTEGER !> The leading dimension of the array V. !> If STOREV = 'C' and SIDE = 'L', LDV >= max(1,M); !> if STOREV = 'C' and SIDE = 'R', LDV >= max(1,N); !> if STOREV = 'R', LDV >= K. !>
[in]	T	!> T is DOUBLE PRECISION array, dimension (LDT,K) !> The triangular K-by-K matrix T in the representation of the !> block reflector. !>
[in]	LDT	!> LDT is INTEGER !> The leading dimension of the array T. !> LDT >= K. !>
[in,out]	A	!> A is DOUBLE PRECISION array, dimension !> (LDA,N) if SIDE = 'L' or (LDA,K) if SIDE = 'R' !> On entry, the K-by-N or M-by-K matrix A. !> On exit, A is overwritten by the corresponding block of !> H*C or H**T*C or C*H or C*H**T. See Further Details. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. !> If SIDE = 'L', LDA >= max(1,K); !> If SIDE = 'R', LDA >= max(1,M). !>
[in,out]	B	!> B is DOUBLE PRECISION array, dimension (LDB,N) !> On entry, the M-by-N matrix B. !> On exit, B is overwritten by the corresponding block of !> H*C or H**T*C or C*H or C*H**T. See Further Details. !>
[in]	LDB	!> LDB is INTEGER !> The leading dimension of the array B. !> LDB >= max(1,M). !>
[out]	WORK	!> WORK is DOUBLE PRECISION array, dimension !> (LDWORK,N) if SIDE = 'L', !> (LDWORK,K) if SIDE = 'R'. !>
[in]	LDWORK	!> LDWORK is INTEGER !> The leading dimension of the array WORK. !> If SIDE = 'L', LDWORK >= K; !> if SIDE = 'R', LDWORK >= M. !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  The matrix C is a composite matrix formed from blocks A and B.
!>  The block B is of size M-by-N; if SIDE = 'R', A is of size M-by-K,
!>  and if SIDE = 'L', A is of size K-by-N.
!>
!>  If SIDE = 'R' and DIRECT = 'F', C = [A B].
!>
!>  If SIDE = 'L' and DIRECT = 'F', C = [A]
!>                                      [B].
!>
!>  If SIDE = 'R' and DIRECT = 'B', C = [B A].
!>
!>  If SIDE = 'L' and DIRECT = 'B', C = [B]
!>                                      [A].
!>
!>  The pentagonal matrix V is composed of a rectangular block V1 and a
!>  trapezoidal block V2.  The size of the trapezoidal block is determined by
!>  the parameter L, where 0<=L<=K.  If L=K, the V2 block of V is triangular;
!>  if L=0, there is no trapezoidal block, thus V = V1 is rectangular.
!>
!>  If DIRECT = 'F' and STOREV = 'C':  V = [V1]
!>                                         [V2]
!>     - V2 is upper trapezoidal (first L rows of K-by-K upper triangular)
!>
!>  If DIRECT = 'F' and STOREV = 'R':  V = [V1 V2]
!>
!>     - V2 is lower trapezoidal (first L columns of K-by-K lower triangular)
!>
!>  If DIRECT = 'B' and STOREV = 'C':  V = [V2]
!>                                         [V1]
!>     - V2 is lower trapezoidal (last L rows of K-by-K lower triangular)
!>
!>  If DIRECT = 'B' and STOREV = 'R':  V = [V2 V1]
!>
!>     - V2 is upper trapezoidal (last L columns of K-by-K upper triangular)
!>
!>  If STOREV = 'C' and SIDE = 'L', V is M-by-K with V2 L-by-K.
!>
!>  If STOREV = 'C' and SIDE = 'R', V is N-by-K with V2 L-by-K.
!>
!>  If STOREV = 'R' and SIDE = 'L', V is K-by-M with V2 K-by-L.
!>
!>  If STOREV = 'R' and SIDE = 'R', V is K-by-N with V2 K-by-L.
!>

Definition at line 249 of file dtprfb.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of DTPRFB: applies the triangular-pentagonal block reflector
*  H (or H**T), defined by the pentagonal matrix V and the triangular
*  K-by-K matrix T, to the composite matrix C formed from the blocks
*  A and B.  A and B are overwritten in place; WORK (leading
*  dimension LDWORK) is scratch space.
*
*  SIDE, DIRECT and STOREV select one of eight code paths.  Each path
*  performs the same three phases:
*    1. WORK := A + (product of V and B).  The triangular L-by-L part
*       of the trapezoidal block V2 is applied with DTRMM, the
*       remaining rectangular parts with DGEMM.
*    2. WORK := WORK multiplied by T or T**T (chosen by TRANS), and
*       A := A - WORK.
*    3. B := B - (product of V and WORK), again split into DGEMM
*       pieces and one DTRMM on the triangular part of V2.
*
*  If SIDE, DIRECT or STOREV holds an unrecognised value, no branch
*  is taken and the routine returns without touching A, B or WORK.
*
*     .. Scalar Arguments ..
      CHARACTER DIRECT, SIDE, STOREV, TRANS
      INTEGER   K, L, LDA, LDB, LDT, LDV, LDWORK, M, N
*     ..
*     .. Array Arguments ..
      DOUBLE PRECISION   A( LDA, * ), B( LDB, * ), T( LDT, * ),
     $          V( LDV, * ), WORK( LDWORK, * )
*     ..
*
*  ==========================================================================
*
*     .. Parameters ..
*     Double precision literals, as in the other D-routines.
      DOUBLE PRECISION   ONE, ZERO
      parameter( one = 1.0d+0, zero = 0.0d+0 )
*     ..
*     .. Local Scalars ..
*     MP / NP : first row / column of B (and of V) that meets the
*               trapezoidal block V2, clamped into the valid range.
*     KP      : first column / row of V (and of WORK) on the other
*               side of the L-by-L triangular part of V2.
      INTEGER   I, J, MP, NP, KP
      LOGICAL   LEFT, FORWARD, COLUMN, RIGHT, BACKWARD, ROW
*     ..
*     .. External Functions ..
      LOGICAL   LSAME
      EXTERNAL  lsame
*     ..
*     .. External Subroutines ..
      EXTERNAL  dgemm, dtrmm
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC min
*     ..
*     .. Executable Statements ..
*
*     Quick return if possible
*
      IF( m.LE.0 .OR. n.LE.0 .OR. k.LE.0 .OR. l.LT.0 ) RETURN
*
*     Decode the three option characters into logical flags.  An
*     unrecognised character leaves both flags of its pair false.
*
      IF( lsame( storev, 'C' ) ) THEN
         column = .true.
         row = .false.
      ELSE IF ( lsame( storev, 'R' ) ) THEN
         column = .false.
         row = .true.
      ELSE
         column = .false.
         row = .false.
      END IF
*
      IF( lsame( side, 'L' ) ) THEN
         left = .true.
         right = .false.
      ELSE IF( lsame( side, 'R' ) ) THEN
         left = .false.
         right = .true.
      ELSE
         left = .false.
         right = .false.
      END IF
*
      IF( lsame( direct, 'F' ) ) THEN
         forward = .true.
         backward = .false.
      ELSE IF( lsame( direct, 'B' ) ) THEN
         forward = .false.
         backward = .true.
      ELSE
         forward = .false.
         backward = .false.
      END IF
*
* ---------------------------------------------------------------------------
*
      IF( column .AND. forward .AND. left  ) THEN
*
* ---------------------------------------------------------------------------
*
*        Let  W =  [ I ]    (K-by-K)
*                  [ V ]    (M-by-K)
*
*        Form  H C  or  H**T C  where  C = [ A ]  (K-by-N)
*                                          [ B ]  (M-by-N)
*
*        H = I - W T W**T          or  H**T = I - W T**T W**T
*
*        A = A -   T (A + V**T B)  or  A = A -   T**T (A + V**T B)
*        B = B - V T (A + V**T B)  or  B = B - V T**T (A + V**T B)
*
* ---------------------------------------------------------------------------
*
         mp = min( m-l+1, m )
         kp = min( l+1, k )
*
*        WORK := V**T B  (last L rows of B go through the triangle)
*
         DO j = 1, n
            DO i = 1, l
               work( i, j ) = b( m-l+i, j )
            END DO
         END DO
         CALL dtrmm( 'L', 'U', 'T', 'N', l, n, one, v( mp, 1 ), ldv,
     $               work, ldwork )
         CALL dgemm( 'T', 'N', l, n, m-l, one, v, ldv, b, ldb,
     $               one, work, ldwork )
         CALL dgemm( 'T', 'N', k-l, n, m, one, v( 1, kp ), ldv,
     $               b, ldb, zero, work( kp, 1 ), ldwork )
*
*        WORK := op(T) (A + WORK),  A := A - WORK
*
         DO j = 1, n
            DO i = 1, k
               work( i, j ) = work( i, j ) + a( i, j )
            END DO
         END DO
*
         CALL dtrmm( 'L', 'U', trans, 'N', k, n, one, t, ldt,
     $               work, ldwork )
*
         DO j = 1, n
            DO i = 1, k
               a( i, j ) = a( i, j ) - work( i, j )
            END DO
         END DO
*
*        B := B - V WORK
*
         CALL dgemm( 'N', 'N', m-l, n, k, -one, v, ldv, work, ldwork,
     $               one, b, ldb )
         CALL dgemm( 'N', 'N', l, n, k-l, -one, v( mp, kp ), ldv,
     $               work( kp, 1 ), ldwork, one, b( mp, 1 ),  ldb )
         CALL dtrmm( 'L', 'U', 'N', 'N', l, n, one, v( mp, 1 ), ldv,
     $               work, ldwork )
         DO j = 1, n
            DO i = 1, l
               b( m-l+i, j ) = b( m-l+i, j ) - work( i, j )
            END DO
         END DO
*
* ---------------------------------------------------------------------------
*
      ELSE IF( column .AND. forward .AND. right ) THEN
*
* ---------------------------------------------------------------------------
*
*        Let  W =  [ I ]    (K-by-K)
*                  [ V ]    (N-by-K)
*
*        Form  C H or  C H**T  where  C = [ A B ] (A is M-by-K, B is M-by-N)
*
*        H = I - W T W**T          or  H**T = I - W T**T W**T
*
*        A = A - (A + B V) T      or  A = A - (A + B V) T**T
*        B = B - (A + B V) T V**T  or  B = B - (A + B V) T**T V**T
*
* ---------------------------------------------------------------------------
*
         np = min( n-l+1, n )
         kp = min( l+1, k )
*
*        WORK := B V  (last L columns of B go through the triangle)
*
         DO j = 1, l
            DO i = 1, m
               work( i, j ) = b( i, n-l+j )
            END DO
         END DO
         CALL dtrmm( 'R', 'U', 'N', 'N', m, l, one, v( np, 1 ), ldv,
     $               work, ldwork )
         CALL dgemm( 'N', 'N', m, l, n-l, one, b, ldb,
     $               v, ldv, one, work, ldwork )
         CALL dgemm( 'N', 'N', m, k-l, n, one, b, ldb,
     $               v( 1, kp ), ldv, zero, work( 1, kp ), ldwork )
*
*        WORK := (A + WORK) op(T),  A := A - WORK
*
         DO j = 1, k
            DO i = 1, m
               work( i, j ) = work( i, j ) + a( i, j )
            END DO
         END DO
*
         CALL dtrmm( 'R', 'U', trans, 'N', m, k, one, t, ldt,
     $               work, ldwork )
*
         DO j = 1, k
            DO i = 1, m
               a( i, j ) = a( i, j ) - work( i, j )
            END DO
         END DO
*
*        B := B - WORK V**T
*
         CALL dgemm( 'N', 'T', m, n-l, k, -one, work, ldwork,
     $               v, ldv, one, b, ldb )
         CALL dgemm( 'N', 'T', m, l, k-l, -one, work( 1, kp ), ldwork,
     $               v( np, kp ), ldv, one, b( 1, np ), ldb )
         CALL dtrmm( 'R', 'U', 'T', 'N', m, l, one, v( np, 1 ), ldv,
     $               work, ldwork )
         DO j = 1, l
            DO i = 1, m
               b( i, n-l+j ) = b( i, n-l+j ) - work( i, j )
            END DO
         END DO
*
* ---------------------------------------------------------------------------
*
      ELSE IF( column .AND. backward .AND. left ) THEN
*
* ---------------------------------------------------------------------------
*
*        Let  W =  [ V ]    (M-by-K)
*                  [ I ]    (K-by-K)
*
*        Form  H C  or  H**T C  where  C = [ B ]  (M-by-N)
*                                          [ A ]  (K-by-N)
*
*        H = I - W T W**T          or  H**T = I - W T**T W**T
*
*        A = A -   T (A + V**T B)  or  A = A -   T**T (A + V**T B)
*        B = B - V T (A + V**T B)  or  B = B - V T**T (A + V**T B)
*
* ---------------------------------------------------------------------------
*
         mp = min( l+1, m )
         kp = min( k-l+1, k )
*
*        WORK := V**T B  (first L rows of B go through the triangle)
*
         DO j = 1, n
            DO i = 1, l
               work( k-l+i, j ) = b( i, j )
            END DO
         END DO
*
         CALL dtrmm( 'L', 'L', 'T', 'N', l, n, one, v( 1, kp ), ldv,
     $               work( kp, 1 ), ldwork )
         CALL dgemm( 'T', 'N', l, n, m-l, one, v( mp, kp ), ldv,
     $               b( mp, 1 ), ldb, one, work( kp, 1 ), ldwork )
         CALL dgemm( 'T', 'N', k-l, n, m, one, v, ldv,
     $               b, ldb, zero, work, ldwork )
*
*        WORK := op(T) (A + WORK),  A := A - WORK
*
         DO j = 1, n
            DO i = 1, k
               work( i, j ) = work( i, j ) + a( i, j )
            END DO
         END DO
*
         CALL dtrmm( 'L', 'L', trans, 'N', k, n, one, t, ldt,
     $               work, ldwork )
*
         DO j = 1, n
            DO i = 1, k
               a( i, j ) = a( i, j ) - work( i, j )
            END DO
         END DO
*
*        B := B - V WORK
*
         CALL dgemm( 'N', 'N', m-l, n, k, -one, v( mp, 1 ), ldv,
     $               work, ldwork, one, b( mp, 1 ), ldb )
         CALL dgemm( 'N', 'N', l, n, k-l, -one, v, ldv,
     $               work, ldwork, one, b,  ldb )
         CALL dtrmm( 'L', 'L', 'N', 'N', l, n, one, v( 1, kp ), ldv,
     $               work( kp, 1 ), ldwork )
         DO j = 1, n
            DO i = 1, l
               b( i, j ) = b( i, j ) - work( k-l+i, j )
            END DO
         END DO
*
* ---------------------------------------------------------------------------
*
      ELSE IF( column .AND. backward .AND. right ) THEN
*
* ---------------------------------------------------------------------------
*
*        Let  W =  [ V ]    (N-by-K)
*                  [ I ]    (K-by-K)
*
*        Form  C H  or  C H**T  where  C = [ B A ] (B is M-by-N, A is M-by-K)
*
*        H = I - W T W**T          or  H**T = I - W T**T W**T
*
*        A = A - (A + B V) T      or  A = A - (A + B V) T**T
*        B = B - (A + B V) T V**T  or  B = B - (A + B V) T**T V**T
*
* ---------------------------------------------------------------------------
*
         np = min( l+1, n )
         kp = min( k-l+1, k )
*
*        WORK := B V  (first L columns of B go through the triangle)
*
         DO j = 1, l
            DO i = 1, m
               work( i, k-l+j ) = b( i, j )
            END DO
         END DO
         CALL dtrmm( 'R', 'L', 'N', 'N', m, l, one, v( 1, kp ), ldv,
     $               work( 1, kp ), ldwork )
         CALL dgemm( 'N', 'N', m, l, n-l, one, b( 1, np ), ldb,
     $               v( np, kp ), ldv, one, work( 1, kp ), ldwork )
         CALL dgemm( 'N', 'N', m, k-l, n, one, b, ldb,
     $               v, ldv, zero, work, ldwork )
*
*        WORK := (A + WORK) op(T),  A := A - WORK
*
         DO j = 1, k
            DO i = 1, m
               work( i, j ) = work( i, j ) + a( i, j )
            END DO
         END DO
*
         CALL dtrmm( 'R', 'L', trans, 'N', m, k, one, t, ldt,
     $               work, ldwork )
*
         DO j = 1, k
            DO i = 1, m
               a( i, j ) = a( i, j ) - work( i, j )
            END DO
         END DO
*
*        B := B - WORK V**T
*
         CALL dgemm( 'N', 'T', m, n-l, k, -one, work, ldwork,
     $               v( np, 1 ), ldv, one, b( 1, np ), ldb )
         CALL dgemm( 'N', 'T', m, l, k-l, -one, work, ldwork,
     $               v, ldv, one, b, ldb )
         CALL dtrmm( 'R', 'L', 'T', 'N', m, l, one, v( 1, kp ), ldv,
     $               work( 1, kp ), ldwork )
         DO j = 1, l
            DO i = 1, m
               b( i, j ) = b( i, j ) - work( i, k-l+j )
            END DO
         END DO
*
* ---------------------------------------------------------------------------
*
      ELSE IF( row .AND. forward .AND. left ) THEN
*
* ---------------------------------------------------------------------------
*
*        Let  W =  [ I V ] ( I is K-by-K, V is K-by-M )
*
*        Form  H C  or  H**T C  where  C = [ A ]  (K-by-N)
*                                          [ B ]  (M-by-N)
*
*        H = I - W**T T W          or  H**T = I - W**T T**T W
*
*        A = A -     T (A + V B)  or  A = A -     T**T (A + V B)
*        B = B - V**T T (A + V B)  or  B = B - V**T T**T (A + V B)
*
* ---------------------------------------------------------------------------
*
         mp = min( m-l+1, m )
         kp = min( l+1, k )
*
*        WORK := V B  (last L rows of B go through the triangle)
*
         DO j = 1, n
            DO i = 1, l
               work( i, j ) = b( m-l+i, j )
            END DO
         END DO
*
*        The matrix updated here is WORK, so its leading dimension
*        is LDWORK (not LDB): LDB describes B, and the two differ
*        in general.
*
         CALL dtrmm( 'L', 'L', 'N', 'N', l, n, one, v( 1, mp ), ldv,
     $               work, ldwork )
         CALL dgemm( 'N', 'N', l, n, m-l, one, v, ldv,b, ldb,
     $               one, work, ldwork )
         CALL dgemm( 'N', 'N', k-l, n, m, one, v( kp, 1 ), ldv,
     $               b, ldb, zero, work( kp, 1 ), ldwork )
*
*        WORK := op(T) (A + WORK),  A := A - WORK
*
         DO j = 1, n
            DO i = 1, k
               work( i, j ) = work( i, j ) + a( i, j )
            END DO
         END DO
*
         CALL dtrmm( 'L', 'U', trans, 'N', k, n, one, t, ldt,
     $               work, ldwork )
*
         DO j = 1, n
            DO i = 1, k
               a( i, j ) = a( i, j ) - work( i, j )
            END DO
         END DO
*
*        B := B - V**T WORK
*
         CALL dgemm( 'T', 'N', m-l, n, k, -one, v, ldv, work, ldwork,
     $               one, b, ldb )
         CALL dgemm( 'T', 'N', l, n, k-l, -one, v( kp, mp ), ldv,
     $               work( kp, 1 ), ldwork, one, b( mp, 1 ), ldb )
         CALL dtrmm( 'L', 'L', 'T', 'N', l, n, one, v( 1, mp ), ldv,
     $               work, ldwork )
         DO j = 1, n
            DO i = 1, l
               b( m-l+i, j ) = b( m-l+i, j ) - work( i, j )
            END DO
         END DO
*
* ---------------------------------------------------------------------------
*
      ELSE IF( row .AND. forward .AND. right ) THEN
*
* ---------------------------------------------------------------------------
*
*        Let  W =  [ I V ] ( I is K-by-K, V is K-by-N )
*
*        Form  C H  or  C H**T  where  C = [ A B ] (A is M-by-K, B is M-by-N)
*
*        H = I - W**T T W            or  H**T = I - W**T T**T W
*
*        A = A - (A + B V**T) T      or  A = A - (A + B V**T) T**T
*        B = B - (A + B V**T) T V    or  B = B - (A + B V**T) T**T V
*
* ---------------------------------------------------------------------------
*
         np = min( n-l+1, n )
         kp = min( l+1, k )
*
*        WORK := B V**T  (last L columns of B go through the triangle)
*
         DO j = 1, l
            DO i = 1, m
               work( i, j ) = b( i, n-l+j )
            END DO
         END DO
         CALL dtrmm( 'R', 'L', 'T', 'N', m, l, one, v( 1, np ), ldv,
     $               work, ldwork )
         CALL dgemm( 'N', 'T', m, l, n-l, one, b, ldb, v, ldv,
     $               one, work, ldwork )
         CALL dgemm( 'N', 'T', m, k-l, n, one, b, ldb,
     $               v( kp, 1 ), ldv, zero, work( 1, kp ), ldwork )
*
*        WORK := (A + WORK) op(T),  A := A - WORK
*
         DO j = 1, k
            DO i = 1, m
               work( i, j ) = work( i, j ) + a( i, j )
            END DO
         END DO
*
         CALL dtrmm( 'R', 'U', trans, 'N', m, k, one, t, ldt,
     $               work, ldwork )
*
         DO j = 1, k
            DO i = 1, m
               a( i, j ) = a( i, j ) - work( i, j )
            END DO
         END DO
*
*        B := B - WORK V
*
         CALL dgemm( 'N', 'N', m, n-l, k, -one, work, ldwork,
     $               v, ldv, one, b, ldb )
         CALL dgemm( 'N', 'N', m, l, k-l, -one, work( 1, kp ), ldwork,
     $               v( kp, np ), ldv, one, b( 1, np ), ldb )
         CALL dtrmm( 'R', 'L', 'N', 'N', m, l, one, v( 1, np ), ldv,
     $               work, ldwork )
         DO j = 1, l
            DO i = 1, m
               b( i, n-l+j ) = b( i, n-l+j ) - work( i, j )
            END DO
         END DO
*
* ---------------------------------------------------------------------------
*
      ELSE IF( row .AND. backward .AND. left ) THEN
*
* ---------------------------------------------------------------------------
*
*        Let  W =  [ V I ] ( I is K-by-K, V is K-by-M )
*
*        Form  H C  or  H**T C  where  C = [ B ]  (M-by-N)
*                                          [ A ]  (K-by-N)
*
*        H = I - W**T T W          or  H**T = I - W**T T**T W
*
*        A = A -     T (A + V B)  or  A = A -     T**T (A + V B)
*        B = B - V**T T (A + V B)  or  B = B - V**T T**T (A + V B)
*
* ---------------------------------------------------------------------------
*
         mp = min( l+1, m )
         kp = min( k-l+1, k )
*
*        WORK := V B  (first L rows of B go through the triangle)
*
         DO j = 1, n
            DO i = 1, l
               work( k-l+i, j ) = b( i, j )
            END DO
         END DO
         CALL dtrmm( 'L', 'U', 'N', 'N', l, n, one, v( kp, 1 ), ldv,
     $               work( kp, 1 ), ldwork )
         CALL dgemm( 'N', 'N', l, n, m-l, one, v( kp, mp ), ldv,
     $               b( mp, 1 ), ldb, one, work( kp, 1 ), ldwork )
         CALL dgemm( 'N', 'N', k-l, n, m, one, v, ldv, b, ldb,
     $               zero, work, ldwork )
*
*        WORK := op(T) (A + WORK),  A := A - WORK
*
         DO j = 1, n
            DO i = 1, k
               work( i, j ) = work( i, j ) + a( i, j )
            END DO
         END DO
*
         CALL dtrmm( 'L', 'L', trans, 'N', k, n, one, t, ldt,
     $               work, ldwork )
*
         DO j = 1, n
            DO i = 1, k
               a( i, j ) = a( i, j ) - work( i, j )
            END DO
         END DO
*
*        B := B - V**T WORK
*
         CALL dgemm( 'T', 'N', m-l, n, k, -one, v( 1, mp ), ldv,
     $               work, ldwork, one, b( mp, 1 ), ldb )
         CALL dgemm( 'T', 'N', l, n, k-l, -one, v, ldv,
     $               work, ldwork, one, b, ldb )
         CALL dtrmm( 'L', 'U', 'T', 'N', l, n, one, v( kp, 1 ), ldv,
     $               work( kp, 1 ), ldwork )
         DO j = 1, n
            DO i = 1, l
               b( i, j ) = b( i, j ) - work( k-l+i, j )
            END DO
         END DO
*
* ---------------------------------------------------------------------------
*
      ELSE IF( row .AND. backward .AND. right ) THEN
*
* ---------------------------------------------------------------------------
*
*        Let  W =  [ V I ] ( I is K-by-K, V is K-by-N )
*
*        Form  C H  or  C H**T  where  C = [ B A ] (A is M-by-K, B is M-by-N)
*
*        H = I - W**T T W            or  H**T = I - W**T T**T W
*
*        A = A - (A + B V**T) T      or  A = A - (A + B V**T) T**T
*        B = B - (A + B V**T) T V    or  B = B - (A + B V**T) T**T V
*
* ---------------------------------------------------------------------------
*
         np = min( l+1, n )
         kp = min( k-l+1, k )
*
*        WORK := B V**T  (first L columns of B go through the triangle)
*
         DO j = 1, l
            DO i = 1, m
               work( i, k-l+j ) = b( i, j )
            END DO
         END DO
         CALL dtrmm( 'R', 'U', 'T', 'N', m, l, one, v( kp, 1 ), ldv,
     $               work( 1, kp ), ldwork )
         CALL dgemm( 'N', 'T', m, l, n-l, one, b( 1, np ), ldb,
     $               v( kp, np ), ldv, one, work( 1, kp ), ldwork )
         CALL dgemm( 'N', 'T', m, k-l, n, one, b, ldb, v, ldv,
     $               zero, work, ldwork )
*
*        WORK := (A + WORK) op(T),  A := A - WORK
*
         DO j = 1, k
            DO i = 1, m
               work( i, j ) = work( i, j ) + a( i, j )
            END DO
         END DO
*
         CALL dtrmm( 'R', 'L', trans, 'N', m, k, one, t, ldt,
     $               work, ldwork )
*
         DO j = 1, k
            DO i = 1, m
               a( i, j ) = a( i, j ) - work( i, j )
            END DO
         END DO
*
*        B := B - WORK V
*
         CALL dgemm( 'N', 'N', m, n-l, k, -one, work, ldwork,
     $               v( 1, np ), ldv, one, b( 1, np ), ldb )
         CALL dgemm( 'N', 'N', m, l, k-l , -one, work, ldwork,
     $               v, ldv, one, b, ldb )
         CALL dtrmm( 'R', 'U', 'N', 'N', m, l, one, v( kp, 1 ), ldv,
     $               work( 1, kp ), ldwork )
         DO j = 1, l
            DO i = 1, m
               b( i, j ) = b( i, j ) - work( i, k-l+j )
            END DO
         END DO
*
      END IF
*
      RETURN
*
*     End of DTPRFB
*

◆ slatrd()

subroutine slatrd	(	character	uplo,
		integer	n,
		integer	nb,
		real, dimension( lda, * )	a,
		integer	lda,
		real, dimension( * )	e,
		real, dimension( * )	tau,
		real, dimension( ldw, * )	w,
		integer	ldw )

SLATRD reduces the first nb rows and columns of a symmetric/Hermitian matrix A to real tridiagonal form by an orthogonal similarity transformation.

Download SLATRD + dependencies [TGZ] [ZIP] [TXT]

Purpose:

!>
!> SLATRD reduces NB rows and columns of a real symmetric matrix A to
!> symmetric tridiagonal form by an orthogonal similarity
!> transformation Q**T * A * Q, and returns the matrices V and W which are
!> needed to apply the transformation to the unreduced part of A.
!>
!> If UPLO = 'U', SLATRD reduces the last NB rows and columns of a
!> matrix, of which the upper triangle is supplied;
!> if UPLO = 'L', SLATRD reduces the first NB rows and columns of a
!> matrix, of which the lower triangle is supplied.
!>
!> This is an auxiliary routine called by SSYTRD.
!>

Parameters

[in]	UPLO	!> UPLO is CHARACTER*1 !> Specifies whether the upper or lower triangular part of the !> symmetric matrix A is stored: !> = 'U': Upper triangular !> = 'L': Lower triangular !>
[in]	N	!> N is INTEGER !> The order of the matrix A. !>
[in]	NB	!> NB is INTEGER !> The number of rows and columns to be reduced. !>
[in,out]	A	!> A is REAL array, dimension (LDA,N) !> On entry, the symmetric matrix A. If UPLO = 'U', the leading !> n-by-n upper triangular part of A contains the upper !> triangular part of the matrix A, and the strictly lower !> triangular part of A is not referenced. If UPLO = 'L', the !> leading n-by-n lower triangular part of A contains the lower !> triangular part of the matrix A, and the strictly upper !> triangular part of A is not referenced. !> On exit: !> if UPLO = 'U', the last NB columns have been reduced to !> tridiagonal form, with the diagonal elements overwriting !> the diagonal elements of A; the elements above the diagonal !> with the array TAU, represent the orthogonal matrix Q as a !> product of elementary reflectors; !> if UPLO = 'L', the first NB columns have been reduced to !> tridiagonal form, with the diagonal elements overwriting !> the diagonal elements of A; the elements below the diagonal !> with the array TAU, represent the orthogonal matrix Q as a !> product of elementary reflectors. !> See Further Details. !>
[in]	LDA	!> LDA is INTEGER !> The leading dimension of the array A. LDA >= max(1,N). !>
[out]	E	!> E is REAL array, dimension (N-1) !> If UPLO = 'U', E(n-nb:n-1) contains the superdiagonal !> elements of the last NB columns of the reduced matrix; !> if UPLO = 'L', E(1:nb) contains the subdiagonal elements of !> the first NB columns of the reduced matrix. !>
[out]	TAU	!> TAU is REAL array, dimension (N-1) !> The scalar factors of the elementary reflectors, stored in !> TAU(n-nb:n-1) if UPLO = 'U', and in TAU(1:nb) if UPLO = 'L'. !> See Further Details. !>
[out]	W	!> W is REAL array, dimension (LDW,NB) !> The n-by-nb matrix W required to update the unreduced part !> of A. !>
[in]	LDW	!> LDW is INTEGER !> The leading dimension of the array W. LDW >= max(1,N). !>

Author: Univ. of Tennessee; Univ. of California Berkeley; Univ. of Colorado Denver; NAG Ltd.

Further Details:

!>
!>  If UPLO = 'U', the matrix Q is represented as a product of elementary
!>  reflectors
!>
!>     Q = H(n) H(n-1) . . . H(n-nb+1).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - tau * v * v**T
!>
!>  where tau is a real scalar, and v is a real vector with
!>  v(i:n) = 0 and v(i-1) = 1; v(1:i-1) is stored on exit in A(1:i-1,i),
!>  and tau in TAU(i-1).
!>
!>  If UPLO = 'L', the matrix Q is represented as a product of elementary
!>  reflectors
!>
!>     Q = H(1) H(2) . . . H(nb).
!>
!>  Each H(i) has the form
!>
!>     H(i) = I - tau * v * v**T
!>
!>  where tau is a real scalar, and v is a real vector with
!>  v(1:i) = 0 and v(i+1) = 1; v(i+1:n) is stored on exit in A(i+1:n,i),
!>  and tau in TAU(i).
!>
!>  The elements of the vectors v together form the n-by-nb matrix V
!>  which is needed, with W, to apply the transformation to the unreduced
!>  part of the matrix, using a symmetric rank-2k update of the form:
!>  A := A - V*W**T - W*V**T.
!>
!>  The contents of A on exit are illustrated by the following examples
!>  with n = 5 and nb = 2:
!>
!>  if UPLO = 'U':                       if UPLO = 'L':
!>
!>    (  a   a   a   v4  v5 )              (  d                  )
!>    (      a   a   v4  v5 )              (  1   d              )
!>    (          a   1   v5 )              (  v1  1   a          )
!>    (              d   1  )              (  v1  v2  a   a      )
!>    (                  d  )              (  v1  v2  a   a   a  )
!>
!>  where d denotes a diagonal element of the reduced matrix, a denotes
!>  an element of the original matrix that is unchanged, and vi denotes
!>  an element of the vector defining H(i).
!>

Definition at line 197 of file slatrd.f.

*
*  -- LAPACK auxiliary routine --
*  -- LAPACK is a software package provided by Univ. of Tennessee,    --
*  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
*
*  Body of SLATRD: reduces NB rows and columns of the real symmetric
*  matrix A to tridiagonal form, one column per loop iteration, and
*  builds the matrix W used together with the reflector vectors
*  stored in A to update the unreduced part of A.
*
*  UPLO = 'U' processes the last NB columns using the upper
*  triangle; any other value of UPLO takes the ELSE branch, which
*  processes the first NB columns using the lower triangle.
*  Off-diagonal entries are returned in E and reflector scalars in
*  TAU.
*
*     .. Scalar Arguments ..
      CHARACTER          UPLO
      INTEGER            LDA, LDW, N, NB
*     ..
*     .. Array Arguments ..
      REAL               A( LDA, * ), E( * ), TAU( * ), W( LDW, * )
*     ..
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE, HALF
      parameter( zero = 0.0e+0, one = 1.0e+0, half = 0.5e+0 )
*     ..
*     .. Local Scalars ..
*     I     : column of A currently being reduced.
*     IW    : column of W paired with column I (upper case only).
*     ALPHA : scalar of the final AXPY correction applied to W.
      INTEGER            I, IW
      REAL               ALPHA
*     ..
*     .. External Subroutines ..
      EXTERNAL           saxpy, sgemv, slarfg, sscal, ssymv
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               SDOT
      EXTERNAL           lsame, sdot
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          min
*     ..
*     .. Executable Statements ..
*
*     Quick return if possible
*
      IF( n.LE.0 )
     $   RETURN
*
      IF( lsame( uplo, 'U' ) ) THEN
*
*        Reduce last NB columns of upper triangle
*
         DO 10 i = n, n - nb + 1, -1
*
*           Column I of A is paired with column IW of W; I = N maps
*           to IW = NB and I = N-NB+1 maps to IW = 1.
*
            iw = i - n + nb
            IF( i.LT.n ) THEN
*
*              Update A(1:i,i)
*
*              A(1:i,i) := A(1:i,i)
*                          - A(1:i,i+1:n) * W(i,iw+1:nb)**T
*                          - W(1:i,iw+1:nb) * A(i,i+1:n)**T
*              (row I of W and of A is read with stride LDW / LDA).
*
               CALL sgemv( 'No transpose', i, n-i, -one, a( 1, i+1 ),
     $                     lda, w( i, iw+1 ), ldw, one, a( 1, i ), 1 )
               CALL sgemv( 'No transpose', i, n-i, -one, w( 1, iw+1 ),
     $                     ldw, a( i, i+1 ), lda, one, a( 1, i ), 1 )
            END IF
            IF( i.GT.1 ) THEN
*
*              Generate elementary reflector H(i) to annihilate
*              A(1:i-2,i)
*
*              The value SLARFG leaves in A(i-1,i) is saved in E(i-1);
*              the entry is then set to one so that A(1:i-1,i) can be
*              passed directly as the vector v in the calls below.
*
               CALL slarfg( i-1, a( i-1, i ), a( 1, i ), 1, tau( i-1 ) )
               e( i-1 ) = a( i-1, i )
               a( i-1, i ) = one
*
*              Compute W(1:i-1,i)
*
*              Start from W(1:i-1,iw) := A(1:i-1,1:i-1) * v.
*
               CALL ssymv( 'Upper', i-1, one, a, lda, a( 1, i ), 1,
     $                     zero, w( 1, iw ), 1 )
               IF( i.LT.n ) THEN
*
*                 Subtract the contributions of columns i+1:n.
*                 W(i+1:n,iw) serves as a scratch vector of length
*                 n-i: each 'Transpose' call overwrites it and the
*                 following 'No transpose' call consumes it, so the
*                 order of these four calls must be kept.
*
                  CALL sgemv( 'Transpose', i-1, n-i, one, w( 1, iw+1 ),
     $                        ldw, a( 1, i ), 1, zero, w( i+1, iw ), 1 )
                  CALL sgemv( 'No transpose', i-1, n-i, -one,
     $                        a( 1, i+1 ), lda, w( i+1, iw ), 1, one,
     $                        w( 1, iw ), 1 )
                  CALL sgemv( 'Transpose', i-1, n-i, one, a( 1, i+1 ),
     $                        lda, a( 1, i ), 1, zero, w( i+1, iw ), 1 )
                  CALL sgemv( 'No transpose', i-1, n-i, -one,
     $                        w( 1, iw+1 ), ldw, w( i+1, iw ), 1, one,
     $                        w( 1, iw ), 1 )
               END IF
*
*              w := tau*w, then w := w - (tau/2)*(w**T v)*v.
*
               CALL sscal( i-1, tau( i-1 ), w( 1, iw ), 1 )
               alpha = -half*tau( i-1 )*sdot( i-1, w( 1, iw ), 1,
     $                 a( 1, i ), 1 )
               CALL saxpy( i-1, alpha, a( 1, i ), 1, w( 1, iw ), 1 )
            END IF
*
   10    CONTINUE
      ELSE
*
*        Reduce first NB columns of lower triangle
*
         DO 20 i = 1, nb
*
*           Update A(i:n,i)
*
*           A(i:n,i) := A(i:n,i) - A(i:n,1:i-1) * W(i,1:i-1)**T
*                                - W(i:n,1:i-1) * A(i,1:i-1)**T
*           (the column count i-1 is zero on the first iteration).
*
            CALL sgemv( 'No transpose', n-i+1, i-1, -one, a( i, 1 ),
     $                  lda, w( i, 1 ), ldw, one, a( i, i ), 1 )
            CALL sgemv( 'No transpose', n-i+1, i-1, -one, w( i, 1 ),
     $                  ldw, a( i, 1 ), lda, one, a( i, i ), 1 )
            IF( i.LT.n ) THEN
*
*              Generate elementary reflector H(i) to annihilate
*              A(i+2:n,i)
*
*              MIN( i+2, n ) keeps the row index inside 1:n when
*              i = n-1.  The value left in A(i+1,i) is saved in E(i)
*              and the entry is set to one so that A(i+1:n,i) can be
*              passed directly as the vector v below.
*
               CALL slarfg( n-i, a( i+1, i ), a( min( i+2, n ), i ), 1,
     $                      tau( i ) )
               e( i ) = a( i+1, i )
               a( i+1, i ) = one
*
*              Compute W(i+1:n,i)
*
*              Start from W(i+1:n,i) := A(i+1:n,i+1:n) * v, then
*              subtract the contributions of columns 1:i-1.
*              W(1:i-1,i) serves as a scratch vector: each
*              'Transpose' call overwrites it and the following
*              'No transpose' call consumes it, so the order of
*              these calls must be kept.
*
               CALL ssymv( 'Lower', n-i, one, a( i+1, i+1 ), lda,
     $                     a( i+1, i ), 1, zero, w( i+1, i ), 1 )
               CALL sgemv( 'Transpose', n-i, i-1, one, w( i+1, 1 ), ldw,
     $                     a( i+1, i ), 1, zero, w( 1, i ), 1 )
               CALL sgemv( 'No transpose', n-i, i-1, -one, a( i+1, 1 ),
     $                     lda, w( 1, i ), 1, one, w( i+1, i ), 1 )
               CALL sgemv( 'Transpose', n-i, i-1, one, a( i+1, 1 ), lda,
     $                     a( i+1, i ), 1, zero, w( 1, i ), 1 )
               CALL sgemv( 'No transpose', n-i, i-1, -one, w( i+1, 1 ),
     $                     ldw, w( 1, i ), 1, one, w( i+1, i ), 1 )
*
*              w := tau*w, then w := w - (tau/2)*(w**T v)*v.
*
               CALL sscal( n-i, tau( i ), w( i+1, i ), 1 )
               alpha = -half*tau( i )*sdot( n-i, w( i+1, i ), 1,
     $                 a( i+1, i ), 1 )
               CALL saxpy( n-i, alpha, a( i+1, i ), 1, w( i+1, i ), 1 )
            END IF
*
   20    CONTINUE
      END IF
*
      RETURN
*
*     End of SLATRD
*

OpenRadioss 2025.1.11 OpenRadioss project