342 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			342 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/* dsytrf.f -- translated by f2c (version 20061008).
   You must link the resulting object file with libf2c:
	on Microsoft Windows systems, link with libf2c.lib;
	on Linux or Unix systems, link with .../path/to/libf2c.a -lm
	or, if you install libf2c.a in a standard place, with -lf2c -lm
	-- in that order, at the end of the command line, as in
		cc *.o -lf2c -lm
	Source for libf2c is in /netlib/f2c/libf2c.zip, e.g.,

		http://www.netlib.org/f2c/libf2c.zip
*/
 | |
| 
 | |
| #include "clapack.h"
 | |
| 
 | |
| 
 | |
| /* Table of constant values.  These file-scope integers exist so that */ /* literal arguments can be passed by address to ilaenv_ in dsytrf_.   */
 | |
| 
 | |
| static integer c__1 = 1; /* first argument of the ilaenv_ call that determines the block size nb */
 | |
| static integer c_n1 = -1; /* passed for each of the last three ilaenv_ arguments */
 | |
| static integer c__2 = 2; /* first argument of the ilaenv_ call whose result is used as a lower bound for nbmin */
 | |
| 
 | |
| /* Subroutine */ int dsytrf_(char *uplo, integer *n, doublereal *a, integer *
 | |
| 	lda, integer *ipiv, doublereal *work, integer *lwork, integer *info)
 | |
| {
 | |
|     /* System generated locals */
 | |
|     integer a_dim1, a_offset, i__1, i__2;
 | |
| 
 | |
|     /* Local variables */
 | |
|     integer j, k, kb, nb, iws;
 | |
|     extern logical lsame_(char *, char *);
 | |
|     integer nbmin, iinfo;
 | |
|     logical upper;
 | |
|     extern /* Subroutine */ int dsytf2_(char *, integer *, doublereal *, 
 | |
| 	    integer *, integer *, integer *), xerbla_(char *, integer 
 | |
| 	    *);
 | |
|     extern integer ilaenv_(integer *, char *, char *, integer *, integer *, 
 | |
| 	    integer *, integer *);
 | |
|     extern /* Subroutine */ int dlasyf_(char *, integer *, integer *, integer 
 | |
| 	    *, doublereal *, integer *, integer *, doublereal *, integer *, 
 | |
| 	    integer *);
 | |
|     integer ldwork, lwkopt;
 | |
|     logical lquery;
 | |
| 
 | |
| 
 | |
| /*  -- LAPACK routine (version 3.2) -- */
 | |
| /*     Univ. of Tennessee, Univ. of California Berkeley and NAG Ltd.. */
 | |
| /*     November 2006 */
 | |
| 
 | |
| /*     .. Scalar Arguments .. */
 | |
| /*     .. */
 | |
| /*     .. Array Arguments .. */
 | |
| /*     .. */
 | |
| 
 | |
| /*  Purpose */
 | |
| /*  ======= */
 | |
| 
 | |
| /*  DSYTRF computes the factorization of a real symmetric matrix A using */
 | |
| /*  the Bunch-Kaufman diagonal pivoting method.  The form of the */
 | |
| /*  factorization is */
 | |
| 
 | |
| /*     A = U*D*U**T  or  A = L*D*L**T */
 | |
| 
 | |
| /*  where U (or L) is a product of permutation and unit upper (lower) */
 | |
| /*  triangular matrices, and D is symmetric and block diagonal with */
 | |
| /*  1-by-1 and 2-by-2 diagonal blocks. */
 | |
| 
 | |
| /*  This is the blocked version of the algorithm, calling Level 3 BLAS. */
 | |
| 
 | |
| /*  Arguments */
 | |
| /*  ========= */
 | |
| 
 | |
| /*  UPLO    (input) CHARACTER*1 */
 | |
| /*          = 'U':  Upper triangle of A is stored; */
 | |
| /*          = 'L':  Lower triangle of A is stored. */
 | |
| 
 | |
| /*  N       (input) INTEGER */
 | |
| /*          The order of the matrix A.  N >= 0. */
 | |
| 
 | |
| /*  A       (input/output) DOUBLE PRECISION array, dimension (LDA,N) */
 | |
| /*          On entry, the symmetric matrix A.  If UPLO = 'U', the leading */
 | |
| /*          N-by-N upper triangular part of A contains the upper */
 | |
| /*          triangular part of the matrix A, and the strictly lower */
 | |
| /*          triangular part of A is not referenced.  If UPLO = 'L', the */
 | |
| /*          leading N-by-N lower triangular part of A contains the lower */
 | |
| /*          triangular part of the matrix A, and the strictly upper */
 | |
| /*          triangular part of A is not referenced. */
 | |
| 
 | |
| /*          On exit, the block diagonal matrix D and the multipliers used */
 | |
| /*          to obtain the factor U or L (see below for further details). */
 | |
| 
 | |
| /*  LDA     (input) INTEGER */
 | |
| /*          The leading dimension of the array A.  LDA >= max(1,N). */
 | |
| 
 | |
| /*  IPIV    (output) INTEGER array, dimension (N) */
 | |
| /*          Details of the interchanges and the block structure of D. */
 | |
| /*          If IPIV(k) > 0, then rows and columns k and IPIV(k) were */
 | |
| /*          interchanged and D(k,k) is a 1-by-1 diagonal block. */
 | |
| /*          If UPLO = 'U' and IPIV(k) = IPIV(k-1) < 0, then rows and */
 | |
| /*          columns k-1 and -IPIV(k) were interchanged and D(k-1:k,k-1:k) */
 | |
| /*          is a 2-by-2 diagonal block.  If UPLO = 'L' and IPIV(k) = */
 | |
| /*          IPIV(k+1) < 0, then rows and columns k+1 and -IPIV(k) were */
 | |
| /*          interchanged and D(k:k+1,k:k+1) is a 2-by-2 diagonal block. */
 | |
| 
 | |
| /*  WORK    (workspace/output) DOUBLE PRECISION array, dimension (MAX(1,LWORK)) */
 | |
| /*          On exit, if INFO = 0, WORK(1) returns the optimal LWORK. */
 | |
| 
 | |
| /*  LWORK   (input) INTEGER */
 | |
| /*          The length of WORK.  LWORK >=1.  For best performance */
 | |
| /*          LWORK >= N*NB, where NB is the block size returned by ILAENV. */
 | |
| 
 | |
| /*          If LWORK = -1, then a workspace query is assumed; the routine */
 | |
| /*          only calculates the optimal size of the WORK array, returns */
 | |
| /*          this value as the first entry of the WORK array, and no error */
 | |
| /*          message related to LWORK is issued by XERBLA. */
 | |
| 
 | |
| /*  INFO    (output) INTEGER */
 | |
| /*          = 0:  successful exit */
 | |
| /*          < 0:  if INFO = -i, the i-th argument had an illegal value */
 | |
| /*          > 0:  if INFO = i, D(i,i) is exactly zero.  The factorization */
 | |
| /*                has been completed, but the block diagonal matrix D is */
 | |
| /*                exactly singular, and division by zero will occur if it */
 | |
| /*                is used to solve a system of equations. */
 | |
| 
 | |
| /*  Further Details */
 | |
| /*  =============== */
 | |
| 
 | |
| /*  If UPLO = 'U', then A = U*D*U', where */
 | |
| /*     U = P(n)*U(n)* ... *P(k)U(k)* ..., */
 | |
| /*  i.e., U is a product of terms P(k)*U(k), where k decreases from n to */
 | |
| /*  1 in steps of 1 or 2, and D is a block diagonal matrix with 1-by-1 */
 | |
| /*  and 2-by-2 diagonal blocks D(k).  P(k) is a permutation matrix as */
 | |
| /*  defined by IPIV(k), and U(k) is a unit upper triangular matrix, such */
 | |
| /*  that if the diagonal block D(k) is of order s (s = 1 or 2), then */
 | |
| 
 | |
| /*             (   I    v    0   )   k-s */
 | |
| /*     U(k) =  (   0    I    0   )   s */
 | |
| /*             (   0    0    I   )   n-k */
 | |
| /*                k-s   s   n-k */
 | |
| 
 | |
| /*  If s = 1, D(k) overwrites A(k,k), and v overwrites A(1:k-1,k). */
 | |
| /*  If s = 2, the upper triangle of D(k) overwrites A(k-1,k-1), A(k-1,k), */
 | |
| /*  and A(k,k), and v overwrites A(1:k-2,k-1:k). */
 | |
| 
 | |
| /*  If UPLO = 'L', then A = L*D*L', where */
 | |
| /*     L = P(1)*L(1)* ... *P(k)*L(k)* ..., */
 | |
| /*  i.e., L is a product of terms P(k)*L(k), where k increases from 1 to */
 | |
| /*  n in steps of 1 or 2, and D is a block diagonal matrix with 1-by-1 */
 | |
| /*  and 2-by-2 diagonal blocks D(k).  P(k) is a permutation matrix as */
 | |
| /*  defined by IPIV(k), and L(k) is a unit lower triangular matrix, such */
 | |
| /*  that if the diagonal block D(k) is of order s (s = 1 or 2), then */
 | |
| 
 | |
| /*             (   I    0     0   )  k-1 */
 | |
| /*     L(k) =  (   0    I     0   )  s */
 | |
| /*             (   0    v     I   )  n-k-s+1 */
 | |
| /*                k-1   s  n-k-s+1 */
 | |
| 
 | |
| /*  If s = 1, D(k) overwrites A(k,k), and v overwrites A(k+1:n,k). */
 | |
| /*  If s = 2, the lower triangle of D(k) overwrites A(k,k), A(k+1,k), */
 | |
| /*  and A(k+1,k+1), and v overwrites A(k+2:n,k:k+1). */
 | |
| 
 | |
| /*  ===================================================================== */
 | |
| 
 | |
| /*     .. Local Scalars .. */
 | |
| /*     .. */
 | |
| /*     .. External Functions .. */
 | |
| /*     .. */
 | |
| /*     .. External Subroutines .. */
 | |
| /*     .. */
 | |
| /*     .. Intrinsic Functions .. */
 | |
| /*     .. */
 | |
| /*     .. Executable Statements .. */
 | |
| 
 | |
| /*     Test the input parameters. */
 | |
| 
 | |
|     /* Parameter adjustments */
 | |
|     a_dim1 = *lda;
 | |
|     a_offset = 1 + a_dim1;
 | |
|     a -= a_offset;
 | |
|     --ipiv;
 | |
|     --work;
 | |
| 
 | |
|     /* Function Body */
 | |
|     *info = 0;
 | |
|     upper = lsame_(uplo, "U");
 | |
|     lquery = *lwork == -1;
 | |
|     if (! upper && ! lsame_(uplo, "L")) {
 | |
| 	*info = -1;
 | |
|     } else if (*n < 0) {
 | |
| 	*info = -2;
 | |
|     } else if (*lda < max(1,*n)) {
 | |
| 	*info = -4;
 | |
|     } else if (*lwork < 1 && ! lquery) {
 | |
| 	*info = -7;
 | |
|     }
 | |
| 
 | |
|     if (*info == 0) {
 | |
| 
 | |
| /*        Determine the block size */
 | |
| 
 | |
| 	nb = ilaenv_(&c__1, "DSYTRF", uplo, n, &c_n1, &c_n1, &c_n1);
 | |
| 	lwkopt = *n * nb;
 | |
| 	work[1] = (doublereal) lwkopt;
 | |
|     }
 | |
| 
 | |
|     if (*info != 0) {
 | |
| 	i__1 = -(*info);
 | |
| 	xerbla_("DSYTRF", &i__1);
 | |
| 	return 0;
 | |
|     } else if (lquery) {
 | |
| 	return 0;
 | |
|     }
 | |
| 
 | |
|     nbmin = 2;
 | |
|     ldwork = *n;
 | |
|     if (nb > 1 && nb < *n) {
 | |
| 	iws = ldwork * nb;
 | |
| 	if (*lwork < iws) {
 | |
| /* Computing MAX */
 | |
| 	    i__1 = *lwork / ldwork;
 | |
| 	    nb = max(i__1,1);
 | |
| /* Computing MAX */
 | |
| 	    i__1 = 2, i__2 = ilaenv_(&c__2, "DSYTRF", uplo, n, &c_n1, &c_n1, &
 | |
| 		    c_n1);
 | |
| 	    nbmin = max(i__1,i__2);
 | |
| 	}
 | |
|     } else {
 | |
| 	iws = 1;
 | |
|     }
 | |
|     if (nb < nbmin) {
 | |
| 	nb = *n;
 | |
|     }
 | |
| 
 | |
|     if (upper) {
 | |
| 
 | |
| /*        Factorize A as U*D*U' using the upper triangle of A */
 | |
| 
 | |
| /*        K is the main loop index, decreasing from N to 1 in steps of */
 | |
| /*        KB, where KB is the number of columns factorized by DLASYF; */
 | |
| /*        KB is either NB or NB-1, or K for the last block */
 | |
| 
 | |
| 	k = *n;
 | |
| L10:
 | |
| 
 | |
| /*        If K < 1, exit from loop */
 | |
| 
 | |
| 	if (k < 1) {
 | |
| 	    goto L40;
 | |
| 	}
 | |
| 
 | |
| 	if (k > nb) {
 | |
| 
 | |
| /*           Factorize columns k-kb+1:k of A and use blocked code to */
 | |
| /*           update columns 1:k-kb */
 | |
| 
 | |
| 	    dlasyf_(uplo, &k, &nb, &kb, &a[a_offset], lda, &ipiv[1], &work[1], 
 | |
| 		     &ldwork, &iinfo);
 | |
| 	} else {
 | |
| 
 | |
| /*           Use unblocked code to factorize columns 1:k of A */
 | |
| 
 | |
| 	    dsytf2_(uplo, &k, &a[a_offset], lda, &ipiv[1], &iinfo);
 | |
| 	    kb = k;
 | |
| 	}
 | |
| 
 | |
| /*        Set INFO on the first occurrence of a zero pivot */
 | |
| 
 | |
| 	if (*info == 0 && iinfo > 0) {
 | |
| 	    *info = iinfo;
 | |
| 	}
 | |
| 
 | |
| /*        Decrease K and return to the start of the main loop */
 | |
| 
 | |
| 	k -= kb;
 | |
| 	goto L10;
 | |
| 
 | |
|     } else {
 | |
| 
 | |
| /*        Factorize A as L*D*L' using the lower triangle of A */
 | |
| 
 | |
| /*        K is the main loop index, increasing from 1 to N in steps of */
 | |
| /*        KB, where KB is the number of columns factorized by DLASYF; */
 | |
| /*        KB is either NB or NB-1, or N-K+1 for the last block */
 | |
| 
 | |
| 	k = 1;
 | |
| L20:
 | |
| 
 | |
| /*        If K > N, exit from loop */
 | |
| 
 | |
| 	if (k > *n) {
 | |
| 	    goto L40;
 | |
| 	}
 | |
| 
 | |
| 	if (k <= *n - nb) {
 | |
| 
 | |
| /*           Factorize columns k:k+kb-1 of A and use blocked code to */
 | |
| /*           update columns k+kb:n */
 | |
| 
 | |
| 	    i__1 = *n - k + 1;
 | |
| 	    dlasyf_(uplo, &i__1, &nb, &kb, &a[k + k * a_dim1], lda, &ipiv[k], 
 | |
| 		    &work[1], &ldwork, &iinfo);
 | |
| 	} else {
 | |
| 
 | |
| /*           Use unblocked code to factorize columns k:n of A */
 | |
| 
 | |
| 	    i__1 = *n - k + 1;
 | |
| 	    dsytf2_(uplo, &i__1, &a[k + k * a_dim1], lda, &ipiv[k], &iinfo);
 | |
| 	    kb = *n - k + 1;
 | |
| 	}
 | |
| 
 | |
| /*        Set INFO on the first occurrence of a zero pivot */
 | |
| 
 | |
| 	if (*info == 0 && iinfo > 0) {
 | |
| 	    *info = iinfo + k - 1;
 | |
| 	}
 | |
| 
 | |
| /*        Adjust IPIV */
 | |
| 
 | |
| 	i__1 = k + kb - 1;
 | |
| 	for (j = k; j <= i__1; ++j) {
 | |
| 	    if (ipiv[j] > 0) {
 | |
| 		ipiv[j] = ipiv[j] + k - 1;
 | |
| 	    } else {
 | |
| 		ipiv[j] = ipiv[j] - k + 1;
 | |
| 	    }
 | |
| /* L30: */
 | |
| 	}
 | |
| 
 | |
| /*        Increase K and return to the start of the main loop */
 | |
| 
 | |
| 	k += kb;
 | |
| 	goto L20;
 | |
| 
 | |
|     }
 | |
| 
 | |
| L40:
 | |
|     work[1] = (doublereal) lwkopt;
 | |
|     return 0;
 | |
| 
 | |
| /*     End of DSYTRF */
 | |
| 
 | |
| } /* dsytrf_ */
 | 
