283 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			283 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/* iparmq.f -- translated by f2c (version 20061008).
 | 
						|
   You must link the resulting object file with libf2c:
 | 
						|
	on Microsoft Windows system, link with libf2c.lib;
 | 
						|
	on Linux or Unix systems, link with .../path/to/libf2c.a -lm
 | 
						|
	or, if you install libf2c.a in a standard place, with -lf2c -lm
 | 
						|
	-- in that order, at the end of the command line, as in
 | 
						|
		cc *.o -lf2c -lm
 | 
						|
	Source for libf2c is in /netlib/f2c/libf2c.zip, e.g.,
 | 
						|
 | 
						|
		http://www.netlib.org/f2c/libf2c.zip
 | 
						|
*/
 | 
						|
 | 
						|
#include "clapack.h"
 | 
						|
 | 
						|
 | 
						|
integer iparmq_(integer *ispec, char *name__, char *opts, integer *n, integer 
 | 
						|
	*ilo, integer *ihi, integer *lwork)
 | 
						|
{
 | 
						|
    /* System generated locals */
 | 
						|
    integer ret_val, i__1, i__2;
 | 
						|
    real r__1;
 | 
						|
 | 
						|
    /* Builtin functions */
 | 
						|
    double log(doublereal);
 | 
						|
    integer i_nint(real *);
 | 
						|
 | 
						|
    /* Local variables */
 | 
						|
    integer nh, ns;
 | 
						|
 | 
						|
 | 
						|
/*  -- LAPACK auxiliary routine (version 3.2) -- */
 | 
						|
/*     Univ. of Tennessee, Univ. of California Berkeley and NAG Ltd.. */
 | 
						|
/*     November 2006 */
 | 
						|
 | 
						|
/*     .. Scalar Arguments .. */
 | 
						|
 | 
						|
/*  Purpose */
 | 
						|
/*  ======= */
 | 
						|
 | 
						|
/*       This program sets problem and machine dependent parameters */
 | 
						|
/*       useful for xHSEQR and its subroutines. It is called whenever */
 | 
						|
/*       ILAENV is called with 12 <= ISPEC <= 16 */
 | 
						|
 | 
						|
/*  Arguments */
 | 
						|
/*  ========= */
 | 
						|
 | 
						|
/*       ISPEC  (input) integer scalar */
 | 
						|
/*              ISPEC specifies which tunable parameter IPARMQ should */
 | 
						|
/*              return. */
 | 
						|
 | 
						|
/*              ISPEC=12: (INMIN)  Matrices of order nmin or less */
 | 
						|
/*                        are sent directly to xLAHQR, the implicit */
 | 
						|
/*                        double shift QR algorithm.  NMIN must be */
 | 
						|
/*                        at least 11. */
 | 
						|
 | 
						|
/*              ISPEC=13: (INWIN)  Size of the deflation window. */
 | 
						|
/*                        This is best set greater than or equal to */
 | 
						|
/*                        the number of simultaneous shifts NS. */
 | 
						|
/*                        Larger matrices benefit from larger deflation */
 | 
						|
/*                        windows. */
 | 
						|
 | 
						|
/*              ISPEC=14: (INIBL) Determines when to stop nibbling and */
 | 
						|
/*                        invest in an (expensive) multi-shift QR sweep. */
 | 
						|
/*                        If the aggressive early deflation subroutine */
 | 
						|
/*                        finds LD converged eigenvalues from an order */
 | 
						|
/*                        NW deflation window and LD.GT.(NW*NIBBLE)/100, */
 | 
						|
/*                        then the next QR sweep is skipped and early */
 | 
						|
/*                        deflation is applied immediately to the */
 | 
						|
/*                        remaining active diagonal block.  Setting */
 | 
						|
/*                        IPARMQ(ISPEC=14) = 0 causes TTQRE to skip a */
 | 
						|
/*                        multi-shift QR sweep whenever early deflation */
 | 
						|
/*                        finds a converged eigenvalue.  Setting */
 | 
						|
/*                        IPARMQ(ISPEC=14) greater than or equal to 100 */
 | 
						|
/*                        prevents TTQRE from skipping a multi-shift */
 | 
						|
/*                        QR sweep. */
 | 
						|
 | 
						|
/*              ISPEC=15: (NSHFTS) The number of simultaneous shifts in */
 | 
						|
/*                        a multi-shift QR iteration. */
 | 
						|
 | 
						|
/*              ISPEC=16: (IACC22) IPARMQ is set to 0, 1 or 2 with the */
 | 
						|
/*                        following meanings. */
 | 
						|
/*                        0:  During the multi-shift QR sweep, */
 | 
						|
/*                            xLAQR5 does not accumulate reflections and */
 | 
						|
/*                            does not use matrix-matrix multiply to */
 | 
						|
/*                            update the far-from-diagonal matrix */
 | 
						|
/*                            entries. */
 | 
						|
/*                        1:  During the multi-shift QR sweep, */
 | 
						|
/*                            xLAQR5 and/or xLAQRaccumulates reflections and uses */
 | 
						|
/*                            matrix-matrix multiply to update the */
 | 
						|
/*                            far-from-diagonal matrix entries. */
 | 
						|
/*                        2:  During the multi-shift QR sweep. */
 | 
						|
/*                            xLAQR5 accumulates reflections and takes */
 | 
						|
/*                            advantage of 2-by-2 block structure during */
 | 
						|
/*                            matrix-matrix multiplies. */
 | 
						|
/*                        (If xTRMM is slower than xGEMM, then */
 | 
						|
/*                        IPARMQ(ISPEC=16)=1 may be more efficient than */
 | 
						|
/*                        IPARMQ(ISPEC=16)=2 despite the greater level of */
 | 
						|
/*                        arithmetic work implied by the latter choice.) */
 | 
						|
 | 
						|
/*       NAME    (input) character string */
 | 
						|
/*               Name of the calling subroutine */
 | 
						|
 | 
						|
/*       OPTS    (input) character string */
 | 
						|
/*               This is a concatenation of the string arguments to */
 | 
						|
/*               TTQRE. */
 | 
						|
 | 
						|
/*       N       (input) integer scalar */
 | 
						|
/*               N is the order of the Hessenberg matrix H. */
 | 
						|
 | 
						|
/*       ILO     (input) INTEGER */
 | 
						|
/*       IHI     (input) INTEGER */
 | 
						|
/*               It is assumed that H is already upper triangular */
 | 
						|
/*               in rows and columns 1:ILO-1 and IHI+1:N. */
 | 
						|
 | 
						|
/*       LWORK   (input) integer scalar */
 | 
						|
/*               The amount of workspace available. */
 | 
						|
 | 
						|
/*  Further Details */
 | 
						|
/*  =============== */
 | 
						|
 | 
						|
/*       Little is known about how best to choose these parameters. */
 | 
						|
/*       It is possible to use different values of the parameters */
 | 
						|
/*       for each of CHSEQR, DHSEQR, SHSEQR and ZHSEQR. */
 | 
						|
 | 
						|
/*       It is probably best to choose different parameters for */
 | 
						|
/*       different matrices and different parameters at different */
 | 
						|
/*       times during the iteration, but this has not been */
 | 
						|
/*       implemented --- yet. */
 | 
						|
 | 
						|
 | 
						|
/*       The best choices of most of the parameters depend */
 | 
						|
/*       in an ill-understood way on the relative execution */
 | 
						|
/*       rate of xLAQR3 and xLAQR5 and on the nature of each */
 | 
						|
/*       particular eigenvalue problem.  Experiment may be the */
 | 
						|
/*       only practical way to determine which choices are most */
 | 
						|
/*       effective. */
 | 
						|
 | 
						|
/*       Following is a list of default values supplied by IPARMQ. */
 | 
						|
/*       These defaults may be adjusted in order to attain better */
 | 
						|
/*       performance in any particular computational environment. */
 | 
						|
 | 
						|
/*       IPARMQ(ISPEC=12) The xLAHQR vs xLAQR0 crossover point. */
 | 
						|
/*                        Default: 75. (Must be at least 11.) */
 | 
						|
 | 
						|
/*       IPARMQ(ISPEC=13) Recommended deflation window size. */
 | 
						|
/*                        This depends on ILO, IHI and NS, the */
 | 
						|
/*                        number of simultaneous shifts returned */
 | 
						|
/*                        by IPARMQ(ISPEC=15).  The default for */
 | 
						|
/*                        (IHI-ILO+1).LE.500 is NS.  The default */
 | 
						|
/*                        for (IHI-ILO+1).GT.500 is 3*NS/2. */
 | 
						|
 | 
						|
/*       IPARMQ(ISPEC=14) Nibble crossover point.  Default: 14. */
 | 
						|
 | 
						|
/*       IPARMQ(ISPEC=15) Number of simultaneous shifts, NS. */
 | 
						|
/*                        a multi-shift QR iteration. */
 | 
						|
 | 
						|
/*                        If IHI-ILO+1 is ... */
 | 
						|
 | 
						|
/*                        greater than      ...but less    ... the */
 | 
						|
/*                        or equal to ...      than        default is */
 | 
						|
 | 
						|
/*                                0               30       NS =   2+ */
 | 
						|
/*                               30               60       NS =   4+ */
 | 
						|
/*                               60              150       NS =  10 */
 | 
						|
/*                              150              590       NS =  ** */
 | 
						|
/*                              590             3000       NS =  64 */
 | 
						|
/*                             3000             6000       NS = 128 */
 | 
						|
/*                             6000             infinity   NS = 256 */
 | 
						|
 | 
						|
/*                    (+)  By default matrices of this order are */
 | 
						|
/*                         passed to the implicit double shift routine */
 | 
						|
/*                         xLAHQR.  See IPARMQ(ISPEC=12) above.   These */
 | 
						|
/*                         values of NS are used only in case of a rare */
 | 
						|
/*                         xLAHQR failure. */
 | 
						|
 | 
						|
/*                    (**) The asterisks (**) indicate an ad-hoc */
 | 
						|
/*                         function increasing from 10 to 64. */
 | 
						|
 | 
						|
/*       IPARMQ(ISPEC=16) Select structured matrix multiply. */
 | 
						|
/*                        (See ISPEC=16 above for details.) */
 | 
						|
/*                        Default: 3. */
 | 
						|
 | 
						|
/*     ================================================================ */
 | 
						|
/*     .. Parameters .. */
 | 
						|
/*     .. */
 | 
						|
/*     .. Local Scalars .. */
 | 
						|
/*     .. */
 | 
						|
/*     .. Intrinsic Functions .. */
 | 
						|
/*     .. */
 | 
						|
/*     .. Executable Statements .. */
 | 
						|
    if (*ispec == 15 || *ispec == 13 || *ispec == 16) {
 | 
						|
 | 
						|
/*        ==== Set the number simultaneous shifts ==== */
 | 
						|
 | 
						|
	nh = *ihi - *ilo + 1;
 | 
						|
	ns = 2;
 | 
						|
	if (nh >= 30) {
 | 
						|
	    ns = 4;
 | 
						|
	}
 | 
						|
	if (nh >= 60) {
 | 
						|
	    ns = 10;
 | 
						|
	}
 | 
						|
	if (nh >= 150) {
 | 
						|
/* Computing MAX */
 | 
						|
	    r__1 = log((real) nh) / log(2.f);
 | 
						|
	    i__1 = 10, i__2 = nh / i_nint(&r__1);
 | 
						|
	    ns = max(i__1,i__2);
 | 
						|
	}
 | 
						|
	if (nh >= 590) {
 | 
						|
	    ns = 64;
 | 
						|
	}
 | 
						|
	if (nh >= 3000) {
 | 
						|
	    ns = 128;
 | 
						|
	}
 | 
						|
	if (nh >= 6000) {
 | 
						|
	    ns = 256;
 | 
						|
	}
 | 
						|
/* Computing MAX */
 | 
						|
	i__1 = 2, i__2 = ns - ns % 2;
 | 
						|
	ns = max(i__1,i__2);
 | 
						|
    }
 | 
						|
 | 
						|
    if (*ispec == 12) {
 | 
						|
 | 
						|
 | 
						|
/*        ===== Matrices of order smaller than NMIN get sent */
 | 
						|
/*        .     to xLAHQR, the classic double shift algorithm. */
 | 
						|
/*        .     This must be at least 11. ==== */
 | 
						|
 | 
						|
	ret_val = 75;
 | 
						|
 | 
						|
    } else if (*ispec == 14) {
 | 
						|
 | 
						|
/*        ==== INIBL: skip a multi-shift qr iteration and */
 | 
						|
/*        .    whenever aggressive early deflation finds */
 | 
						|
/*        .    at least (NIBBLE*(window size)/100) deflations. ==== */
 | 
						|
 | 
						|
	ret_val = 14;
 | 
						|
 | 
						|
    } else if (*ispec == 15) {
 | 
						|
 | 
						|
/*        ==== NSHFTS: The number of simultaneous shifts ===== */
 | 
						|
 | 
						|
	ret_val = ns;
 | 
						|
 | 
						|
    } else if (*ispec == 13) {
 | 
						|
 | 
						|
/*        ==== NW: deflation window size.  ==== */
 | 
						|
 | 
						|
	if (nh <= 500) {
 | 
						|
	    ret_val = ns;
 | 
						|
	} else {
 | 
						|
	    ret_val = ns * 3 / 2;
 | 
						|
	}
 | 
						|
 | 
						|
    } else if (*ispec == 16) {
 | 
						|
 | 
						|
/*        ==== IACC22: Whether to accumulate reflections */
 | 
						|
/*        .     before updating the far-from-diagonal elements */
 | 
						|
/*        .     and whether to use 2-by-2 block structure while */
 | 
						|
/*        .     doing it.  A small amount of work could be saved */
 | 
						|
/*        .     by making this choice dependent also upon the */
 | 
						|
/*        .     NH=IHI-ILO+1. */
 | 
						|
 | 
						|
	ret_val = 0;
 | 
						|
	if (ns >= 14) {
 | 
						|
	    ret_val = 1;
 | 
						|
	}
 | 
						|
	if (ns >= 14) {
 | 
						|
	    ret_val = 2;
 | 
						|
	}
 | 
						|
 | 
						|
    } else {
 | 
						|
/*        ===== invalid value of ispec ===== */
 | 
						|
	ret_val = -1;
 | 
						|
 | 
						|
    }
 | 
						|
 | 
						|
/*     ==== End of IPARMQ ==== */
 | 
						|
 | 
						|
    return ret_val;
 | 
						|
} /* iparmq_ */
 |