dlasd4.c
来自「提供矩阵类的函数库」· C语言 代码 · 共 1,087 行 · 第 1/2 页
C
1,087 行
#include "blaswrap.h"
/* -- translated by f2c (version 19990503).
You must link the resulting object file with the libraries:
-lf2c -lm (in that order)
*/
#include "f2c.h"
/* Common Block Declarations */
struct {
doublereal ops, itcnt;
} latime_;
#define latime_1 latime_
/* Subroutine */ int dlasd4_(integer *n, integer *i__, doublereal *d__,
doublereal *z__, doublereal *delta, doublereal *rho, doublereal *
sigma, doublereal *work, integer *info)
{
/* System generated locals */
integer i__1;
doublereal d__1;
/* Builtin functions */
double sqrt(doublereal);
/* Local variables */
static doublereal dphi, dpsi;
static integer iter;
static doublereal temp, prew, sg2lb, sg2ub, temp1, temp2, a, b, c__;
static integer j;
static doublereal w, dtiim, delsq, dtiip;
static integer niter;
static doublereal dtisq;
static logical swtch;
static doublereal dtnsq;
extern /* Subroutine */ int dlaed6_(integer *, logical *, doublereal *,
doublereal *, doublereal *, doublereal *, doublereal *, integer *)
, dlasd5_(integer *, doublereal *, doublereal *, doublereal *,
doublereal *, doublereal *, doublereal *);
static doublereal delsq2, dd[3], dtnsq1;
static logical swtch3;
static integer ii;
extern doublereal dlamch_(char *);
static doublereal dw, zz[3];
static logical orgati;
static doublereal erretm, dtipsq, rhoinv;
static integer ip1;
static doublereal eta, phi, eps, tau, psi;
static integer iim1, iip1;
/* -- LAPACK auxiliary routine (instrumented to count ops, version 3.0) --
Univ. of Tennessee, Oak Ridge National Lab, Argonne National Lab,
Courant Institute, NAG Ltd., and Rice University
October 31, 1999
Purpose
=======
This subroutine computes the square root of the I-th updated
eigenvalue of a positive symmetric rank-one modification to
a positive diagonal matrix whose entries are given as the squares
of the corresponding entries in the array d, and that
0 <= D(i) < D(j) for i < j
and that RHO > 0. This is arranged by the calling routine, and is
no loss in generality. The rank-one modified system is thus
diag( D ) * diag( D ) + RHO * Z * Z_transpose.
where we assume the Euclidean norm of Z is 1.
The method consists of approximating the rational functions in the
secular equation by simpler interpolating rational functions.
Arguments
=========
N (input) INTEGER
The length of all arrays.
I (input) INTEGER
The index of the eigenvalue to be computed. 1 <= I <= N.
D (input) DOUBLE PRECISION array, dimension ( N )
The original eigenvalues. It is assumed that they are in
order, 0 <= D(I) < D(J) for I < J.
Z (input) DOUBLE PRECISION array, dimension ( N )
The components of the updating vector.
DELTA (output) DOUBLE PRECISION array, dimension ( N )
If N .ne. 1, DELTA contains (D(j) - sigma_I) in its j-th
component. If N = 1, then DELTA(1) = 1. The vector DELTA
contains the information necessary to construct the
(singular) eigenvectors.
RHO (input) DOUBLE PRECISION
The scalar in the symmetric updating formula.
SIGMA (output) DOUBLE PRECISION
The computed lambda_I, the I-th updated eigenvalue.
WORK (workspace) DOUBLE PRECISION array, dimension ( N )
If N .ne. 1, WORK contains (D(j) + sigma_I) in its j-th
component. If N = 1, then WORK( 1 ) = 1.
INFO (output) INTEGER
= 0: successful exit
> 0: if INFO = 1, the updating process failed.
Internal Parameters
===================
Logical variable ORGATI (origin-at-i?) is used for distinguishing
whether D(i) or D(i+1) is treated as the origin.
ORGATI = .true. origin at i
ORGATI = .false. origin at i+1
Logical variable SWTCH3 (switch-for-3-poles?) is for noting
if we are working with THREE poles!
MAXIT is the maximum number of iterations allowed for each
eigenvalue.
Further Details
===============
Based on contributions by
Ren-Cang Li, Computer Science Division, University of California
at Berkeley, USA
=====================================================================
Since this routine is called in an inner loop, we do no argument
checking.
Quick return for N=1 and 2.
Parameter adjustments */
--work;
--delta;
--z__;
--d__;
/* Function Body */
*info = 0;
if (*n == 1) {
/* Presumably, I=1 upon entry */
latime_1.ops += 5.;
*sigma = sqrt(d__[1] * d__[1] + *rho * z__[1] * z__[1]);
delta[1] = 1.;
work[1] = 1.;
return 0;
}
if (*n == 2) {
dlasd5_(i__, &d__[1], &z__[1], &delta[1], rho, sigma, &work[1]);
return 0;
}
/* Compute machine epsilon */
eps = dlamch_("Epsilon");
latime_1.ops += 1.;
rhoinv = 1. / *rho;
/* The case I = N */
if (*i__ == *n) {
/* Initialize some basic variables */
ii = *n - 1;
niter = 1;
/* Calculate initial guess */
latime_1.ops += 1.;
temp = *rho / 2.;
/* If ||Z||_2 is not one, then TEMP should be set to
RHO * ||Z||_2^2 / TWO */
latime_1.ops += (doublereal) ((*n << 2) + 5);
temp1 = temp / (d__[*n] + sqrt(d__[*n] * d__[*n] + temp));
i__1 = *n;
for (j = 1; j <= i__1; ++j) {
work[j] = d__[j] + d__[*n] + temp1;
delta[j] = d__[j] - d__[*n] - temp1;
/* L10: */
}
psi = 0.;
latime_1.ops += (doublereal) (*n - 2 << 2);
i__1 = *n - 2;
for (j = 1; j <= i__1; ++j) {
psi += z__[j] * z__[j] / (delta[j] * work[j]);
/* L20: */
}
latime_1.ops += 9.;
c__ = rhoinv + psi;
w = c__ + z__[ii] * z__[ii] / (delta[ii] * work[ii]) + z__[*n] * z__[*
n] / (delta[*n] * work[*n]);
if (w <= 0.) {
latime_1.ops += 14.;
temp1 = sqrt(d__[*n] * d__[*n] + *rho);
temp = z__[*n - 1] * z__[*n - 1] / ((d__[*n - 1] + temp1) * (d__[*
n] - d__[*n - 1] + *rho / (d__[*n] + temp1))) + z__[*n] *
z__[*n] / *rho;
/* The following TAU is to approximate
SIGMA_n^2 - D( N )*D( N ) */
if (c__ <= temp) {
tau = *rho;
} else {
latime_1.ops += 10.;
delsq = (d__[*n] - d__[*n - 1]) * (d__[*n] + d__[*n - 1]);
a = -c__ * delsq + z__[*n - 1] * z__[*n - 1] + z__[*n] * z__[*
n];
b = z__[*n] * z__[*n] * delsq;
if (a < 0.) {
latime_1.ops += 8.;
tau = b * 2. / (sqrt(a * a + b * 4. * c__) - a);
} else {
latime_1.ops += 8.;
tau = (a + sqrt(a * a + b * 4. * c__)) / (c__ * 2.);
}
}
/* It can be proved that
D(N)^2+RHO/2 <= SIGMA_n^2 < D(N)^2+TAU <= D(N)^2+RHO */
} else {
latime_1.ops += 10.;
delsq = (d__[*n] - d__[*n - 1]) * (d__[*n] + d__[*n - 1]);
a = -c__ * delsq + z__[*n - 1] * z__[*n - 1] + z__[*n] * z__[*n];
b = z__[*n] * z__[*n] * delsq;
/* The following TAU is to approximate
SIGMA_n^2 - D( N )*D( N ) */
if (a < 0.) {
latime_1.ops += 8.;
tau = b * 2. / (sqrt(a * a + b * 4. * c__) - a);
} else {
latime_1.ops += 8.;
tau = (a + sqrt(a * a + b * 4. * c__)) / (c__ * 2.);
}
/* It can be proved that
D(N)^2 < D(N)^2+TAU < SIGMA(N)^2 < D(N)^2+RHO/2 */
}
/* The following ETA is to approximate SIGMA_n - D( N ) */
latime_1.ops += 5.;
eta = tau / (d__[*n] + sqrt(d__[*n] * d__[*n] + tau));
latime_1.ops += (doublereal) ((*n << 2) + 1);
*sigma = d__[*n] + eta;
i__1 = *n;
for (j = 1; j <= i__1; ++j) {
delta[j] = d__[j] - d__[*i__] - eta;
work[j] = d__[j] + d__[*i__] + eta;
/* L30: */
}
/* Evaluate PSI and the derivative DPSI */
dpsi = 0.;
psi = 0.;
erretm = 0.;
latime_1.ops += (doublereal) (ii * 7);
i__1 = ii;
for (j = 1; j <= i__1; ++j) {
temp = z__[j] / (delta[j] * work[j]);
psi += z__[j] * temp;
dpsi += temp * temp;
erretm += psi;
/* L40: */
}
erretm = abs(erretm);
/* Evaluate PHI and the derivative DPHI */
latime_1.ops += 14.;
temp = z__[*n] / (delta[*n] * work[*n]);
phi = z__[*n] * temp;
dphi = temp * temp;
erretm = (-phi - psi) * 8. + erretm - phi + rhoinv + abs(tau) * (dpsi
+ dphi);
w = rhoinv + phi + psi;
/* Test for convergence */
if (abs(w) <= eps * erretm) {
goto L240;
}
/* Calculate the new step */
++niter;
latime_1.ops += 14.;
dtnsq1 = work[*n - 1] * delta[*n - 1];
dtnsq = work[*n] * delta[*n];
c__ = w - dtnsq1 * dpsi - dtnsq * dphi;
a = (dtnsq + dtnsq1) * w - dtnsq * dtnsq1 * (dpsi + dphi);
b = dtnsq * dtnsq1 * w;
if (c__ < 0.) {
c__ = abs(c__);
}
if (c__ == 0.) {
latime_1.ops += 2.;
eta = *rho - *sigma * *sigma;
} else if (a >= 0.) {
latime_1.ops += 8.;
eta = (a + sqrt((d__1 = a * a - b * 4. * c__, abs(d__1)))) / (c__
* 2.);
} else {
latime_1.ops += 8.;
eta = b * 2. / (a - sqrt((d__1 = a * a - b * 4. * c__, abs(d__1)))
);
}
/* Note, eta should be positive if w is negative, and
eta should be negative otherwise. However,
if for some reason caused by roundoff, eta*w > 0,
we simply use one Newton step instead. This way
will guarantee eta*w < 0. */
latime_1.ops += 1.;
if (w * eta > 0.) {
latime_1.ops += 2.;
eta = -w / (dpsi + dphi);
}
temp = eta - dtnsq;
if (temp > *rho) {
latime_1.ops += 1.;
eta = *rho + dtnsq;
}
latime_1.ops += (doublereal) ((*n << 1) + 7);
tau += eta;
eta /= *sigma + sqrt(eta + *sigma * *sigma);
i__1 = *n;
for (j = 1; j <= i__1; ++j) {
delta[j] -= eta;
work[j] += eta;
/* L50: */
}
*sigma += eta;
/* Evaluate PSI and the derivative DPSI */
dpsi = 0.;
psi = 0.;
erretm = 0.;
latime_1.ops += (doublereal) (ii * 7);
i__1 = ii;
for (j = 1; j <= i__1; ++j) {
temp = z__[j] / (work[j] * delta[j]);
psi += z__[j] * temp;
dpsi += temp * temp;
erretm += psi;
/* L60: */
}
erretm = abs(erretm);
/* Evaluate PHI and the derivative DPHI */
latime_1.ops += 14.;
temp = z__[*n] / (work[*n] * delta[*n]);
phi = z__[*n] * temp;
dphi = temp * temp;
erretm = (-phi - psi) * 8. + erretm - phi + rhoinv + abs(tau) * (dpsi
+ dphi);
w = rhoinv + phi + psi;
/* Main loop to update the values of the array DELTA */
iter = niter + 1;
for (niter = iter; niter <= 20; ++niter) {
/* Test for convergence */
latime_1.ops += 1.;
if (abs(w) <= eps * erretm) {
goto L240;
}
/* Calculate the new step */
latime_1.ops += 22.;
dtnsq1 = work[*n - 1] * delta[*n - 1];
dtnsq = work[*n] * delta[*n];
c__ = w - dtnsq1 * dpsi - dtnsq * dphi;
a = (dtnsq + dtnsq1) * w - dtnsq1 * dtnsq * (dpsi + dphi);
b = dtnsq1 * dtnsq * w;
if (a >= 0.) {
eta = (a + sqrt((d__1 = a * a - b * 4. * c__, abs(d__1)))) / (
c__ * 2.);
} else {
eta = b * 2. / (a - sqrt((d__1 = a * a - b * 4. * c__, abs(
d__1))));
}
/* Note, eta should be positive if w is negative, and
eta should be negative otherwise. However,
if for some reason caused by roundoff, eta*w > 0,
we simply use one Newton step instead. This way
will guarantee eta*w < 0. */
latime_1.ops += 2.;
if (w * eta > 0.) {
latime_1.ops += 2.;
eta = -w / (dpsi + dphi);
}
temp = eta - dtnsq;
if (temp <= 0.) {
latime_1.ops += 1.;
eta /= 2.;
}
latime_1.ops += (doublereal) ((*n << 1) + 7);
tau += eta;
eta /= *sigma + sqrt(eta + *sigma * *sigma);
i__1 = *n;
for (j = 1; j <= i__1; ++j) {
delta[j] -= eta;
work[j] += eta;
/* L70: */
}
*sigma += eta;
/* Evaluate PSI and the derivative DPSI */
dpsi = 0.;
psi = 0.;
erretm = 0.;
latime_1.ops += (doublereal) (ii * 7);
i__1 = ii;
for (j = 1; j <= i__1; ++j) {
temp = z__[j] / (work[j] * delta[j]);
psi += z__[j] * temp;
dpsi += temp * temp;
erretm += psi;
/* L80: */
}
erretm = abs(erretm);
/* Evaluate PHI and the derivative DPHI */
latime_1.ops += 14.;
temp = z__[*n] / (work[*n] * delta[*n]);
phi = z__[*n] * temp;
dphi = temp * temp;
erretm = (-phi - psi) * 8. + erretm - phi + rhoinv + abs(tau) * (
dpsi + dphi);
w = rhoinv + phi + psi;
/* L90: */
}
/* Return with INFO = 1, NITER = MAXIT and not converged */
*info = 1;
goto L240;
/* End for the case I = N */
} else {
/* The case for I < N */
niter = 1;
ip1 = *i__ + 1;
/* Calculate initial guess */
latime_1.ops += (doublereal) ((*n << 2) + 9);
delsq = (d__[ip1] - d__[*i__]) * (d__[ip1] + d__[*i__]);
delsq2 = delsq / 2.;
temp = delsq2 / (d__[*i__] + sqrt(d__[*i__] * d__[*i__] + delsq2));
i__1 = *n;
for (j = 1; j <= i__1; ++j) {
work[j] = d__[j] + d__[*i__] + temp;
delta[j] = d__[j] - d__[*i__] - temp;
/* L100: */
}
psi = 0.;
latime_1.ops += (doublereal) (*i__ - 1 << 2);
i__1 = *i__ - 1;
for (j = 1; j <= i__1; ++j) {
psi += z__[j] * z__[j] / (work[j] * delta[j]);
/* L110: */
}
phi = 0.;
latime_1.ops += (doublereal) ((*n - *i__ - 1 << 2) + 10);
i__1 = *i__ + 2;
for (j = *n; j >= i__1; --j) {
phi += z__[j] * z__[j] / (work[j] * delta[j]);
/* L120: */
}
c__ = rhoinv + psi + phi;
w = c__ + z__[*i__] * z__[*i__] / (work[*i__] * delta[*i__]) + z__[
ip1] * z__[ip1] / (work[ip1] * delta[ip1]);
if (w > 0.) {
/* d(i)^2 < the ith sigma^2 < (d(i)^2+d(i+1)^2)/2
We choose d(i) as origin. */
latime_1.ops += 20.;
orgati = TRUE_;
sg2lb = 0.;
sg2ub = delsq2;
a = c__ * delsq + z__[*i__] * z__[*i__] + z__[ip1] * z__[ip1];
b = z__[*i__] * z__[*i__] * delsq;
if (a > 0.) {
tau = b * 2. / (a + sqrt((d__1 = a * a - b * 4. * c__, abs(
d__1))));
} else {
tau = (a - sqrt((d__1 = a * a - b * 4. * c__, abs(d__1)))) / (
c__ * 2.);
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?