slasd4.c
来自「提供矩阵类的函数库」· C语言 代码 · 共 1,088 行 · 第 1/2 页
C
1,088 行
(c__ * 2.f);
}
/* TAU now is an estimation of SIGMA^2 - D( I )^2. The
following, however, is the corresponding estimation of
SIGMA - D( I ). */
eta = tau / (d__[*i__] + sqrt(d__[*i__] * d__[*i__] + tau));
} else {
/* (d(i)^2+d(i+1)^2)/2 <= the ith sigma^2 < d(i+1)^2/2
We choose d(i+1) as origin. */
latime_1.ops += 20.f;
orgati = FALSE_;
sg2lb = -delsq2;
sg2ub = 0.f;
a = c__ * delsq - z__[*i__] * z__[*i__] - z__[ip1] * z__[ip1];
b = z__[ip1] * z__[ip1] * delsq;
if (a < 0.f) {
tau = b * 2.f / (a - sqrt((r__1 = a * a + b * 4.f * c__, dabs(
r__1))));
} else {
tau = -(a + sqrt((r__1 = a * a + b * 4.f * c__, dabs(r__1))))
/ (c__ * 2.f);
}
/* TAU now is an estimation of SIGMA^2 - D( IP1 )^2. The
following, however, is the corresponding estimation of
SIGMA - D( IP1 ). */
eta = tau / (d__[ip1] + sqrt((r__1 = d__[ip1] * d__[ip1] + tau,
dabs(r__1))));
}
latime_1.ops += (real) ((*n << 2) + 1);
if (orgati) {
ii = *i__;
*sigma = d__[*i__] + eta;
i__1 = *n;
for (j = 1; j <= i__1; ++j) {
work[j] = d__[j] + d__[*i__] + eta;
delta[j] = d__[j] - d__[*i__] - eta;
/* L130: */
}
} else {
ii = *i__ + 1;
*sigma = d__[ip1] + eta;
i__1 = *n;
for (j = 1; j <= i__1; ++j) {
work[j] = d__[j] + d__[ip1] + eta;
delta[j] = d__[j] - d__[ip1] - eta;
/* L140: */
}
}
iim1 = ii - 1;
iip1 = ii + 1;
/* Evaluate PSI and the derivative DPSI */
dpsi = 0.f;
psi = 0.f;
erretm = 0.f;
latime_1.ops += (real) (iim1 * 7);
i__1 = iim1;
for (j = 1; j <= i__1; ++j) {
temp = z__[j] / (work[j] * delta[j]);
psi += z__[j] * temp;
dpsi += temp * temp;
erretm += psi;
/* L150: */
}
erretm = dabs(erretm);
/* Evaluate PHI and the derivative DPHI */
dphi = 0.f;
phi = 0.f;
latime_1.ops += (real) ((*n - iip1 + 1) * 7 + 2);
i__1 = iip1;
for (j = *n; j >= i__1; --j) {
temp = z__[j] / (work[j] * delta[j]);
phi += z__[j] * temp;
dphi += temp * temp;
erretm += phi;
/* L160: */
}
w = rhoinv + phi + psi;
/* W is the value of the secular function with
its ii-th element removed. */
swtch3 = FALSE_;
if (orgati) {
if (w < 0.f) {
swtch3 = TRUE_;
}
} else {
if (w > 0.f) {
swtch3 = TRUE_;
}
}
if (ii == 1 || ii == *n) {
swtch3 = FALSE_;
}
latime_1.ops += 17.f;
temp = z__[ii] / (work[ii] * delta[ii]);
dw = dpsi + dphi + temp * temp;
temp = z__[ii] * temp;
w += temp;
erretm = (phi - psi) * 8.f + erretm + rhoinv * 2.f + dabs(temp) * 3.f
+ dabs(tau) * dw;
/* Test for convergence */
if (dabs(w) <= eps * erretm) {
goto L240;
}
if (w <= 0.f) {
sg2lb = dmax(sg2lb,tau);
} else {
sg2ub = dmin(sg2ub,tau);
}
/* Calculate the new step */
++niter;
if (! swtch3) {
latime_1.ops += 15.f;
dtipsq = work[ip1] * delta[ip1];
dtisq = work[*i__] * delta[*i__];
if (orgati) {
/* Computing 2nd power */
r__1 = z__[*i__] / dtisq;
c__ = w - dtipsq * dw + delsq * (r__1 * r__1);
} else {
/* Computing 2nd power */
r__1 = z__[ip1] / dtipsq;
c__ = w - dtisq * dw - delsq * (r__1 * r__1);
}
a = (dtipsq + dtisq) * w - dtipsq * dtisq * dw;
b = dtipsq * dtisq * w;
if (c__ == 0.f) {
if (a == 0.f) {
latime_1.ops += 5.f;
if (orgati) {
a = z__[*i__] * z__[*i__] + dtipsq * dtipsq * (dpsi +
dphi);
} else {
a = z__[ip1] * z__[ip1] + dtisq * dtisq * (dpsi +
dphi);
}
}
latime_1.ops += 1.f;
eta = b / a;
} else if (a <= 0.f) {
latime_1.ops += 8.f;
eta = (a - sqrt((r__1 = a * a - b * 4.f * c__, dabs(r__1)))) /
(c__ * 2.f);
} else {
latime_1.ops += 8.f;
eta = b * 2.f / (a + sqrt((r__1 = a * a - b * 4.f * c__, dabs(
r__1))));
}
} else {
/* Interpolation using THREE most relevant poles */
latime_1.ops += 15.f;
dtiim = work[iim1] * delta[iim1];
dtiip = work[iip1] * delta[iip1];
temp = rhoinv + psi + phi;
if (orgati) {
temp1 = z__[iim1] / dtiim;
temp1 *= temp1;
c__ = temp - dtiip * (dpsi + dphi) - (d__[iim1] - d__[iip1]) *
(d__[iim1] + d__[iip1]) * temp1;
zz[0] = z__[iim1] * z__[iim1];
if (dpsi < temp1) {
latime_1.ops += 2.f;
zz[2] = dtiip * dtiip * dphi;
} else {
latime_1.ops += 4.f;
zz[2] = dtiip * dtiip * (dpsi - temp1 + dphi);
}
} else {
temp1 = z__[iip1] / dtiip;
temp1 *= temp1;
c__ = temp - dtiim * (dpsi + dphi) - (d__[iip1] - d__[iim1]) *
(d__[iim1] + d__[iip1]) * temp1;
if (dphi < temp1) {
latime_1.ops += 2.f;
zz[0] = dtiim * dtiim * dpsi;
} else {
latime_1.ops += 4.f;
zz[0] = dtiim * dtiim * (dpsi + (dphi - temp1));
}
zz[2] = z__[iip1] * z__[iip1];
}
latime_1.ops += 2.f;
zz[1] = z__[ii] * z__[ii];
dd[0] = dtiim;
dd[1] = delta[ii] * work[ii];
dd[2] = dtiip;
slaed6_(&niter, &orgati, &c__, dd, zz, &w, &eta, info);
if (*info != 0) {
goto L240;
}
}
/* Note, eta should be positive if w is negative, and
eta should be negative otherwise. However,
if for some reason caused by roundoff, eta*w > 0,
we simply use one Newton step instead. This way
will guarantee eta*w < 0. */
latime_1.ops += 1.f;
if (w * eta >= 0.f) {
latime_1.ops += 1.f;
eta = -w / dw;
}
latime_1.ops += 8.f;
if (orgati) {
temp1 = work[*i__] * delta[*i__];
temp = eta - temp1;
} else {
temp1 = work[ip1] * delta[ip1];
temp = eta - temp1;
}
if (temp > sg2ub || temp < sg2lb) {
latime_1.ops += 2.f;
if (w < 0.f) {
eta = (sg2ub - tau) / 2.f;
} else {
eta = (sg2lb - tau) / 2.f;
}
}
tau += eta;
eta /= *sigma + sqrt(*sigma * *sigma + eta);
prew = w;
latime_1.ops += (real) ((*n << 1) + 1);
*sigma += eta;
i__1 = *n;
for (j = 1; j <= i__1; ++j) {
work[j] += eta;
delta[j] -= eta;
/* L170: */
}
/* Evaluate PSI and the derivative DPSI */
dpsi = 0.f;
psi = 0.f;
erretm = 0.f;
latime_1.ops += (real) (iim1 * 7);
i__1 = iim1;
for (j = 1; j <= i__1; ++j) {
temp = z__[j] / (work[j] * delta[j]);
psi += z__[j] * temp;
dpsi += temp * temp;
erretm += psi;
/* L180: */
}
erretm = dabs(erretm);
/* Evaluate PHI and the derivative DPHI */
dphi = 0.f;
phi = 0.f;
latime_1.ops += (real) ((*n - iim1 + 1) * 7);
i__1 = iip1;
for (j = *n; j >= i__1; --j) {
temp = z__[j] / (work[j] * delta[j]);
phi += z__[j] * temp;
dphi += temp * temp;
erretm += phi;
/* L190: */
}
latime_1.ops += 19.f;
temp = z__[ii] / (work[ii] * delta[ii]);
dw = dpsi + dphi + temp * temp;
temp = z__[ii] * temp;
w = rhoinv + phi + psi + temp;
erretm = (phi - psi) * 8.f + erretm + rhoinv * 2.f + dabs(temp) * 3.f
+ dabs(tau) * dw;
if (w <= 0.f) {
sg2lb = dmax(sg2lb,tau);
} else {
sg2ub = dmin(sg2ub,tau);
}
swtch = FALSE_;
if (orgati) {
if (-w > dabs(prew) / 10.f) {
swtch = TRUE_;
}
} else {
if (w > dabs(prew) / 10.f) {
swtch = TRUE_;
}
}
/* Main loop to update the values of the array DELTA and WORK */
iter = niter + 1;
for (niter = iter; niter <= 20; ++niter) {
/* Test for convergence */
latime_1.ops += 1.f;
if (dabs(w) <= eps * erretm) {
goto L240;
}
/* Calculate the new step */
if (! swtch3) {
latime_1.ops += 2.f;
dtipsq = work[ip1] * delta[ip1];
dtisq = work[*i__] * delta[*i__];
if (! swtch) {
latime_1.ops += 6.f;
if (orgati) {
/* Computing 2nd power */
r__1 = z__[*i__] / dtisq;
c__ = w - dtipsq * dw + delsq * (r__1 * r__1);
} else {
/* Computing 2nd power */
r__1 = z__[ip1] / dtipsq;
c__ = w - dtisq * dw - delsq * (r__1 * r__1);
}
} else {
latime_1.ops += 8.f;
temp = z__[ii] / (work[ii] * delta[ii]);
if (orgati) {
dpsi += temp * temp;
} else {
dphi += temp * temp;
}
c__ = w - dtisq * dpsi - dtipsq * dphi;
}
latime_1.ops += 7.f;
a = (dtipsq + dtisq) * w - dtipsq * dtisq * dw;
b = dtipsq * dtisq * w;
if (c__ == 0.f) {
if (a == 0.f) {
latime_1.ops += 5.f;
if (! swtch) {
if (orgati) {
a = z__[*i__] * z__[*i__] + dtipsq * dtipsq *
(dpsi + dphi);
} else {
a = z__[ip1] * z__[ip1] + dtisq * dtisq * (
dpsi + dphi);
}
} else {
a = dtisq * dtisq * dpsi + dtipsq * dtipsq * dphi;
}
}
latime_1.ops += 1.f;
eta = b / a;
} else if (a <= 0.f) {
latime_1.ops += 8.f;
eta = (a - sqrt((r__1 = a * a - b * 4.f * c__, dabs(r__1))
)) / (c__ * 2.f);
} else {
latime_1.ops += 8.f;
eta = b * 2.f / (a + sqrt((r__1 = a * a - b * 4.f * c__,
dabs(r__1))));
}
} else {
/* Interpolation using THREE most relevant poles */
latime_1.ops += 4.f;
dtiim = work[iim1] * delta[iim1];
dtiip = work[iip1] * delta[iip1];
temp = rhoinv + psi + phi;
if (swtch) {
latime_1.ops += 8.f;
c__ = temp - dtiim * dpsi - dtiip * dphi;
zz[0] = dtiim * dtiim * dpsi;
zz[2] = dtiip * dtiip * dphi;
} else {
if (orgati) {
latime_1.ops += 11.f;
temp1 = z__[iim1] / dtiim;
temp1 *= temp1;
temp2 = (d__[iim1] - d__[iip1]) * (d__[iim1] + d__[
iip1]) * temp1;
c__ = temp - dtiip * (dpsi + dphi) - temp2;
zz[0] = z__[iim1] * z__[iim1];
if (dpsi < temp1) {
latime_1.ops += 2.f;
zz[2] = dtiip * dtiip * dphi;
} else {
latime_1.ops += 4.f;
zz[2] = dtiip * dtiip * (dpsi - temp1 + dphi);
}
} else {
latime_1.ops += 10.f;
temp1 = z__[iip1] / dtiip;
temp1 *= temp1;
temp2 = (d__[iip1] - d__[iim1]) * (d__[iim1] + d__[
iip1]) * temp1;
c__ = temp - dtiim * (dpsi + dphi) - temp2;
if (dphi < temp1) {
latime_1.ops += 2.f;
zz[0] = dtiim * dtiim * dpsi;
} else {
latime_1.ops += 4.f;
zz[0] = dtiim * dtiim * (dpsi + (dphi - temp1));
}
latime_1.ops += 1.f;
zz[2] = z__[iip1] * z__[iip1];
}
}
latime_1.ops += 1.f;
dd[0] = dtiim;
dd[1] = delta[ii] * work[ii];
dd[2] = dtiip;
slaed6_(&niter, &orgati, &c__, dd, zz, &w, &eta, info);
if (*info != 0) {
goto L240;
}
}
/* Note, eta should be positive if w is negative, and
eta should be negative otherwise. However,
if for some reason caused by roundoff, eta*w > 0,
we simply use one Newton step instead. This way
will guarantee eta*w < 0. */
latime_1.ops += 1.f;
if (w * eta >= 0.f) {
latime_1.ops += 1.f;
eta = -w / dw;
}
latime_1.ops += 2.f;
if (orgati) {
temp1 = work[*i__] * delta[*i__];
temp = eta - temp1;
} else {
temp1 = work[ip1] * delta[ip1];
temp = eta - temp1;
}
if (temp > sg2ub || temp < sg2lb) {
latime_1.ops += 2.f;
if (w < 0.f) {
eta = (sg2ub - tau) / 2.f;
} else {
eta = (sg2lb - tau) / 2.f;
}
}
latime_1.ops += 6.f;
tau += eta;
eta /= *sigma + sqrt(*sigma * *sigma + eta);
latime_1.ops += (real) ((*n << 1) + 1);
*sigma += eta;
i__1 = *n;
for (j = 1; j <= i__1; ++j) {
work[j] += eta;
delta[j] -= eta;
/* L200: */
}
prew = w;
/* Evaluate PSI and the derivative DPSI */
dpsi = 0.f;
psi = 0.f;
erretm = 0.f;
latime_1.ops += (real) (iim1 * 7);
i__1 = iim1;
for (j = 1; j <= i__1; ++j) {
temp = z__[j] / (work[j] * delta[j]);
psi += z__[j] * temp;
dpsi += temp * temp;
erretm += psi;
/* L210: */
}
erretm = dabs(erretm);
/* Evaluate PHI and the derivative DPHI */
dphi = 0.f;
phi = 0.f;
latime_1.ops += (real) ((iim1 - *n + 1) * 7);
i__1 = iip1;
for (j = *n; j >= i__1; --j) {
temp = z__[j] / (work[j] * delta[j]);
phi += z__[j] * temp;
dphi += temp * temp;
erretm += phi;
/* L220: */
}
latime_1.ops += 19.f;
temp = z__[ii] / (work[ii] * delta[ii]);
dw = dpsi + dphi + temp * temp;
temp = z__[ii] * temp;
w = rhoinv + phi + psi + temp;
erretm = (phi - psi) * 8.f + erretm + rhoinv * 2.f + dabs(temp) *
3.f + dabs(tau) * dw;
if (w * prew > 0.f && dabs(w) > dabs(prew) / 10.f) {
swtch = ! swtch;
}
if (w <= 0.f) {
sg2lb = dmax(sg2lb,tau);
} else {
sg2ub = dmin(sg2ub,tau);
}
/* L230: */
}
/* Return with INFO = 1, NITER = MAXIT and not converged */
*info = 1;
}
L240:
return 0;
/* End of SLASD4 */
} /* slasd4_ */
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?