📄 dtgevc.c
字号:
scale = 1.;
if (acoefa * ulp < safmin && acoefa >= safmin) {
scale = safmin / ulp / acoefa;
}
if (bcoefa * ulp < safmin && bcoefa >= safmin) {
/* Computing MAX */
d__1 = scale, d__2 = safmin / ulp / bcoefa;
scale = max(d__1,d__2);
}
if (safmin * acoefa > ascale) {
scale = ascale / (safmin * acoefa);
}
if (safmin * bcoefa > bscale) {
/* Computing MIN */
d__1 = scale, d__2 = bscale / (safmin * bcoefa);
scale = min(d__1,d__2);
}
if (scale != 1.) {
acoef = scale * acoef;
acoefa = abs(acoef);
bcoefr = scale * bcoefr;
bcoefi = scale * bcoefi;
bcoefa = abs(bcoefr) + abs(bcoefi);
}
/* Compute first two components of eigenvector
and contribution to sums */
temp = acoef * a_ref(je, je - 1);
temp2r = acoef * a_ref(je, je) - bcoefr * b_ref(je, je);
temp2i = -bcoefi * b_ref(je, je);
if (abs(temp) >= abs(temp2r) + abs(temp2i)) {
work[(*n << 1) + je] = 1.;
work[*n * 3 + je] = 0.;
work[(*n << 1) + je - 1] = -temp2r / temp;
work[*n * 3 + je - 1] = -temp2i / temp;
} else {
work[(*n << 1) + je - 1] = 1.;
work[*n * 3 + je - 1] = 0.;
temp = acoef * a_ref(je - 1, je);
work[(*n << 1) + je] = (bcoefr * b_ref(je - 1, je - 1) -
acoef * a_ref(je - 1, je - 1)) / temp;
work[*n * 3 + je] = bcoefi * b_ref(je - 1, je - 1) / temp;
}
/* Computing MAX */
d__5 = (d__1 = work[(*n << 1) + je], abs(d__1)) + (d__2 =
work[*n * 3 + je], abs(d__2)), d__6 = (d__3 = work[(*
n << 1) + je - 1], abs(d__3)) + (d__4 = work[*n * 3 +
je - 1], abs(d__4));
xmax = max(d__5,d__6);
/* Compute contribution from columns JE and JE-1
of A and B to the sums. */
creala = acoef * work[(*n << 1) + je - 1];
cimaga = acoef * work[*n * 3 + je - 1];
crealb = bcoefr * work[(*n << 1) + je - 1] - bcoefi * work[*n
* 3 + je - 1];
cimagb = bcoefi * work[(*n << 1) + je - 1] + bcoefr * work[*n
* 3 + je - 1];
cre2a = acoef * work[(*n << 1) + je];
cim2a = acoef * work[*n * 3 + je];
cre2b = bcoefr * work[(*n << 1) + je] - bcoefi * work[*n * 3
+ je];
cim2b = bcoefi * work[(*n << 1) + je] + bcoefr * work[*n * 3
+ je];
i__1 = je - 2;
for (jr = 1; jr <= i__1; ++jr) {
work[(*n << 1) + jr] = -creala * a_ref(jr, je - 1) +
crealb * b_ref(jr, je - 1) - cre2a * a_ref(jr, je)
+ cre2b * b_ref(jr, je);
work[*n * 3 + jr] = -cimaga * a_ref(jr, je - 1) + cimagb *
b_ref(jr, je - 1) - cim2a * a_ref(jr, je) +
cim2b * b_ref(jr, je);
/* L270: */
}
}
/* Computing MAX */
d__1 = ulp * acoefa * anorm, d__2 = ulp * bcoefa * bnorm, d__1 =
max(d__1,d__2);
dmin__ = max(d__1,safmin);
/* Columnwise triangular solve of (a A - b B) x = 0 */
il2by2 = FALSE_;
/* ------------------- Begin Timing Code ---------------------- */
opst = 0.;
in2by2 = 0;
/* -------------------- End Timing Code ----------------------- */
for (j = je - nw; j >= 1; --j) {
/* ------------------- Begin Timing Code ------------------- */
opssca = (doublereal) (nw * je + 1);
/* -------------------- End Timing Code --------------------
If a 2-by-2 block is in position j-1:j, wait until the
next iteration to process it (when it will be j:j+1) */
if (! il2by2 && j > 1) {
if (a_ref(j, j - 1) != 0.) {
il2by2 = TRUE_;
/* -------------- Begin Timing Code ----------------- */
++in2by2;
/* --------------- End Timing Code ------------------- */
goto L370;
}
}
bdiag[0] = b_ref(j, j);
if (il2by2) {
na = 2;
bdiag[1] = b_ref(j + 1, j + 1);
} else {
na = 1;
}
/* Compute x(j) (and x(j+1), if 2-by-2 block) */
dlaln2_(&c_false, &na, &nw, &dmin__, &acoef, &a_ref(j, j),
lda, bdiag, &bdiag[1], &work[(*n << 1) + j], n, &
bcoefr, &bcoefi, sum, &c__2, &scale, &temp, &iinfo);
if (scale < 1.) {
i__1 = nw - 1;
for (jw = 0; jw <= i__1; ++jw) {
i__2 = je;
for (jr = 1; jr <= i__2; ++jr) {
work[(jw + 2) * *n + jr] = scale * work[(jw + 2) *
*n + jr];
/* L280: */
}
/* L290: */
}
}
/* Computing MAX */
d__1 = scale * xmax;
xmax = max(d__1,temp);
/* ------------------ Begin Timing Code ----------------- */
opst += opssca;
/* ------------------- End Timing Code ------------------ */
i__1 = nw;
for (jw = 1; jw <= i__1; ++jw) {
i__2 = na;
for (ja = 1; ja <= i__2; ++ja) {
work[(jw + 1) * *n + j + ja - 1] = sum_ref(ja, jw);
/* L300: */
}
/* L310: */
}
/* w = w + x(j)*(a A(*,j) - b B(*,j) ) with scaling */
if (j > 1) {
/* Check whether scaling is necessary for sum. */
xscale = 1. / max(1.,xmax);
temp = acoefa * work[j] + bcoefa * work[*n + j];
if (il2by2) {
/* Computing MAX */
d__1 = temp, d__2 = acoefa * work[j + 1] + bcoefa *
work[*n + j + 1];
temp = max(d__1,d__2);
}
/* Computing MAX */
d__1 = max(temp,acoefa);
temp = max(d__1,bcoefa);
if (temp > bignum * xscale) {
i__1 = nw - 1;
for (jw = 0; jw <= i__1; ++jw) {
i__2 = je;
for (jr = 1; jr <= i__2; ++jr) {
work[(jw + 2) * *n + jr] = xscale * work[(jw
+ 2) * *n + jr];
/* L320: */
}
/* L330: */
}
xmax *= xscale;
/* ----------------- Begin Timing Code --------------- */
opst += opssca;
/* ------------------ End Timing Code ---------------- */
}
/* Compute the contributions of the off-diagonals of
column j (and j+1, if 2-by-2 block) of A and B to the
sums. */
i__1 = na;
for (ja = 1; ja <= i__1; ++ja) {
if (ilcplx) {
creala = acoef * work[(*n << 1) + j + ja - 1];
cimaga = acoef * work[*n * 3 + j + ja - 1];
crealb = bcoefr * work[(*n << 1) + j + ja - 1] -
bcoefi * work[*n * 3 + j + ja - 1];
cimagb = bcoefi * work[(*n << 1) + j + ja - 1] +
bcoefr * work[*n * 3 + j + ja - 1];
i__2 = j - 1;
for (jr = 1; jr <= i__2; ++jr) {
work[(*n << 1) + jr] = work[(*n << 1) + jr] -
creala * a_ref(jr, j + ja - 1) +
crealb * b_ref(jr, j + ja - 1);
work[*n * 3 + jr] = work[*n * 3 + jr] -
cimaga * a_ref(jr, j + ja - 1) +
cimagb * b_ref(jr, j + ja - 1);
/* L340: */
}
} else {
creala = acoef * work[(*n << 1) + j + ja - 1];
crealb = bcoefr * work[(*n << 1) + j + ja - 1];
i__2 = j - 1;
for (jr = 1; jr <= i__2; ++jr) {
work[(*n << 1) + jr] = work[(*n << 1) + jr] -
creala * a_ref(jr, j + ja - 1) +
crealb * b_ref(jr, j + ja - 1);
/* L350: */
}
}
/* L360: */
}
}
il2by2 = FALSE_;
L370:
;
}
/* Copy eigenvector to VR, back transforming if
HOWMNY='B'. */
ieig -= nw;
if (ilback) {
i__1 = nw - 1;
for (jw = 0; jw <= i__1; ++jw) {
i__2 = *n;
for (jr = 1; jr <= i__2; ++jr) {
work[(jw + 4) * *n + jr] = work[(jw + 2) * *n + 1] *
vr_ref(jr, 1);
/* L380: */
}
/* A series of compiler directives to defeat
vectorization for the next loop */
i__2 = je;
for (jc = 2; jc <= i__2; ++jc) {
i__3 = *n;
for (jr = 1; jr <= i__3; ++jr) {
work[(jw + 4) * *n + jr] += work[(jw + 2) * *n +
jc] * vr_ref(jr, jc);
/* L390: */
}
/* L400: */
}
/* L410: */
}
i__1 = nw - 1;
for (jw = 0; jw <= i__1; ++jw) {
i__2 = *n;
for (jr = 1; jr <= i__2; ++jr) {
vr_ref(jr, ieig + jw) = work[(jw + 4) * *n + jr];
/* L420: */
}
/* L430: */
}
iend = *n;
} else {
i__1 = nw - 1;
for (jw = 0; jw <= i__1; ++jw) {
i__2 = *n;
for (jr = 1; jr <= i__2; ++jr) {
vr_ref(jr, ieig + jw) = work[(jw + 2) * *n + jr];
/* L440: */
}
/* L450: */
}
iend = je;
}
/* Scale eigenvector */
xmax = 0.;
if (ilcplx) {
i__1 = iend;
for (j = 1; j <= i__1; ++j) {
/* Computing MAX */
d__3 = xmax, d__4 = (d__1 = vr_ref(j, ieig), abs(d__1)) +
(d__2 = vr_ref(j, ieig + 1), abs(d__2));
xmax = max(d__3,d__4);
/* L460: */
}
} else {
i__1 = iend;
for (j = 1; j <= i__1; ++j) {
/* Computing MAX */
d__2 = xmax, d__3 = (d__1 = vr_ref(j, ieig), abs(d__1));
xmax = max(d__2,d__3);
/* L470: */
}
}
if (xmax > safmin) {
xscale = 1. / xmax;
i__1 = nw - 1;
for (jw = 0; jw <= i__1; ++jw) {
i__2 = iend;
for (jr = 1; jr <= i__2; ++jr) {
vr_ref(jr, ieig + jw) = xscale * vr_ref(jr, ieig + jw)
;
/* L480: */
}
/* L490: */
}
}
/* ------------------- Begin Timing Code ----------------------
Opcounts for each eigenvector
Real Complex
Initialization 8--16 + 3*(JE-1) 71--87+16+14*(JE-2)
Solve (per iter) NA*(5 + 7*(NA-1)) NA*(17 + 17*(NA-1))
+ scaling + scaling
column add (per iter)
2 + 5*NA 2 + 11*NA
+ 4*NA*(J-1) + 8*NA*(J-1)
+ scaling + scaling
iteration: J=JE-1,...,1 J=JE-2,...,1
Back xform 2*N*JE - N 4*N*JE - 2*N
Scaling (w/back x.) N 3*N
Scaling (w/o back) JE 3*JE */
if (! ilcplx) {
opst += (doublereal) (((je << 1) + 11) * (je - 1) + 12 + (
in2by2 << 3));
if (ilback) {
opst += (doublereal) ((*n << 1) * je);
} else {
opst += (doublereal) je;
}
} else {
opst += (doublereal) (((je << 2) + 32) * (je - 2) + 95 +
in2by2 * 24);
if (ilback) {
opst += (doublereal) ((*n << 2) * je + *n);
} else {
opst += (doublereal) (je * 3);
}
}
latime_1.ops += opst;
/* -------------------- End Timing Code ----------------------- */
L500:
;
}
}
return 0;
/* End of DTGEVC */
} /* dtgevc_ */
/* Remove the helper macros once the routine above has ended, so the
   names are no longer defined for any code that follows in this
   translation unit.  a_ref, b_ref, vr_ref and sum_ref are used above as
   two-argument (row, column) element accessors; vl_ref, suma_ref and
   sumb_ref are not used in the visible part of the routine.
   NOTE(review): the matching #define lines are outside this view;
   confirm every name undefined here is actually defined earlier. */
#undef sum_ref
#undef vr_ref
#undef vl_ref
#undef b_ref
#undef a_ref
#undef sumb_ref
#undef suma_ref
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -