dtgsyl.c
来自「InsightToolkit-1.4.0(有大量的优化算法程序)」· C语言 代码 · 共 583 行 · 第 1/2 页
C
583 行
work[1] = (doublereal) lwmin;
}
if (*info != 0) {
i__1 = -(*info);
xerbla_("DTGSYL", &i__1);
return;
} else if (lquery) {
return;
}
/* Determine optimal block sizes MB and NB */
mb = ilaenv_(&c__2, "DTGSYL", trans, m, n, &c_n1, &c_n1);
nb = ilaenv_(&c__5, "DTGSYL", trans, m, n, &c_n1, &c_n1);
isolve = 1;
ifunc = 0;
if (*ijob >= 3 && notran) {
ifunc = *ijob - 2;
for (j = 1; j <= *n; ++j) {
dcopy_(m, &c_b14, &c__0, &c[j * c_dim1 + 1], &c__1);
dcopy_(m, &c_b14, &c__0, &f[j * f_dim1 + 1], &c__1);
}
} else if (*ijob >= 1 && notran) {
isolve = 2;
}
if ((mb <= 1 && nb <= 1) || (mb >= *m && nb >= *n)) {
for (iround = 1; iround <= isolve; ++iround) {
/* Use unblocked Level 2 solver */
dscale = 0.;
dsum = 1.;
pq = 0;
dtgsy2_(trans, &ifunc, m, n, &a[a_offset], lda, &b[b_offset], ldb,
&c[c_offset], ldc, &d[d_offset], ldd, &e[e_offset],
lde, &f[f_offset], ldf, scale, &dsum, &dscale, &iwork[1],
&pq, info);
if (dscale != 0.) {
if (*ijob == 1 || *ijob == 3) {
*dif = sqrt((doublereal) ((*m << 1) * *n)) / (dscale * sqrt(dsum));
} else {
*dif = sqrt((doublereal) pq) / (dscale * sqrt(dsum));
}
}
if (isolve == 2 && iround == 1) {
ifunc = *ijob;
scale2 = *scale;
dlacpy_("F", m, n, &c[c_offset], ldc, &work[1], m);
dlacpy_("F", m, n, &f[f_offset], ldf, &work[*m * *n + 1], m);
for (j = 1; j <= *n; ++j) {
dcopy_(m, &c_b14, &c__0, &c[j * c_dim1 + 1], &c__1);
dcopy_(m, &c_b14, &c__0, &f[j * f_dim1 + 1], &c__1);
}
} else if (isolve == 2 && iround == 2) {
dlacpy_("F", m, n, &work[1], m, &c[c_offset], ldc);
dlacpy_("F", m, n, &work[*m * *n + 1], m, &f[f_offset], ldf);
*scale = scale2;
}
}
return;
}
/* Determine block structure of A */
p = 0;
i = 1;
L40:
if (i > *m) {
goto L50;
}
++p;
iwork[p] = i;
i += mb;
if (i >= *m) {
goto L50;
}
if (a[i + (i - 1) * a_dim1] != 0.) {
++i;
}
goto L40;
L50:
iwork[p + 1] = *m + 1;
if (iwork[p] == iwork[p + 1]) {
--p;
}
/* Determine block structure of B */
q = p + 1;
j = 1;
L60:
if (j > *n) {
goto L70;
}
++q;
iwork[q] = j;
j += nb;
if (j >= *n) {
goto L70;
}
if (b[j + (j - 1) * b_dim1] != 0.) {
++j;
}
goto L60;
L70:
iwork[q + 1] = *n + 1;
if (iwork[q] == iwork[q + 1]) {
--q;
}
if (notran) {
for (iround = 1; iround <= isolve; ++iround) {
/* Solve (I, J)-subsystem */
/* A(I, I) * R(I, J) - L(I, J) * B(J, J) = C(I, J) */
/* D(I, I) * R(I, J) - L(I, J) * E(J, J) = F(I, J) */
/* for I = P, P - 1,..., 1; J = 1, 2,..., Q */
dscale = 0.;
dsum = 1.;
pq = 0;
*scale = 1.;
for (j = p + 2; j <= q; ++j) {
js = iwork[j];
je = iwork[j + 1] - 1;
nb = je - js + 1;
for (i = p; i >= 1; --i) {
is = iwork[i];
ie = iwork[i + 1] - 1;
mb = ie - is + 1;
ppqq = 0;
dtgsy2_(trans, &ifunc, &mb, &nb, &a[is + is * a_dim1], lda,
&b[js + js * b_dim1], ldb, &c[is + js * c_dim1], ldc,
&d[is + is * d_dim1], ldd, &e[js + js * e_dim1], lde,
&f[is + js * f_dim1], ldf, &scaloc, &dsum, &dscale,
&iwork[q + 2], &ppqq, &linfo);
if (linfo > 0) {
*info = linfo;
}
pq += ppqq;
if (scaloc != 1.) {
for (k = 1; k < js; ++k) {
dscal_(m, &scaloc, &c[k * c_dim1 + 1], &c__1);
dscal_(m, &scaloc, &f[k * f_dim1 + 1], &c__1);
}
for (k = js; k <= je; ++k) {
i__1 = is - 1;
dscal_(&i__1, &scaloc, &c[k * c_dim1 + 1], &c__1);
i__1 = is - 1;
dscal_(&i__1, &scaloc, &f[k * f_dim1 + 1], &c__1);
}
for (k = js; k <= je; ++k) {
i__1 = *m - ie;
dscal_(&i__1, &scaloc, &c[ie + 1 + k * c_dim1], &c__1);
i__1 = *m - ie;
dscal_(&i__1, &scaloc, &f[ie + 1 + k * f_dim1], &c__1);
}
for (k = je + 1; k <= *n; ++k) {
dscal_(m, &scaloc, &c[k * c_dim1 + 1], &c__1);
dscal_(m, &scaloc, &f[k * f_dim1 + 1], &c__1);
}
*scale *= scaloc;
}
/* Substitute R(I, J) and L(I, J) into remaining */
/* equation. */
if (i > 1) {
i__1 = is - 1;
dgemm_("N", "N", &i__1, &nb, &mb, &c_b53, &a[is * a_dim1 + 1], lda,
&c[is + js * c_dim1], ldc, &c_b54, &c[js * c_dim1 + 1], ldc);
i__1 = is - 1;
dgemm_("N", "N", &i__1, &nb, &mb, &c_b53, &d[is * d_dim1 + 1], ldd,
&c[is + js * c_dim1], ldc, &c_b54, &f[js * f_dim1 + 1], ldf);
}
if (j < q) {
i__1 = *n - je;
dgemm_("N", "N", &mb, &i__1, &nb, &c_b54, &f[is + js * f_dim1], ldf,
&b[js + (je + 1) * b_dim1], ldb, &c_b54, &c[is + (je + 1) * c_dim1], ldc);
i__1 = *n - je;
dgemm_("N", "N", &mb, &i__1, &nb, &c_b54, &f[is + js * f_dim1], ldf,
&e[js + (je + 1) * e_dim1], lde, &c_b54, &f[is + (je + 1) * f_dim1], ldf);
}
}
}
if (dscale != 0.) {
if (*ijob == 1 || *ijob == 3) {
*dif = sqrt((doublereal) ((*m << 1) * *n)) / (dscale * sqrt(dsum));
} else {
*dif = sqrt((doublereal) pq) / (dscale * sqrt(dsum));
}
}
if (isolve == 2 && iround == 1) {
ifunc = *ijob;
scale2 = *scale;
dlacpy_("F", m, n, &c[c_offset], ldc, &work[1], m);
dlacpy_("F", m, n, &f[f_offset], ldf, &work[*m * *n + 1], m);
for (j = 1; j <= *n; ++j) {
dcopy_(m, &c_b14, &c__0, &c[j * c_dim1 + 1], &c__1);
dcopy_(m, &c_b14, &c__0, &f[j * f_dim1 + 1], &c__1);
}
} else if (isolve == 2 && iround == 2) {
dlacpy_("F", m, n, &work[1], m, &c[c_offset], ldc);
dlacpy_("F", m, n, &work[*m * *n + 1], m, &f[f_offset], ldf);
*scale = scale2;
}
}
} else {
/* Solve transposed (I, J)-subsystem */
/* A(I, I)' * R(I, J) + D(I, I)' * L(I, J) = C(I, J) */
/* R(I, J) * B(J, J)' + L(I, J) * E(J, J)' = -F(I, J) */
/* for I = 1,2,..., P; J = Q, Q-1,..., 1 */
*scale = 1.;
for (i = 1; i <= p; ++i) {
is = iwork[i];
ie = iwork[i + 1] - 1;
mb = ie - is + 1;
for (j = q; j >= p + 2; --j) {
js = iwork[j];
je = iwork[j + 1] - 1;
nb = je - js + 1;
dtgsy2_(trans, &ifunc, &mb, &nb, &a[is + is * a_dim1], lda,
&b[js + js * b_dim1], ldb, &c[is + js * c_dim1], ldc,
&d[is + is * d_dim1], ldd, &e[js + js * e_dim1], lde,
&f[is + js * f_dim1], ldf, &scaloc, &dsum, &dscale, &iwork[q + 2], &ppqq, &linfo);
if (linfo > 0) {
*info = linfo;
}
if (scaloc != 1.) {
for (k = 1; k < js; ++k) {
dscal_(m, &scaloc, &c[k * c_dim1 + 1], &c__1);
dscal_(m, &scaloc, &f[k * f_dim1 + 1], &c__1);
}
for (k = js; k <= je; ++k) {
i__1 = is - 1;
dscal_(&i__1, &scaloc, &c[k * c_dim1 + 1], &c__1);
i__1 = is - 1;
dscal_(&i__1, &scaloc, &f[k * f_dim1 + 1], &c__1);
}
for (k = js; k <= je; ++k) {
i__1 = *m - ie;
dscal_(&i__1, &scaloc, &c[ie + 1 + k * c_dim1], &c__1);
i__1 = *m - ie;
dscal_(&i__1, &scaloc, &f[ie + 1 + k * f_dim1], &c__1);
}
for (k = je + 1; k <= *n; ++k) {
dscal_(m, &scaloc, &c[k * c_dim1 + 1], &c__1);
dscal_(m, &scaloc, &f[k * f_dim1 + 1], &c__1);
}
*scale *= scaloc;
}
/* Substitute R(I, J) and L(I, J) into remaining equation. */
if (j > p + 2) {
i__1 = js - 1;
dgemm_("N", "T", &mb, &i__1, &nb, &c_b54, &c[is + js * c_dim1], ldc,
&b[js * b_dim1 + 1], ldb, &c_b54, &f[is + f_dim1], ldf);
i__1 = js - 1;
dgemm_("N", "T", &mb, &i__1, &nb, &c_b54, &f[is + js * f_dim1], ldf,
&e[js * e_dim1 + 1], lde, &c_b54, &f[is + f_dim1], ldf);
}
if (i < p) {
i__1 = *m - ie;
dgemm_("T", "N", &i__1, &nb, &mb, &c_b53, &a[is + (ie + 1) * a_dim1], lda,
&c[is + js * c_dim1], ldc, &c_b54, &c[ie + 1 + js * c_dim1], ldc);
i__1 = *m - ie;
dgemm_("T", "N", &i__1, &nb, &mb, &c_b53, &d[is + (ie + 1) * d_dim1], ldd,
&f[is + js * f_dim1], ldf, &c_b54, &c[ie + 1 + js * c_dim1], ldc);
}
}
}
}
work[1] = (doublereal) lwmin;
} /* dtgsyl_ */
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?