dtgsyl.c

来自「InsightToolkit-1.4.0(有大量的优化算法程序)」· C语言 代码 · 共 583 行 · 第 1/2 页

C
583
字号
        work[1] = (doublereal) lwmin;
    }

    if (*info != 0) {
        i__1 = -(*info);
        xerbla_("DTGSYL", &i__1);
        return;
    } else if (lquery) {
        return;
    }

/*     Determine optimal block sizes MB and NB */

    mb = ilaenv_(&c__2, "DTGSYL", trans, m, n, &c_n1, &c_n1);
    nb = ilaenv_(&c__5, "DTGSYL", trans, m, n, &c_n1, &c_n1);

    isolve = 1;
    ifunc = 0;
    if (*ijob >= 3 && notran) {
        ifunc = *ijob - 2;
        for (j = 1; j <= *n; ++j) {
            dcopy_(m, &c_b14, &c__0, &c[j * c_dim1 + 1], &c__1);
            dcopy_(m, &c_b14, &c__0, &f[j * f_dim1 + 1], &c__1);
        }
    } else if (*ijob >= 1 && notran) {
        isolve = 2;
    }

    if ((mb <= 1 && nb <= 1) || (mb >= *m && nb >= *n)) {

        for (iround = 1; iround <= isolve; ++iround) {

/*           Use unblocked Level 2 solver */

            dscale = 0.;
            dsum = 1.;
            pq = 0;
            dtgsy2_(trans, &ifunc, m, n, &a[a_offset], lda, &b[b_offset], ldb,
                    &c[c_offset], ldc, &d[d_offset], ldd, &e[e_offset],
                    lde, &f[f_offset], ldf, scale, &dsum, &dscale, &iwork[1],
                    &pq, info);
            if (dscale != 0.) {
                if (*ijob == 1 || *ijob == 3) {
                    *dif = sqrt((doublereal) ((*m << 1) * *n)) / (dscale * sqrt(dsum));
                } else {
                    *dif = sqrt((doublereal) pq) / (dscale * sqrt(dsum));
                }
            }

            if (isolve == 2 && iround == 1) {
                ifunc = *ijob;
                scale2 = *scale;
                dlacpy_("F", m, n, &c[c_offset], ldc, &work[1], m);
                dlacpy_("F", m, n, &f[f_offset], ldf, &work[*m * *n + 1], m);
                for (j = 1; j <= *n; ++j) {
                    dcopy_(m, &c_b14, &c__0, &c[j * c_dim1 + 1], &c__1);
                    dcopy_(m, &c_b14, &c__0, &f[j * f_dim1 + 1], &c__1);
                }
            } else if (isolve == 2 && iround == 2) {
                dlacpy_("F", m, n, &work[1], m, &c[c_offset], ldc);
                dlacpy_("F", m, n, &work[*m * *n + 1], m, &f[f_offset], ldf);
                *scale = scale2;
            }
        }

        return;
    }

/*     Determine block structure of A */

    p = 0;
    i = 1;
L40:
    if (i > *m) {
        goto L50;
    }
    ++p;
    iwork[p] = i;
    i += mb;
    if (i >= *m) {
        goto L50;
    }
    if (a[i + (i - 1) * a_dim1] != 0.) {
        ++i;
    }
    goto L40;
L50:

    iwork[p + 1] = *m + 1;
    if (iwork[p] == iwork[p + 1]) {
        --p;
    }

/*     Determine block structure of B */

    q = p + 1;
    j = 1;
L60:
    if (j > *n) {
        goto L70;
    }
    ++q;
    iwork[q] = j;
    j += nb;
    if (j >= *n) {
        goto L70;
    }
    if (b[j + (j - 1) * b_dim1] != 0.) {
        ++j;
    }
    goto L60;
L70:

    iwork[q + 1] = *n + 1;
    if (iwork[q] == iwork[q + 1]) {
        --q;
    }

    if (notran) {

        for (iround = 1; iround <= isolve; ++iround) {

/*           Solve (I, J)-subsystem */
/*               A(I, I) * R(I, J) - L(I, J) * B(J, J) = C(I, J) */
/*               D(I, I) * R(I, J) - L(I, J) * E(J, J) = F(I, J) */
/*           for I = P, P - 1,..., 1; J = 1, 2,..., Q */

            dscale = 0.;
            dsum = 1.;
            pq = 0;
            *scale = 1.;
            for (j = p + 2; j <= q; ++j) {
                js = iwork[j];
                je = iwork[j + 1] - 1;
                nb = je - js + 1;
                for (i = p; i >= 1; --i) {
                    is = iwork[i];
                    ie = iwork[i + 1] - 1;
                    mb = ie - is + 1;
                    ppqq = 0;
                    dtgsy2_(trans, &ifunc, &mb, &nb, &a[is + is * a_dim1], lda,
                            &b[js + js * b_dim1], ldb, &c[is + js * c_dim1], ldc,
                            &d[is + is * d_dim1], ldd, &e[js + js * e_dim1], lde,
                            &f[is + js * f_dim1], ldf, &scaloc, &dsum, &dscale,
                            &iwork[q + 2], &ppqq, &linfo);
                    if (linfo > 0) {
                        *info = linfo;
                    }

                    pq += ppqq;
                    if (scaloc != 1.) {
                        for (k = 1; k < js; ++k) {
                            dscal_(m, &scaloc, &c[k * c_dim1 + 1], &c__1);
                            dscal_(m, &scaloc, &f[k * f_dim1 + 1], &c__1);
                        }
                        for (k = js; k <= je; ++k) {
                            i__1 = is - 1;
                            dscal_(&i__1, &scaloc, &c[k * c_dim1 + 1], &c__1);
                            i__1 = is - 1;
                            dscal_(&i__1, &scaloc, &f[k * f_dim1 + 1], &c__1);
                        }
                        for (k = js; k <= je; ++k) {
                            i__1 = *m - ie;
                            dscal_(&i__1, &scaloc, &c[ie + 1 + k * c_dim1], &c__1);
                            i__1 = *m - ie;
                            dscal_(&i__1, &scaloc, &f[ie + 1 + k * f_dim1], &c__1);
                        }
                        for (k = je + 1; k <= *n; ++k) {
                            dscal_(m, &scaloc, &c[k * c_dim1 + 1], &c__1);
                            dscal_(m, &scaloc, &f[k * f_dim1 + 1], &c__1);
                        }
                        *scale *= scaloc;
                    }

/*                 Substitute R(I, J) and L(I, J) into remaining */
/*                 equation. */

                    if (i > 1) {
                        i__1 = is - 1;
                        dgemm_("N", "N", &i__1, &nb, &mb, &c_b53, &a[is * a_dim1 + 1], lda,
                               &c[is + js * c_dim1], ldc, &c_b54, &c[js * c_dim1 + 1], ldc);
                        i__1 = is - 1;
                        dgemm_("N", "N", &i__1, &nb, &mb, &c_b53, &d[is * d_dim1 + 1], ldd,
                               &c[is + js * c_dim1], ldc, &c_b54, &f[js * f_dim1 + 1], ldf);
                    }
                    if (j < q) {
                        i__1 = *n - je;
                        dgemm_("N", "N", &mb, &i__1, &nb, &c_b54, &f[is + js * f_dim1], ldf,
                               &b[js + (je + 1) * b_dim1], ldb, &c_b54, &c[is + (je + 1) * c_dim1], ldc);
                        i__1 = *n - je;
                        dgemm_("N", "N", &mb, &i__1, &nb, &c_b54, &f[is + js * f_dim1], ldf,
                               &e[js + (je + 1) * e_dim1], lde, &c_b54, &f[is + (je + 1) * f_dim1], ldf);
                    }
                }
            }
            if (dscale != 0.) {
                if (*ijob == 1 || *ijob == 3) {
                    *dif = sqrt((doublereal) ((*m << 1) * *n)) / (dscale * sqrt(dsum));
                } else {
                    *dif = sqrt((doublereal) pq) / (dscale * sqrt(dsum));
                }
            }
            if (isolve == 2 && iround == 1) {
                ifunc = *ijob;
                scale2 = *scale;
                dlacpy_("F", m, n, &c[c_offset], ldc, &work[1], m);
                dlacpy_("F", m, n, &f[f_offset], ldf, &work[*m * *n + 1], m);
                for (j = 1; j <= *n; ++j) {
                    dcopy_(m, &c_b14, &c__0, &c[j * c_dim1 + 1], &c__1);
                    dcopy_(m, &c_b14, &c__0, &f[j * f_dim1 + 1], &c__1);
                }
            } else if (isolve == 2 && iround == 2) {
                dlacpy_("F", m, n, &work[1], m, &c[c_offset], ldc);
                dlacpy_("F", m, n, &work[*m * *n + 1], m, &f[f_offset], ldf);
                *scale = scale2;
            }
        }

    } else {

/*        Solve transposed (I, J)-subsystem */
/*             A(I, I)' * R(I, J)  + D(I, I)' * L(I, J)  =  C(I, J) */
/*             R(I, J)  * B(J, J)' + L(I, J)  * E(J, J)' = -F(I, J) */
/*        for I = 1,2,..., P; J = Q, Q-1,..., 1 */

        *scale = 1.;
        for (i = 1; i <= p; ++i) {
            is = iwork[i];
            ie = iwork[i + 1] - 1;
            mb = ie - is + 1;
            for (j = q; j >= p + 2; --j) {
                js = iwork[j];
                je = iwork[j + 1] - 1;
                nb = je - js + 1;
                dtgsy2_(trans, &ifunc, &mb, &nb, &a[is + is * a_dim1], lda,
                        &b[js + js * b_dim1], ldb, &c[is + js * c_dim1], ldc,
                        &d[is + is * d_dim1], ldd, &e[js + js * e_dim1], lde,
                        &f[is + js * f_dim1], ldf, &scaloc, &dsum, &dscale, &iwork[q + 2], &ppqq, &linfo);
                if (linfo > 0) {
                    *info = linfo;
                }
                if (scaloc != 1.) {
                    for (k = 1; k < js; ++k) {
                        dscal_(m, &scaloc, &c[k * c_dim1 + 1], &c__1);
                        dscal_(m, &scaloc, &f[k * f_dim1 + 1], &c__1);
                    }
                    for (k = js; k <= je; ++k) {
                        i__1 = is - 1;
                        dscal_(&i__1, &scaloc, &c[k * c_dim1 + 1], &c__1);
                        i__1 = is - 1;
                        dscal_(&i__1, &scaloc, &f[k * f_dim1 + 1], &c__1);
                    }
                    for (k = js; k <= je; ++k) {
                        i__1 = *m - ie;
                        dscal_(&i__1, &scaloc, &c[ie + 1 + k * c_dim1], &c__1);
                        i__1 = *m - ie;
                        dscal_(&i__1, &scaloc, &f[ie + 1 + k * f_dim1], &c__1);
                    }
                    for (k = je + 1; k <= *n; ++k) {
                        dscal_(m, &scaloc, &c[k * c_dim1 + 1], &c__1);
                        dscal_(m, &scaloc, &f[k * f_dim1 + 1], &c__1);
                    }
                    *scale *= scaloc;
                }

/*              Substitute R(I, J) and L(I, J) into remaining equation. */

                if (j > p + 2) {
                    i__1 = js - 1;
                    dgemm_("N", "T", &mb, &i__1, &nb, &c_b54, &c[is + js * c_dim1], ldc,
                           &b[js * b_dim1 + 1], ldb, &c_b54, &f[is + f_dim1], ldf);
                    i__1 = js - 1;
                    dgemm_("N", "T", &mb, &i__1, &nb, &c_b54, &f[is + js * f_dim1], ldf,
                           &e[js * e_dim1 + 1], lde, &c_b54, &f[is + f_dim1], ldf);
                }
                if (i < p) {
                    i__1 = *m - ie;
                    dgemm_("T", "N", &i__1, &nb, &mb, &c_b53, &a[is + (ie + 1) * a_dim1], lda,
                           &c[is + js * c_dim1], ldc, &c_b54, &c[ie + 1 + js * c_dim1], ldc);
                    i__1 = *m - ie;
                    dgemm_("T", "N", &i__1, &nb, &mb, &c_b53, &d[is + (ie + 1) * d_dim1], ldd,
                           &f[is + js * f_dim1], ldf, &c_b54, &c[ie + 1 + js * c_dim1], ldc);
                }
            }
        }
    }

    work[1] = (doublereal) lwmin;

} /* dtgsyl_ */

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?