zgemm.c
来自「算断裂的」· C语言 代码 · 共 698 行 · 第 1/2 页
C
698 行
d_cnjg(&z__3, &A(l,i));
i__4 = l + j * b_dim1;
z__2.r = z__3.r * B(l,j).r - z__3.i * B(l,j).i,
z__2.i = z__3.r * B(l,j).i + z__3.i * B(l,j)
.r;
z__1.r = temp.r + z__2.r, z__1.i = temp.i + z__2.i;
temp.r = z__1.r, temp.i = z__1.i;
/* L100: */
}
if (beta->r == 0. && beta->i == 0.) {
i__3 = i + j * c_dim1;
z__1.r = alpha->r * temp.r - alpha->i * temp.i,
z__1.i = alpha->r * temp.i + alpha->i *
temp.r;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
} else {
i__3 = i + j * c_dim1;
z__2.r = alpha->r * temp.r - alpha->i * temp.i,
z__2.i = alpha->r * temp.i + alpha->i *
temp.r;
i__4 = i + j * c_dim1;
z__3.r = beta->r * C(i,j).r - beta->i * C(i,j).i,
z__3.i = beta->r * C(i,j).i + beta->i * C(i,j).r;
z__1.r = z__2.r + z__3.r, z__1.i = z__2.i + z__3.i;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
}
/* L110: */
}
/* L120: */
}
} else {
/* Form C := alpha*A'*B + beta*C */
i__1 = *n;
for (j = 1; j <= *n; ++j) {
i__2 = *m;
for (i = 1; i <= *m; ++i) {
temp.r = 0., temp.i = 0.;
i__3 = *k;
for (l = 1; l <= *k; ++l) {
i__4 = l + i * a_dim1;
i__5 = l + j * b_dim1;
z__2.r = A(l,i).r * B(l,j).r - A(l,i).i * B(l,j)
.i, z__2.i = A(l,i).r * B(l,j).i + A(l,i)
.i * B(l,j).r;
z__1.r = temp.r + z__2.r, z__1.i = temp.i + z__2.i;
temp.r = z__1.r, temp.i = z__1.i;
/* L130: */
}
if (beta->r == 0. && beta->i == 0.) {
i__3 = i + j * c_dim1;
z__1.r = alpha->r * temp.r - alpha->i * temp.i,
z__1.i = alpha->r * temp.i + alpha->i *
temp.r;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
} else {
i__3 = i + j * c_dim1;
z__2.r = alpha->r * temp.r - alpha->i * temp.i,
z__2.i = alpha->r * temp.i + alpha->i *
temp.r;
i__4 = i + j * c_dim1;
z__3.r = beta->r * C(i,j).r - beta->i * C(i,j).i,
z__3.i = beta->r * C(i,j).i + beta->i * C(i,j).r;
z__1.r = z__2.r + z__3.r, z__1.i = z__2.i + z__3.i;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
}
/* L140: */
}
/* L150: */
}
}
} else if (nota) {
if (conjb) {
/* Form C := alpha*A*conjg( B' ) + beta*C. */
i__1 = *n;
for (j = 1; j <= *n; ++j) {
if (beta->r == 0. && beta->i == 0.) {
i__2 = *m;
for (i = 1; i <= *m; ++i) {
i__3 = i + j * c_dim1;
C(i,j).r = 0., C(i,j).i = 0.;
/* L160: */
}
} else if (beta->r != 1. || beta->i != 0.) {
i__2 = *m;
for (i = 1; i <= *m; ++i) {
i__3 = i + j * c_dim1;
i__4 = i + j * c_dim1;
z__1.r = beta->r * C(i,j).r - beta->i * C(i,j).i,
z__1.i = beta->r * C(i,j).i + beta->i * C(i,j).r;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
/* L170: */
}
}
i__2 = *k;
for (l = 1; l <= *k; ++l) {
i__3 = j + l * b_dim1;
if (B(j,l).r != 0. || B(j,l).i != 0.) {
d_cnjg(&z__2, &B(j,l));
z__1.r = alpha->r * z__2.r - alpha->i * z__2.i,
z__1.i = alpha->r * z__2.i + alpha->i *
z__2.r;
temp.r = z__1.r, temp.i = z__1.i;
i__3 = *m;
for (i = 1; i <= *m; ++i) {
i__4 = i + j * c_dim1;
i__5 = i + j * c_dim1;
i__6 = i + l * a_dim1;
z__2.r = temp.r * A(i,l).r - temp.i * A(i,l).i,
z__2.i = temp.r * A(i,l).i + temp.i * A(i,l).r;
z__1.r = C(i,j).r + z__2.r, z__1.i = C(i,j).i +
z__2.i;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
/* L180: */
}
}
/* L190: */
}
/* L200: */
}
} else {
/* Form C := alpha*A*B' + beta*C */
i__1 = *n;
for (j = 1; j <= *n; ++j) {
if (beta->r == 0. && beta->i == 0.) {
i__2 = *m;
for (i = 1; i <= *m; ++i) {
i__3 = i + j * c_dim1;
C(i,j).r = 0., C(i,j).i = 0.;
/* L210: */
}
} else if (beta->r != 1. || beta->i != 0.) {
i__2 = *m;
for (i = 1; i <= *m; ++i) {
i__3 = i + j * c_dim1;
i__4 = i + j * c_dim1;
z__1.r = beta->r * C(i,j).r - beta->i * C(i,j).i,
z__1.i = beta->r * C(i,j).i + beta->i * C(i,j).r;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
/* L220: */
}
}
i__2 = *k;
for (l = 1; l <= *k; ++l) {
i__3 = j + l * b_dim1;
if (B(j,l).r != 0. || B(j,l).i != 0.) {
i__3 = j + l * b_dim1;
z__1.r = alpha->r * B(j,l).r - alpha->i * B(j,l).i,
z__1.i = alpha->r * B(j,l).i + alpha->i * B(j,l).r;
temp.r = z__1.r, temp.i = z__1.i;
i__3 = *m;
for (i = 1; i <= *m; ++i) {
i__4 = i + j * c_dim1;
i__5 = i + j * c_dim1;
i__6 = i + l * a_dim1;
z__2.r = temp.r * A(i,l).r - temp.i * A(i,l).i,
z__2.i = temp.r * A(i,l).i + temp.i * A(i,l).r;
z__1.r = C(i,j).r + z__2.r, z__1.i = C(i,j).i +
z__2.i;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
/* L230: */
}
}
/* L240: */
}
/* L250: */
}
}
} else if (conja) {
if (conjb) {
/* Form C := alpha*conjg( A' )*conjg( B' ) + beta*C. */
i__1 = *n;
for (j = 1; j <= *n; ++j) {
i__2 = *m;
for (i = 1; i <= *m; ++i) {
temp.r = 0., temp.i = 0.;
i__3 = *k;
for (l = 1; l <= *k; ++l) {
d_cnjg(&z__3, &A(l,i));
d_cnjg(&z__4, &B(j,l));
z__2.r = z__3.r * z__4.r - z__3.i * z__4.i, z__2.i =
z__3.r * z__4.i + z__3.i * z__4.r;
z__1.r = temp.r + z__2.r, z__1.i = temp.i + z__2.i;
temp.r = z__1.r, temp.i = z__1.i;
/* L260: */
}
if (beta->r == 0. && beta->i == 0.) {
i__3 = i + j * c_dim1;
z__1.r = alpha->r * temp.r - alpha->i * temp.i,
z__1.i = alpha->r * temp.i + alpha->i *
temp.r;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
} else {
i__3 = i + j * c_dim1;
z__2.r = alpha->r * temp.r - alpha->i * temp.i,
z__2.i = alpha->r * temp.i + alpha->i *
temp.r;
i__4 = i + j * c_dim1;
z__3.r = beta->r * C(i,j).r - beta->i * C(i,j).i,
z__3.i = beta->r * C(i,j).i + beta->i * C(i,j).r;
z__1.r = z__2.r + z__3.r, z__1.i = z__2.i + z__3.i;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
}
/* L270: */
}
/* L280: */
}
} else {
/* Form C := alpha*conjg( A' )*B' + beta*C */
i__1 = *n;
for (j = 1; j <= *n; ++j) {
i__2 = *m;
for (i = 1; i <= *m; ++i) {
temp.r = 0., temp.i = 0.;
i__3 = *k;
for (l = 1; l <= *k; ++l) {
d_cnjg(&z__3, &A(l,i));
i__4 = j + l * b_dim1;
z__2.r = z__3.r * B(j,l).r - z__3.i * B(j,l).i,
z__2.i = z__3.r * B(j,l).i + z__3.i * B(j,l)
.r;
z__1.r = temp.r + z__2.r, z__1.i = temp.i + z__2.i;
temp.r = z__1.r, temp.i = z__1.i;
/* L290: */
}
if (beta->r == 0. && beta->i == 0.) {
i__3 = i + j * c_dim1;
z__1.r = alpha->r * temp.r - alpha->i * temp.i,
z__1.i = alpha->r * temp.i + alpha->i *
temp.r;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
} else {
i__3 = i + j * c_dim1;
z__2.r = alpha->r * temp.r - alpha->i * temp.i,
z__2.i = alpha->r * temp.i + alpha->i *
temp.r;
i__4 = i + j * c_dim1;
z__3.r = beta->r * C(i,j).r - beta->i * C(i,j).i,
z__3.i = beta->r * C(i,j).i + beta->i * C(i,j).r;
z__1.r = z__2.r + z__3.r, z__1.i = z__2.i + z__3.i;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
}
/* L300: */
}
/* L310: */
}
}
} else {
if (conjb) {
/* Form C := alpha*A'*conjg( B' ) + beta*C */
i__1 = *n;
for (j = 1; j <= *n; ++j) {
i__2 = *m;
for (i = 1; i <= *m; ++i) {
temp.r = 0., temp.i = 0.;
i__3 = *k;
for (l = 1; l <= *k; ++l) {
i__4 = l + i * a_dim1;
d_cnjg(&z__3, &B(j,l));
z__2.r = A(l,i).r * z__3.r - A(l,i).i * z__3.i,
z__2.i = A(l,i).r * z__3.i + A(l,i).i *
z__3.r;
z__1.r = temp.r + z__2.r, z__1.i = temp.i + z__2.i;
temp.r = z__1.r, temp.i = z__1.i;
/* L320: */
}
if (beta->r == 0. && beta->i == 0.) {
i__3 = i + j * c_dim1;
z__1.r = alpha->r * temp.r - alpha->i * temp.i,
z__1.i = alpha->r * temp.i + alpha->i *
temp.r;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
} else {
i__3 = i + j * c_dim1;
z__2.r = alpha->r * temp.r - alpha->i * temp.i,
z__2.i = alpha->r * temp.i + alpha->i *
temp.r;
i__4 = i + j * c_dim1;
z__3.r = beta->r * C(i,j).r - beta->i * C(i,j).i,
z__3.i = beta->r * C(i,j).i + beta->i * C(i,j).r;
z__1.r = z__2.r + z__3.r, z__1.i = z__2.i + z__3.i;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
}
/* L330: */
}
/* L340: */
}
} else {
/* Form C := alpha*A'*B' + beta*C */
i__1 = *n;
for (j = 1; j <= *n; ++j) {
i__2 = *m;
for (i = 1; i <= *m; ++i) {
temp.r = 0., temp.i = 0.;
i__3 = *k;
for (l = 1; l <= *k; ++l) {
i__4 = l + i * a_dim1;
i__5 = j + l * b_dim1;
z__2.r = A(l,i).r * B(j,l).r - A(l,i).i * B(j,l)
.i, z__2.i = A(l,i).r * B(j,l).i + A(l,i)
.i * B(j,l).r;
z__1.r = temp.r + z__2.r, z__1.i = temp.i + z__2.i;
temp.r = z__1.r, temp.i = z__1.i;
/* L350: */
}
if (beta->r == 0. && beta->i == 0.) {
i__3 = i + j * c_dim1;
z__1.r = alpha->r * temp.r - alpha->i * temp.i,
z__1.i = alpha->r * temp.i + alpha->i *
temp.r;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
} else {
i__3 = i + j * c_dim1;
z__2.r = alpha->r * temp.r - alpha->i * temp.i,
z__2.i = alpha->r * temp.i + alpha->i *
temp.r;
i__4 = i + j * c_dim1;
z__3.r = beta->r * C(i,j).r - beta->i * C(i,j).i,
z__3.i = beta->r * C(i,j).i + beta->i * C(i,j).r;
z__1.r = z__2.r + z__3.r, z__1.i = z__2.i + z__3.i;
C(i,j).r = z__1.r, C(i,j).i = z__1.i;
}
/* L360: */
}
/* L370: */
}
}
}
return 0;
/* End of ZGEMM . */
} /* zgemm_ */
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?