📄 q1_8.c
字号:
iio[WS(vs, 4) + WS(is, 5)] = FNMS(T7H, T7G, T7F * T7K); } { E T3O, T3S, T3N, T3P; T3O = T2H - T2O; T3S = T3Q - T3R; T3N = W[6]; T3P = W[7]; rio[WS(vs, 4) + WS(is, 2)] = FMA(T3N, T3O, T3P * T3S); iio[WS(vs, 4) + WS(is, 2)] = FNMS(T3P, T3O, T3N * T3S); } { E T3K, T3M, T3J, T3L; T3K = T3B + T3A; T3M = T3E + T3H; T3J = W[2]; T3L = W[3]; iio[WS(vs, 2) + WS(is, 2)] = FNMS(T3L, T3M, T3J * T3K); rio[WS(vs, 2) + WS(is, 2)] = FMA(T3L, T3K, T3J * T3M); } { E T7C, T7E, T7B, T7D; T7C = T7t + T7s; T7E = T7w + T7z; T7B = W[2]; T7D = W[3]; iio[WS(vs, 2) + WS(is, 5)] = FNMS(T7D, T7E, T7B * T7C); rio[WS(vs, 2) + WS(is, 5)] = FMA(T7D, T7C, T7B * T7E); } { E T6k, T6m, T6j, T6l; T6k = T6b + T6a; T6m = T6e + T6h; T6j = W[2]; T6l = W[3]; iio[WS(vs, 2) + WS(is, 4)] = FNMS(T6l, T6m, T6j * T6k); rio[WS(vs, 2) + WS(is, 4)] = FMA(T6l, T6k, T6j * T6m); } { E T52, T54, T51, T53; T52 = T4T + T4S; T54 = T4W + T4Z; T51 = W[2]; T53 = W[3]; iio[WS(vs, 2) + WS(is, 3)] = FNMS(T53, T54, T51 * T52); rio[WS(vs, 2) + WS(is, 3)] = FMA(T53, T52, T51 * T54); } { E T5G, T5S, T5Q, T5U, T5F, T5P; T5F = KP707106781 * (T5z - T5E); T5G = T5u - T5F; T5S = T5u + T5F; T5P = KP707106781 * (T5N - T5O); T5Q = T5M - T5P; T5U = T5M + T5P; { E T5p, T5H, T5R, T5T; T5p = W[12]; T5H = W[13]; iio[WS(vs, 7) + WS(is, 4)] = FNMS(T5H, T5Q, T5p * T5G); rio[WS(vs, 7) + WS(is, 4)] = FMA(T5H, T5G, T5p * T5Q); T5R = W[4]; T5T = W[5]; iio[WS(vs, 3) + WS(is, 4)] = FNMS(T5T, T5U, T5R * T5S); rio[WS(vs, 3) + WS(is, 4)] = FMA(T5T, T5S, T5R * T5U); } } { E Tw, TI, TG, TK, Tv, TF; Tv = KP707106781 * (Tp - Tu); Tw = Tk - Tv; TI = Tk + Tv; TF = KP707106781 * (TD - TE); TG = TC - TF; TK = TC + TF; { E Tf, Tx, TH, TJ; Tf = W[12]; Tx = W[13]; iio[WS(vs, 7)] = FNMS(Tx, TG, Tf * Tw); rio[WS(vs, 7)] = FMA(Tx, Tw, Tf * TG); TH = W[4]; TJ = W[5]; iio[WS(vs, 3)] = FNMS(TJ, TK, TH * TI); rio[WS(vs, 3)] = FMA(TJ, TI, TH * TK); } } { E T9Q, T9W, T9U, T9Y, T9P, T9T; T9P = KP707106781 * (T9w + T9r); T9Q = T9O - T9P; T9W = T9O + T9P; T9T = KP707106781 * (T9F + T9G); T9U = T9S - T9T; T9Y = T9S + T9T; { E T9N, T9R, T9V, T9X; T9N = W[8]; T9R = W[9]; rio[WS(vs, 5) + WS(is, 7)] = FMA(T9N, T9Q, T9R * T9U); iio[WS(vs, 5) + WS(is, 7)] = FNMS(T9R, T9Q, T9N * T9U); T9V = W[0]; T9X = W[1]; rio[WS(vs, 1) + WS(is, 7)] = FMA(T9V, T9W, T9X * T9Y); iio[WS(vs, 1) + WS(is, 7)] = FNMS(T9X, T9W, T9V * T9Y); } } { E T36, T3i, T3g, T3k, T35, T3f; T35 = KP707106781 * (T2Z - T34); T36 = T2U - T35; T3i = T2U + T35; T3f = KP707106781 * (T3d - T3e); T3g = T3c - T3f; T3k = T3c + T3f; { E T2P, T37, T3h, T3j; T2P = W[12]; T37 = W[13]; iio[WS(vs, 7) + WS(is, 2)] = FNMS(T37, T3g, T2P * T36); rio[WS(vs, 7) + WS(is, 2)] = FMA(T37, T36, T2P * T3g); T3h = W[4]; T3j = W[5]; iio[WS(vs, 3) + WS(is, 2)] = FNMS(T3j, T3k, T3h * T3i); rio[WS(vs, 3) + WS(is, 2)] = FMA(T3j, T3i, T3h * T3k); } } { E T5Y, T64, T62, T66, T5X, T61; T5X = KP707106781 * (T5E + T5z); T5Y = T5W - T5X; T64 = T5W + T5X; T61 = KP707106781 * (T5N + T5O); T62 = T60 - T61; T66 = T60 + T61; { E T5V, T5Z, T63, T65; T5V = W[8]; T5Z = W[9]; rio[WS(vs, 5) + WS(is, 4)] = FMA(T5V, T5Y, T5Z * T62); iio[WS(vs, 5) + WS(is, 4)] = FNMS(T5Z, T5Y, T5V * T62); T63 = W[0]; T65 = W[1]; rio[WS(vs, 1) + WS(is, 4)] = FMA(T63, T64, T65 * T66); iio[WS(vs, 1) + WS(is, 4)] = FNMS(T65, T64, T63 * T66); } } { E T7g, T7m, T7k, T7o, T7f, T7j; T7f = KP707106781 * (T6W + T6R); T7g = T7e - T7f; T7m = T7e + T7f; T7j = KP707106781 * (T75 + T76); T7k = T7i - T7j; T7o = T7i + T7j; { E T7d, T7h, T7l, T7n; T7d = W[8]; T7h = W[9]; rio[WS(vs, 5) + WS(is, 5)] = FMA(T7d, T7g, T7h * T7k); iio[WS(vs, 5) + WS(is, 5)] = FNMS(T7h, T7g, T7d * T7k); T7l = W[0]; T7n = W[1]; rio[WS(vs, 1) + WS(is, 5)] = FMA(T7l, T7m, T7n * T7o); iio[WS(vs, 1) + WS(is, 5)] = FNMS(T7n, T7m, T7l * T7o); } } { E T8g, T8s, T8q, T8u, T8f, T8p; T8f = KP707106781 * (T89 - T8e); T8g = T84 - T8f; T8s = T84 + T8f; T8p = KP707106781 * (T8n - T8o); T8q = T8m - T8p; T8u = T8m + T8p; { E T7Z, T8h, T8r, T8t; T7Z = W[12]; T8h = W[13]; iio[WS(vs, 7) + WS(is, 6)] = FNMS(T8h, T8q, T7Z * T8g); rio[WS(vs, 7) + WS(is, 6)] = FMA(T8h, T8g, T7Z * T8q); T8r = W[4]; T8t = W[5]; iio[WS(vs, 3) + WS(is, 6)] = FNMS(T8t, T8u, T8r * T8s); rio[WS(vs, 3) + WS(is, 6)] = FMA(T8t, T8s, T8r * T8u); } } { E T4G, T4M, T4K, T4O, T4F, T4J; T4F = KP707106781 * (T4m + T4h); T4G = T4E - T4F; T4M = T4E + T4F; T4J = KP707106781 * (T4v + T4w); T4K = T4I - T4J; T4O = T4I + T4J; { E T4D, T4H, T4L, T4N; T4D = W[8]; T4H = W[9]; rio[WS(vs, 5) + WS(is, 3)] = FMA(T4D, T4G, T4H * T4K); iio[WS(vs, 5) + WS(is, 3)] = FNMS(T4H, T4G, T4D * T4K); T4L = W[0]; T4N = W[1]; rio[WS(vs, 1) + WS(is, 3)] = FMA(T4L, T4M, T4N * T4O); iio[WS(vs, 1) + WS(is, 3)] = FNMS(T4N, T4M, T4L * T4O); } } { E TO, TU, TS, TW, TN, TR; TN = KP707106781 * (Tu + Tp); TO = TM - TN; TU = TM + TN; TR = KP707106781 * (TD + TE); TS = TQ - TR; TW = TQ + TR; { E TL, TP, TT, TV; TL = W[8]; TP = W[9]; rio[WS(vs, 5)] = FMA(TL, TO, TP * TS); iio[WS(vs, 5)] = FNMS(TP, TO, TL * TS); TT = W[0]; TV = W[1]; rio[WS(vs, 1)] = FMA(TT, TU, TV * TW); iio[WS(vs, 1)] = FNMS(TV, TU, TT * TW); } } { E T26, T2c, T2a, T2e, T25, T29; T25 = KP707106781 * (T1M + T1H); T26 = T24 - T25; T2c = T24 + T25; T29 = KP707106781 * (T1V + T1W); T2a = T28 - T29; T2e = T28 + T29; { E T23, T27, T2b, T2d; T23 = W[8]; T27 = W[9]; rio[WS(vs, 5) + WS(is, 1)] = FMA(T23, T26, T27 * T2a); iio[WS(vs, 5) + WS(is, 1)] = FNMS(T27, T26, T23 * T2a); T2b = W[0]; T2d = W[1]; rio[WS(vs, 1) + WS(is, 1)] = FMA(T2b, T2c, T2d * T2e); iio[WS(vs, 1) + WS(is, 1)] = FNMS(T2d, T2c, T2b * T2e); } } { E T9y, T9K, T9I, T9M, T9x, T9H; T9x = KP707106781 * (T9r - T9w); T9y = T9m - T9x; T9K = T9m + T9x; T9H = KP707106781 * (T9F - T9G); T9I = T9E - T9H; T9M = T9E + T9H; { E T9h, T9z, T9J, T9L; T9h = W[12]; T9z = W[13]; iio[WS(vs, 7) + WS(is, 7)] = FNMS(T9z, T9I, T9h * T9y); rio[WS(vs, 7) + WS(is, 7)] = FMA(T9z, T9y, T9h * T9I); T9J = W[4]; T9L = W[5]; iio[WS(vs, 3) + WS(is, 7)] = FNMS(T9L, T9M, T9J * T9K); rio[WS(vs, 3) + WS(is, 7)] = FMA(T9L, T9K, T9J * T9M); } } { E T6Y, T7a, T78, T7c, T6X, T77; T6X = KP707106781 * (T6R - T6W); T6Y = T6M - T6X; T7a = T6M + T6X; T77 = KP707106781 * (T75 - T76); T78 = T74 - T77; T7c = T74 + T77; { E T6H, T6Z, T79, T7b; T6H = W[12]; T6Z = W[13]; iio[WS(vs, 7) + WS(is, 5)] = FNMS(T6Z, T78, T6H * T6Y); rio[WS(vs, 7) + WS(is, 5)] = FMA(T6Z, T6Y, T6H * T78); T79 = W[4]; T7b = W[5]; iio[WS(vs, 3) + WS(is, 5)] = FNMS(T7b, T7c, T79 * T7a); rio[WS(vs, 3) + WS(is, 5)] = FMA(T7b, T7a, T79 * T7c); } } { E T1O, T20, T1Y, T22, T1N, T1X; T1N = KP707106781 * (T1H - T1M); T1O = T1C - T1N; T20 = T1C + T1N; T1X = KP707106781 * (T1V - T1W); T1Y = T1U - T1X; T22 = T1U + T1X; { E T1x, T1P, T1Z, T21; T1x = W[12]; T1P = W[13]; iio[WS(vs, 7) + WS(is, 1)] = FNMS(T1P, T1Y, T1x * T1O); rio[WS(vs, 7) + WS(is, 1)] = FMA(T1P, T1O, T1x * T1Y); T1Z = W[4]; T21 = W[5]; iio[WS(vs, 3) + WS(is, 1)] = FNMS(T21, T22, T1Z * T20); rio[WS(vs, 3) + WS(is, 1)] = FMA(T21, T20, T1Z * T22); } } { E T4o, T4A, T4y, T4C, T4n, T4x; T4n = KP707106781 * (T4h - T4m); T4o = T4c - T4n; T4A = T4c + T4n; T4x = KP707106781 * (T4v - T4w); T4y = T4u - T4x; T4C = T4u + T4x; { E T47, T4p, T4z, T4B; T47 = W[12]; T4p = W[13]; iio[WS(vs, 7) + WS(is, 3)] = FNMS(T4p, T4y, T47 * T4o); rio[WS(vs, 7) + WS(is, 3)] = FMA(T4p, T4o, T47 * T4y); T4z = W[4]; T4B = W[5]; iio[WS(vs, 3) + WS(is, 3)] = FNMS(T4B, T4C, T4z * T4A); rio[WS(vs, 3) + WS(is, 3)] = FMA(T4B, T4A, T4z * T4C); } } { E T3o, T3u, T3s, T3w, T3n, T3r; T3n = KP707106781 * (T34 + T2Z); T3o = T3m - T3n; T3u = T3m + T3n; T3r = KP707106781 * (T3d + T3e); T3s = T3q - T3r; T3w = T3q + T3r; { E T3l, T3p, T3t, T3v; T3l = W[8]; T3p = W[9]; rio[WS(vs, 5) + WS(is, 2)] = FMA(T3l, T3o, T3p * T3s); iio[WS(vs, 5) + WS(is, 2)] = FNMS(T3p, T3o, T3l * T3s); T3t = W[0]; T3v = W[1]; rio[WS(vs, 1) + WS(is, 2)] = FMA(T3t, T3u, T3v * T3w); iio[WS(vs, 1) + WS(is, 2)] = FNMS(T3v, T3u, T3t * T3w); } } { E T8y, T8E, T8C, T8G, T8x, T8B; T8x = KP707106781 * (T8e + T89); T8y = T8w - T8x; T8E = T8w + T8x; T8B = KP707106781 * (T8n + T8o); T8C = T8A - T8B; T8G = T8A + T8B; { E T8v, T8z, T8D, T8F; T8v = W[8]; T8z = W[9]; rio[WS(vs, 5) + WS(is, 6)] = FMA(T8v, T8y, T8z * T8C); iio[WS(vs, 5) + WS(is, 6)] = FNMS(T8z, T8y, T8v * T8C); T8D = W[0]; T8F = W[1]; rio[WS(vs, 1) + WS(is, 6)] = FMA(T8D, T8E, T8F * T8G); iio[WS(vs, 1) + WS(is, 6)] = FNMS(T8F, T8E, T8D * T8G); } } } return W;}static const tw_instr twinstr[] = { {TW_FULL, 0, 8}, {TW_NEXT, 1, 0}};static const ct_desc desc = { 8, "q1_8", twinstr, {416, 144, 112, 0}, &GENUS, 0, 0, 0 };void X(codelet_q1_8) (planner *p) { X(kdft_difsq_register) (p, q1_8, &desc);}
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -