📄 t1sv_32.c
字号:
T71 = VADD(T6Y, T6Z); } ST(&(ri[WS(rs, 16)]), VSUB(T1t, T30), ms, &(ri[0])); ST(&(ii[WS(rs, 16)]), VSUB(T7a, T71), ms, &(ii[0])); ST(&(ri[0]), VADD(T1t, T30), ms, &(ri[0])); ST(&(ii[0]), VADD(T71, T7a), ms, &(ii[0])); ST(&(ri[WS(rs, 24)]), VSUB(T6X, T70), ms, &(ri[0])); ST(&(ii[WS(rs, 24)]), VSUB(T7c, T7b), ms, &(ii[0])); ST(&(ri[WS(rs, 8)]), VADD(T6X, T70), ms, &(ri[0])); ST(&(ii[WS(rs, 8)]), VADD(T7b, T7c), ms, &(ii[0])); } { V T6H, T6T, T7g, T7i, T6M, T6U, T6R, T6V; { V T6D, T6G, T7e, T7f; T6D = VSUB(Tj, TG); T6G = VSUB(T6E, T6F); T6H = VADD(T6D, T6G); T6T = VSUB(T6D, T6G); T7e = VSUB(T1r, T14); T7f = VSUB(T78, T73); T7g = VADD(T7e, T7f); T7i = VSUB(T7f, T7e); } { V T6I, T6L, T6N, T6Q; T6I = VSUB(T1Q, T2d); T6L = VSUB(T6J, T6K); T6M = VADD(T6I, T6L); T6U = VSUB(T6L, T6I); T6N = VSUB(T2B, T2Y); T6Q = VSUB(T6O, T6P); T6R = VSUB(T6N, T6Q); T6V = VADD(T6N, T6Q); } { V T6S, T7d, T6W, T7h; T6S = VMUL(LDK(KP707106781), VADD(T6M, T6R)); ST(&(ri[WS(rs, 20)]), VSUB(T6H, T6S), ms, &(ri[0])); ST(&(ri[WS(rs, 4)]), VADD(T6H, T6S), ms, &(ri[0])); T7d = VMUL(LDK(KP707106781), VADD(T6U, T6V)); ST(&(ii[WS(rs, 4)]), VADD(T7d, T7g), ms, &(ii[0])); ST(&(ii[WS(rs, 20)]), VSUB(T7g, T7d), ms, &(ii[0])); T6W = VMUL(LDK(KP707106781), VSUB(T6U, T6V)); ST(&(ri[WS(rs, 28)]), VSUB(T6T, T6W), ms, &(ri[0])); ST(&(ri[WS(rs, 12)]), VADD(T6T, T6W), ms, &(ri[0])); T7h = VMUL(LDK(KP707106781), VSUB(T6R, T6M)); ST(&(ii[WS(rs, 12)]), VADD(T7h, T7i), ms, &(ii[0])); ST(&(ii[WS(rs, 28)]), VSUB(T7i, T7h), ms, &(ii[0])); } } { V T5J, T7n, T7t, T6n, T5U, T7k, T6x, T6B, T6q, T7s, T66, T6k, T6u, T6A, T6h; V T6l; { V T5O, T5T, T60, T65; T5J = VSUB(T5F, T5I); T7n = VADD(T7l, T7m); T7t = VSUB(T7m, T7l); T6n = VADD(T5F, T5I); T5O = VSUB(T5M, T5N); T5T = VADD(T5P, T5S); T5U = VMUL(LDK(KP707106781), VSUB(T5O, T5T)); T7k = VMUL(LDK(KP707106781), VADD(T5O, T5T)); { V T6v, T6w, T6o, T6p; T6v = VADD(T67, T6a); T6w = VADD(T6e, T6f); T6x = VFNMS(LDK(KP382683432), T6w, VMUL(LDK(KP923879532), T6v)); T6B = 
VFMA(LDK(KP923879532), T6w, VMUL(LDK(KP382683432), T6v)); T6o = VADD(T5N, T5M); T6p = VSUB(T5P, T5S); T6q = VMUL(LDK(KP707106781), VADD(T6o, T6p)); T7s = VMUL(LDK(KP707106781), VSUB(T6p, T6o)); } T60 = VSUB(T5Y, T5Z); T65 = VSUB(T61, T64); T66 = VFMA(LDK(KP923879532), T60, VMUL(LDK(KP382683432), T65)); T6k = VFNMS(LDK(KP923879532), T65, VMUL(LDK(KP382683432), T60)); { V T6s, T6t, T6b, T6g; T6s = VADD(T5Y, T5Z); T6t = VADD(T61, T64); T6u = VFMA(LDK(KP382683432), T6s, VMUL(LDK(KP923879532), T6t)); T6A = VFNMS(LDK(KP382683432), T6t, VMUL(LDK(KP923879532), T6s)); T6b = VSUB(T67, T6a); T6g = VSUB(T6e, T6f); T6h = VFNMS(LDK(KP923879532), T6g, VMUL(LDK(KP382683432), T6b)); T6l = VFMA(LDK(KP382683432), T6g, VMUL(LDK(KP923879532), T6b)); } } { V T5V, T6i, T7r, T7u; T5V = VADD(T5J, T5U); T6i = VADD(T66, T6h); ST(&(ri[WS(rs, 22)]), VSUB(T5V, T6i), ms, &(ri[0])); ST(&(ri[WS(rs, 6)]), VADD(T5V, T6i), ms, &(ri[0])); T7r = VADD(T6k, T6l); T7u = VADD(T7s, T7t); ST(&(ii[WS(rs, 6)]), VADD(T7r, T7u), ms, &(ii[0])); ST(&(ii[WS(rs, 22)]), VSUB(T7u, T7r), ms, &(ii[0])); } { V T6j, T6m, T7v, T7w; T6j = VSUB(T5J, T5U); T6m = VSUB(T6k, T6l); ST(&(ri[WS(rs, 30)]), VSUB(T6j, T6m), ms, &(ri[0])); ST(&(ri[WS(rs, 14)]), VADD(T6j, T6m), ms, &(ri[0])); T7v = VSUB(T6h, T66); T7w = VSUB(T7t, T7s); ST(&(ii[WS(rs, 14)]), VADD(T7v, T7w), ms, &(ii[0])); ST(&(ii[WS(rs, 30)]), VSUB(T7w, T7v), ms, &(ii[0])); } { V T6r, T6y, T7j, T7o; T6r = VADD(T6n, T6q); T6y = VADD(T6u, T6x); ST(&(ri[WS(rs, 18)]), VSUB(T6r, T6y), ms, &(ri[0])); ST(&(ri[WS(rs, 2)]), VADD(T6r, T6y), ms, &(ri[0])); T7j = VADD(T6A, T6B); T7o = VADD(T7k, T7n); ST(&(ii[WS(rs, 2)]), VADD(T7j, T7o), ms, &(ii[0])); ST(&(ii[WS(rs, 18)]), VSUB(T7o, T7j), ms, &(ii[0])); } { V T6z, T6C, T7p, T7q; T6z = VSUB(T6n, T6q); T6C = VSUB(T6A, T6B); ST(&(ri[WS(rs, 26)]), VSUB(T6z, T6C), ms, &(ri[0])); ST(&(ri[WS(rs, 10)]), VADD(T6z, T6C), ms, &(ri[0])); T7p = VSUB(T6x, T6u); T7q = VSUB(T7n, T7k); ST(&(ii[WS(rs, 10)]), VADD(T7p, T7q), ms, &(ii[0])); 
ST(&(ii[WS(rs, 26)]), VSUB(T7q, T7p), ms, &(ii[0])); } } { V T3h, T4D, T7R, T7X, T3E, T7O, T4N, T4R, T46, T4A, T4G, T7W, T4K, T4Q, T4x; V T4B, T3g, T7P; T3g = VMUL(LDK(KP707106781), VSUB(T3a, T3f)); T3h = VSUB(T35, T3g); T4D = VADD(T35, T3g); T7P = VMUL(LDK(KP707106781), VSUB(T4V, T4U)); T7R = VADD(T7P, T7Q); T7X = VSUB(T7Q, T7P); { V T3s, T3D, T4L, T4M; T3s = VFNMS(LDK(KP923879532), T3r, VMUL(LDK(KP382683432), T3m)); T3D = VFMA(LDK(KP382683432), T3x, VMUL(LDK(KP923879532), T3C)); T3E = VSUB(T3s, T3D); T7O = VADD(T3s, T3D); T4L = VADD(T4b, T4m); T4M = VADD(T4s, T4v); T4N = VFNMS(LDK(KP555570233), T4M, VMUL(LDK(KP831469612), T4L)); T4R = VFMA(LDK(KP831469612), T4M, VMUL(LDK(KP555570233), T4L)); } { V T3W, T45, T4E, T4F; T3W = VSUB(T3K, T3V); T45 = VSUB(T41, T44); T46 = VFMA(LDK(KP980785280), T3W, VMUL(LDK(KP195090322), T45)); T4A = VFNMS(LDK(KP980785280), T45, VMUL(LDK(KP195090322), T3W)); T4E = VFMA(LDK(KP923879532), T3m, VMUL(LDK(KP382683432), T3r)); T4F = VFNMS(LDK(KP923879532), T3x, VMUL(LDK(KP382683432), T3C)); T4G = VADD(T4E, T4F); T7W = VSUB(T4F, T4E); } { V T4I, T4J, T4n, T4w; T4I = VADD(T3K, T3V); T4J = VADD(T41, T44); T4K = VFMA(LDK(KP555570233), T4I, VMUL(LDK(KP831469612), T4J)); T4Q = VFNMS(LDK(KP555570233), T4J, VMUL(LDK(KP831469612), T4I)); T4n = VSUB(T4b, T4m); T4w = VSUB(T4s, T4v); T4x = VFNMS(LDK(KP980785280), T4w, VMUL(LDK(KP195090322), T4n)); T4B = VFMA(LDK(KP195090322), T4w, VMUL(LDK(KP980785280), T4n)); } { V T3F, T4y, T7V, T7Y; T3F = VADD(T3h, T3E); T4y = VADD(T46, T4x); ST(&(ri[WS(rs, 23)]), VSUB(T3F, T4y), ms, &(ri[WS(rs, 1)])); ST(&(ri[WS(rs, 7)]), VADD(T3F, T4y), ms, &(ri[WS(rs, 1)])); T7V = VADD(T4A, T4B); T7Y = VADD(T7W, T7X); ST(&(ii[WS(rs, 7)]), VADD(T7V, T7Y), ms, &(ii[WS(rs, 1)])); ST(&(ii[WS(rs, 23)]), VSUB(T7Y, T7V), ms, &(ii[WS(rs, 1)])); } { V T4z, T4C, T7Z, T80; T4z = VSUB(T3h, T3E); T4C = VSUB(T4A, T4B); ST(&(ri[WS(rs, 31)]), VSUB(T4z, T4C), ms, &(ri[WS(rs, 1)])); ST(&(ri[WS(rs, 15)]), VADD(T4z, T4C), ms, &(ri[WS(rs, 1)])); T7Z 
= VSUB(T4x, T46); T80 = VSUB(T7X, T7W); ST(&(ii[WS(rs, 15)]), VADD(T7Z, T80), ms, &(ii[WS(rs, 1)])); ST(&(ii[WS(rs, 31)]), VSUB(T80, T7Z), ms, &(ii[WS(rs, 1)])); } { V T4H, T4O, T7N, T7S; T4H = VADD(T4D, T4G); T4O = VADD(T4K, T4N); ST(&(ri[WS(rs, 19)]), VSUB(T4H, T4O), ms, &(ri[WS(rs, 1)])); ST(&(ri[WS(rs, 3)]), VADD(T4H, T4O), ms, &(ri[WS(rs, 1)])); T7N = VADD(T4Q, T4R); T7S = VADD(T7O, T7R); ST(&(ii[WS(rs, 3)]), VADD(T7N, T7S), ms, &(ii[WS(rs, 1)])); ST(&(ii[WS(rs, 19)]), VSUB(T7S, T7N), ms, &(ii[WS(rs, 1)])); } { V T4P, T4S, T7T, T7U; T4P = VSUB(T4D, T4G); T4S = VSUB(T4Q, T4R); ST(&(ri[WS(rs, 27)]), VSUB(T4P, T4S), ms, &(ri[WS(rs, 1)])); ST(&(ri[WS(rs, 11)]), VADD(T4P, T4S), ms, &(ri[WS(rs, 1)])); T7T = VSUB(T4N, T4K); T7U = VSUB(T7R, T7O); ST(&(ii[WS(rs, 11)]), VADD(T7T, T7U), ms, &(ii[WS(rs, 1)])); ST(&(ii[WS(rs, 27)]), VSUB(T7U, T7T), ms, &(ii[WS(rs, 1)])); } } { V T4X, T5p, T7D, T7J, T54, T7y, T5z, T5D, T5c, T5m, T5s, T7I, T5w, T5C, T5j; V T5n, T4W, T7z; T4W = VMUL(LDK(KP707106781), VADD(T4U, T4V)); T4X = VSUB(T4T, T4W); T5p = VADD(T4T, T4W); T7z = VMUL(LDK(KP707106781), VADD(T3a, T3f)); T7D = VADD(T7z, T7C); T7J = VSUB(T7C, T7z); { V T50, T53, T5x, T5y; T50 = VFNMS(LDK(KP382683432), T4Z, VMUL(LDK(KP923879532), T4Y)); T53 = VFMA(LDK(KP923879532), T51, VMUL(LDK(KP382683432), T52)); T54 = VSUB(T50, T53); T7y = VADD(T50, T53); T5x = VADD(T5d, T5e); T5y = VADD(T5g, T5h); T5z = VFNMS(LDK(KP195090322), T5y, VMUL(LDK(KP980785280), T5x)); T5D = VFMA(LDK(KP195090322), T5x, VMUL(LDK(KP980785280), T5y)); } { V T58, T5b, T5q, T5r; T58 = VSUB(T56, T57); T5b = VSUB(T59, T5a); T5c = VFMA(LDK(KP555570233), T58, VMUL(LDK(KP831469612), T5b)); T5m = VFNMS(LDK(KP831469612), T58, VMUL(LDK(KP555570233), T5b)); T5q = VFMA(LDK(KP382683432), T4Y, VMUL(LDK(KP923879532), T4Z)); T5r = VFNMS(LDK(KP382683432), T51, VMUL(LDK(KP923879532), T52)); T5s = VADD(T5q, T5r); T7I = VSUB(T5r, T5q); } { V T5u, T5v, T5f, T5i; T5u = VADD(T56, T57); T5v = VADD(T59, T5a); T5w = VFMA(LDK(KP980785280), 
T5u, VMUL(LDK(KP195090322), T5v)); T5C = VFNMS(LDK(KP195090322), T5u, VMUL(LDK(KP980785280), T5v)); T5f = VSUB(T5d, T5e); T5i = VSUB(T5g, T5h); T5j = VFNMS(LDK(KP831469612), T5i, VMUL(LDK(KP555570233), T5f)); T5n = VFMA(LDK(KP831469612), T5f, VMUL(LDK(KP555570233), T5i)); } { V T55, T5k, T7H, T7K; T55 = VADD(T4X, T54); T5k = VADD(T5c, T5j); ST(&(ri[WS(rs, 21)]), VSUB(T55, T5k), ms, &(ri[WS(rs, 1)])); ST(&(ri[WS(rs, 5)]), VADD(T55, T5k), ms, &(ri[WS(rs, 1)])); T7H = VADD(T5m, T5n); T7K = VADD(T7I, T7J); ST(&(ii[WS(rs, 5)]), VADD(T7H, T7K), ms, &(ii[WS(rs, 1)])); ST(&(ii[WS(rs, 21)]), VSUB(T7K, T7H), ms, &(ii[WS(rs, 1)])); } { V T5l, T5o, T7L, T7M; T5l = VSUB(T4X, T54); T5o = VSUB(T5m, T5n); ST(&(ri[WS(rs, 29)]), VSUB(T5l, T5o), ms, &(ri[WS(rs, 1)])); ST(&(ri[WS(rs, 13)]), VADD(T5l, T5o), ms, &(ri[WS(rs, 1)])); T7L = VSUB(T5j, T5c); T7M = VSUB(T7J, T7I); ST(&(ii[WS(rs, 13)]), VADD(T7L, T7M), ms, &(ii[WS(rs, 1)])); ST(&(ii[WS(rs, 29)]), VSUB(T7M, T7L), ms, &(ii[WS(rs, 1)])); } { V T5t, T5A, T7x, T7E; T5t = VADD(T5p, T5s); T5A = VADD(T5w, T5z); ST(&(ri[WS(rs, 17)]), VSUB(T5t, T5A), ms, &(ri[WS(rs, 1)])); ST(&(ri[WS(rs, 1)]), VADD(T5t, T5A), ms, &(ri[WS(rs, 1)])); T7x = VADD(T5C, T5D); T7E = VADD(T7y, T7D); ST(&(ii[WS(rs, 1)]), VADD(T7x, T7E), ms, &(ii[WS(rs, 1)])); ST(&(ii[WS(rs, 17)]), VSUB(T7E, T7x), ms, &(ii[WS(rs, 1)])); } { V T5B, T5E, T7F, T7G; T5B = VSUB(T5p, T5s); T5E = VSUB(T5C, T5D); ST(&(ri[WS(rs, 25)]), VSUB(T5B, T5E), ms, &(ri[WS(rs, 1)])); ST(&(ri[WS(rs, 9)]), VADD(T5B, T5E), ms, &(ri[WS(rs, 1)])); T7F = VSUB(T5z, T5w); T7G = VSUB(T7D, T7y); ST(&(ii[WS(rs, 9)]), VADD(T7F, T7G), ms, &(ii[WS(rs, 1)])); ST(&(ii[WS(rs, 25)]), VSUB(T7G, T7F), ms, &(ii[WS(rs, 1)])); } } }}static const tw_instr twinstr[] = { VTW(0, 1), VTW(0, 2), VTW(0, 3), VTW(0, 4), VTW(0, 5), VTW(0, 6), VTW(0, 7), VTW(0, 8), VTW(0, 9), VTW(0, 10), VTW(0, 11), VTW(0, 12), VTW(0, 13), VTW(0, 14), VTW(0, 15), VTW(0, 16), VTW(0, 17), VTW(0, 18), VTW(0, 19), VTW(0, 20), VTW(0, 21), VTW(0, 22), 
/*
 * NOTE(review): in this copy the line below starts in the middle of the
 * `twinstr` initializer that was opened on the previous line; the original
 * line breaks appear to have been lost. The line contains, in order:
 *
 * 1. The rest of `twinstr`: entries VTW(0, 23) through VTW(0, 31), followed
 *    by a final {TW_NEXT, (2 * VL), 0} entry. Presumably this is the
 *    twiddle-factor instruction table for the kernel and TW_NEXT marks its
 *    end -- confirm against the definition of tw_instr.
 *
 * 2. `desc`, a file-local constant ct_desc initialized positionally with:
 *    32, the name string "t1sv_32", the `twinstr` table, the address of
 *    GENUS, the tuple {340, 114, 94, 0}, and three trailing zeros.
 *    Presumably 32 is the transform radix and the tuple holds operation
 *    counts -- field meanings are not visible here; verify against the
 *    ct_desc declaration before editing any value.
 *
 * 3. X(codelet_t1sv_32)(planner *p): the registration entry point. It makes
 *    a single call, X(kdft_dit_register)(p, t1sv_32, &desc), handing the
 *    planner `p`, the `t1sv_32` kernel and the descriptor above to the
 *    registration routine. It returns nothing.
 *
 * 4. `#endif` for HAVE_FMA; the matching conditional is outside this view.
 *    NOTE(review): a preprocessor directive must begin its own line, so the
 *    `#endif` sharing a line with code is another sign of collapsed line
 *    breaks -- restore from the upstream file rather than editing by hand.
 */
VTW(0, 23), VTW(0, 24), VTW(0, 25), VTW(0, 26), VTW(0, 27), VTW(0, 28), VTW(0, 29), VTW(0, 30), VTW(0, 31), {TW_NEXT, (2 * VL), 0}};static const ct_desc desc = { 32, "t1sv_32", twinstr, &GENUS, {340, 114, 94, 0}, 0, 0, 0 };void X(codelet_t1sv_32) (planner *p) { X(kdft_dit_register) (p, t1sv_32, &desc);}#endif /* HAVE_FMA */
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -