📄 t2fv_64.c
字号:
T6o = VADD(T5O, T6n); T6B = VBYI(VADD(T6x, T6A)); ST(&(x[WS(rs, 62)]), VSUB(T6o, T6B), ms, &(x[0])); ST(&(x[WS(rs, 2)]), VADD(T6o, T6B), ms, &(x[0])); T6K = VBYI(VADD(T6F, T6E)); T6L = VADD(T6H, T6I); ST(&(x[WS(rs, 14)]), VADD(T6K, T6L), ms, &(x[0])); ST(&(x[WS(rs, 50)]), VSUB(T6L, T6K), ms, &(x[0])); } { V T6C, T6D, T6G, T6J; T6C = VSUB(T5O, T6n); T6D = VBYI(VSUB(T6A, T6x)); ST(&(x[WS(rs, 34)]), VSUB(T6C, T6D), ms, &(x[0])); ST(&(x[WS(rs, 30)]), VADD(T6C, T6D), ms, &(x[0])); T6G = VBYI(VSUB(T6E, T6F)); T6J = VSUB(T6H, T6I); ST(&(x[WS(rs, 18)]), VADD(T6G, T6J), ms, &(x[0])); ST(&(x[WS(rs, 46)]), VSUB(T6J, T6G), ms, &(x[0])); } } { V T6O, T79, T6Z, T77, T6V, T7a, T72, T76; { V T6M, T6N, T6X, T6Y; T6M = VSUB(T5q, T5x); T6N = VSUB(T6v, T6u); T6O = VADD(T6M, T6N); T79 = VSUB(T6M, T6N); T6X = VSUB(T6s, T6r); T6Y = VSUB(T5M, T5F); T6Z = VADD(T6X, T6Y); T77 = VSUB(T6Y, T6X); { V T6R, T70, T6U, T71; { V T6P, T6Q, T6S, T6T; T6P = VSUB(T5R, T5Y); T6Q = VSUB(T63, T62); T6R = VFMA(LDK(KP831469612), T6P, VMUL(LDK(KP555570233), T6Q)); T70 = VFNMS(LDK(KP555570233), T6P, VMUL(LDK(KP831469612), T6Q)); T6S = VSUB(T68, T6f); T6T = VSUB(T6k, T6j); T6U = VFNMS(LDK(KP555570233), T6T, VMUL(LDK(KP831469612), T6S)); T71 = VFMA(LDK(KP555570233), T6S, VMUL(LDK(KP831469612), T6T)); } T6V = VADD(T6R, T6U); T7a = VSUB(T71, T70); T72 = VADD(T70, T71); T76 = VSUB(T6U, T6R); } } { V T6W, T73, T7c, T7d; T6W = VADD(T6O, T6V); T73 = VBYI(VADD(T6Z, T72)); ST(&(x[WS(rs, 58)]), VSUB(T6W, T73), ms, &(x[0])); ST(&(x[WS(rs, 6)]), VADD(T6W, T73), ms, &(x[0])); T7c = VBYI(VADD(T77, T76)); T7d = VADD(T79, T7a); ST(&(x[WS(rs, 10)]), VADD(T7c, T7d), ms, &(x[0])); ST(&(x[WS(rs, 54)]), VSUB(T7d, T7c), ms, &(x[0])); } { V T74, T75, T78, T7b; T74 = VSUB(T6O, T6V); T75 = VBYI(VSUB(T72, T6Z)); ST(&(x[WS(rs, 38)]), VSUB(T74, T75), ms, &(x[0])); ST(&(x[WS(rs, 26)]), VADD(T74, T75), ms, &(x[0])); T78 = VBYI(VSUB(T76, T77)); T7b = VSUB(T79, T7a); ST(&(x[WS(rs, 22)]), VADD(T78, T7b), ms, &(x[0])); ST(&(x[WS(rs, 42)]), 
VSUB(T7b, T78), ms, &(x[0])); } } { V T4k, T5h, T4R, T59, T4H, T5j, T4P, T4Y, T4z, T4S, T4K, T4O, T55, T5k, T5c; V T5g; { V T4c, T57, T4j, T58, T4f, T4i; T4c = VADD(T4a, T4b); T57 = VSUB(T4C, T4B); T4f = VFMA(LDK(KP831469612), T4d, VMUL(LDK(KP555570233), T4e)); T4i = VFNMS(LDK(KP555570233), T4h, VMUL(LDK(KP831469612), T4g)); T4j = VADD(T4f, T4i); T58 = VSUB(T4i, T4f); T4k = VADD(T4c, T4j); T5h = VSUB(T58, T57); T4R = VSUB(T4c, T4j); T59 = VADD(T57, T58); } { V T4D, T4W, T4G, T4X, T4E, T4F; T4D = VADD(T4B, T4C); T4W = VSUB(T4a, T4b); T4E = VFNMS(LDK(KP555570233), T4d, VMUL(LDK(KP831469612), T4e)); T4F = VFMA(LDK(KP555570233), T4g, VMUL(LDK(KP831469612), T4h)); T4G = VADD(T4E, T4F); T4X = VSUB(T4F, T4E); T4H = VADD(T4D, T4G); T5j = VSUB(T4W, T4X); T4P = VSUB(T4G, T4D); T4Y = VADD(T4W, T4X); } { V T4r, T4I, T4y, T4J; { V T4n, T4q, T4u, T4x; T4n = VADD(T4l, T4m); T4q = VADD(T4o, T4p); T4r = VFMA(LDK(KP956940335), T4n, VMUL(LDK(KP290284677), T4q)); T4I = VFNMS(LDK(KP290284677), T4n, VMUL(LDK(KP956940335), T4q)); T4u = VADD(T4s, T4t); T4x = VADD(T4v, T4w); T4y = VFNMS(LDK(KP290284677), T4x, VMUL(LDK(KP956940335), T4u)); T4J = VFMA(LDK(KP290284677), T4u, VMUL(LDK(KP956940335), T4x)); } T4z = VADD(T4r, T4y); T4S = VSUB(T4J, T4I); T4K = VADD(T4I, T4J); T4O = VSUB(T4y, T4r); } { V T51, T5a, T54, T5b; { V T4Z, T50, T52, T53; T4Z = VSUB(T4l, T4m); T50 = VSUB(T4p, T4o); T51 = VFMA(LDK(KP881921264), T4Z, VMUL(LDK(KP471396736), T50)); T5a = VFNMS(LDK(KP471396736), T4Z, VMUL(LDK(KP881921264), T50)); T52 = VSUB(T4s, T4t); T53 = VSUB(T4w, T4v); T54 = VFNMS(LDK(KP471396736), T53, VMUL(LDK(KP881921264), T52)); T5b = VFMA(LDK(KP471396736), T52, VMUL(LDK(KP881921264), T53)); } T55 = VADD(T51, T54); T5k = VSUB(T5b, T5a); T5c = VADD(T5a, T5b); T5g = VSUB(T54, T51); } { V T4A, T4L, T5i, T5l; T4A = VADD(T4k, T4z); T4L = VBYI(VADD(T4H, T4K)); ST(&(x[WS(rs, 61)]), VSUB(T4A, T4L), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 3)]), VADD(T4A, T4L), ms, &(x[WS(rs, 1)])); T5i = VBYI(VSUB(T5g, T5h)); T5l = 
VSUB(T5j, T5k); ST(&(x[WS(rs, 21)]), VADD(T5i, T5l), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 43)]), VSUB(T5l, T5i), ms, &(x[WS(rs, 1)])); } { V T5m, T5n, T4M, T4N; T5m = VBYI(VADD(T5h, T5g)); T5n = VADD(T5j, T5k); ST(&(x[WS(rs, 11)]), VADD(T5m, T5n), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 53)]), VSUB(T5n, T5m), ms, &(x[WS(rs, 1)])); T4M = VSUB(T4k, T4z); T4N = VBYI(VSUB(T4K, T4H)); ST(&(x[WS(rs, 35)]), VSUB(T4M, T4N), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 29)]), VADD(T4M, T4N), ms, &(x[WS(rs, 1)])); } { V T4Q, T4T, T56, T5d; T4Q = VBYI(VSUB(T4O, T4P)); T4T = VSUB(T4R, T4S); ST(&(x[WS(rs, 19)]), VADD(T4Q, T4T), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 45)]), VSUB(T4T, T4Q), ms, &(x[WS(rs, 1)])); T56 = VADD(T4Y, T55); T5d = VBYI(VADD(T59, T5c)); ST(&(x[WS(rs, 59)]), VSUB(T56, T5d), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 5)]), VADD(T56, T5d), ms, &(x[WS(rs, 1)])); } { V T5e, T5f, T4U, T4V; T5e = VSUB(T4Y, T55); T5f = VBYI(VSUB(T5c, T59)); ST(&(x[WS(rs, 37)]), VSUB(T5e, T5f), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 27)]), VADD(T5e, T5f), ms, &(x[WS(rs, 1)])); T4U = VBYI(VADD(T4P, T4O)); T4V = VADD(T4R, T4S); ST(&(x[WS(rs, 13)]), VADD(T4U, T4V), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 51)]), VSUB(T4V, T4U), ms, &(x[WS(rs, 1)])); } } { V T1u, T43, T3D, T3V, T3t, T45, T3B, T3K, T3d, T3E, T3w, T3A, T3R, T46, T3Y; V T42; { V TE, T3T, T1t, T3U, T13, T1s; TE = VSUB(Tg, TD); T3T = VADD(T3o, T3h); T13 = VFMA(LDK(KP195090322), TV, VMUL(LDK(KP980785280), T12)); T1s = VFNMS(LDK(KP195090322), T1r, VMUL(LDK(KP980785280), T1k)); T1t = VSUB(T13, T1s); T3U = VADD(T1s, T13); T1u = VADD(TE, T1t); T43 = VSUB(T3U, T3T); T3D = VSUB(TE, T1t); T3V = VADD(T3T, T3U); } { V T3p, T3I, T3s, T3J, T3q, T3r; T3p = VSUB(T3h, T3o); T3I = VADD(Tg, TD); T3q = VFNMS(LDK(KP195090322), T12, VMUL(LDK(KP980785280), TV)); T3r = VFMA(LDK(KP980785280), T1r, VMUL(LDK(KP195090322), T1k)); T3s = VSUB(T3q, T3r); T3J = VADD(T3r, T3q); T3t = VADD(T3p, T3s); T45 = VSUB(T3I, T3J); T3B = VSUB(T3s, T3p); T3K = VADD(T3I, T3J); } { V T2l, T3u, T3c, 
T3v; { V T29, T2k, T30, T3b; T29 = VSUB(T1R, T28); T2k = VSUB(T2g, T2j); T2l = VFMA(LDK(KP634393284), T29, VMUL(LDK(KP773010453), T2k)); T3u = VFNMS(LDK(KP634393284), T2k, VMUL(LDK(KP773010453), T29)); T30 = VSUB(T2C, T2Z); T3b = VSUB(T33, T3a); T3c = VFNMS(LDK(KP634393284), T3b, VMUL(LDK(KP773010453), T30)); T3v = VFMA(LDK(KP773010453), T3b, VMUL(LDK(KP634393284), T30)); } T3d = VADD(T2l, T3c); T3E = VSUB(T3v, T3u); T3w = VADD(T3u, T3v); T3A = VSUB(T3c, T2l); } { V T3N, T3W, T3Q, T3X; { V T3L, T3M, T3O, T3P; T3L = VADD(T28, T1R); T3M = VADD(T2g, T2j); T3N = VFMA(LDK(KP098017140), T3L, VMUL(LDK(KP995184726), T3M)); T3W = VFNMS(LDK(KP098017140), T3M, VMUL(LDK(KP995184726), T3L)); T3O = VADD(T2C, T2Z); T3P = VADD(T3a, T33); T3Q = VFNMS(LDK(KP098017140), T3P, VMUL(LDK(KP995184726), T3O)); T3X = VFMA(LDK(KP995184726), T3P, VMUL(LDK(KP098017140), T3O)); } T3R = VADD(T3N, T3Q); T46 = VSUB(T3X, T3W); T3Y = VADD(T3W, T3X); T42 = VSUB(T3Q, T3N); } { V T3e, T3x, T44, T47; T3e = VADD(T1u, T3d); T3x = VBYI(VADD(T3t, T3w)); ST(&(x[WS(rs, 57)]), VSUB(T3e, T3x), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 7)]), VADD(T3e, T3x), ms, &(x[WS(rs, 1)])); T44 = VBYI(VSUB(T42, T43)); T47 = VSUB(T45, T46); ST(&(x[WS(rs, 17)]), VADD(T44, T47), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 47)]), VSUB(T47, T44), ms, &(x[WS(rs, 1)])); } { V T48, T49, T3y, T3z; T48 = VBYI(VADD(T43, T42)); T49 = VADD(T45, T46); ST(&(x[WS(rs, 15)]), VADD(T48, T49), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 49)]), VSUB(T49, T48), ms, &(x[WS(rs, 1)])); T3y = VSUB(T1u, T3d); T3z = VBYI(VSUB(T3w, T3t)); ST(&(x[WS(rs, 39)]), VSUB(T3y, T3z), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 25)]), VADD(T3y, T3z), ms, &(x[WS(rs, 1)])); } { V T3C, T3F, T3S, T3Z; T3C = VBYI(VSUB(T3A, T3B)); T3F = VSUB(T3D, T3E); ST(&(x[WS(rs, 23)]), VADD(T3C, T3F), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 41)]), VSUB(T3F, T3C), ms, &(x[WS(rs, 1)])); T3S = VADD(T3K, T3R); T3Z = VBYI(VADD(T3V, T3Y)); ST(&(x[WS(rs, 63)]), VSUB(T3S, T3Z), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 1)]), 
VADD(T3S, T3Z), ms, &(x[WS(rs, 1)])); } { V T40, T41, T3G, T3H; T40 = VSUB(T3K, T3R); T41 = VBYI(VSUB(T3Y, T3V)); ST(&(x[WS(rs, 33)]), VSUB(T40, T41), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 31)]), VADD(T40, T41), ms, &(x[WS(rs, 1)])); T3G = VBYI(VADD(T3B, T3A)); T3H = VADD(T3D, T3E); ST(&(x[WS(rs, 9)]), VADD(T3G, T3H), ms, &(x[WS(rs, 1)])); ST(&(x[WS(rs, 55)]), VSUB(T3H, T3G), ms, &(x[WS(rs, 1)])); } } }}
/*
 * Twiddle instruction table referenced by `desc` below.
 * It lists VTW(0, k) for k = 1..63 in ascending order and is closed by a
 * single {TW_NEXT, VL, 0} entry.
 * NOTE(review): VTW, TW_NEXT and VL are defined outside this chunk; confirm
 * their exact meaning against those definitions.
 */
static const tw_instr twinstr[] = { VTW(0, 1), VTW(0, 2), VTW(0, 3), VTW(0, 4), VTW(0, 5), VTW(0, 6), VTW(0, 7), VTW(0, 8), VTW(0, 9), VTW(0, 10), VTW(0, 11), VTW(0, 12), VTW(0, 13), VTW(0, 14), VTW(0, 15), VTW(0, 16), VTW(0, 17), VTW(0, 18), VTW(0, 19), VTW(0, 20), VTW(0, 21), VTW(0, 22), VTW(0, 23), VTW(0, 24), VTW(0, 25), VTW(0, 26), VTW(0, 27), VTW(0, 28), VTW(0, 29), VTW(0, 30), VTW(0, 31), VTW(0, 32), VTW(0, 33), VTW(0, 34), VTW(0, 35), VTW(0, 36), VTW(0, 37), VTW(0, 38), VTW(0, 39), VTW(0, 40), VTW(0, 41), VTW(0, 42), VTW(0, 43), VTW(0, 44), VTW(0, 45), VTW(0, 46), VTW(0, 47), VTW(0, 48), VTW(0, 49), VTW(0, 50), VTW(0, 51), VTW(0, 52), VTW(0, 53), VTW(0, 54), VTW(0, 55), VTW(0, 56), VTW(0, 57), VTW(0, 58), VTW(0, 59), VTW(0, 60), VTW(0, 61), VTW(0, 62), VTW(0, 63), {TW_NEXT, VL, 0}};
/*
 * Codelet descriptor passed to the registration call below.
 * Its initializer holds, in order: the integer 64, the name string
 * "t2fv_64", the twinstr table, &GENUS, the integer group {467, 198, 52, 0},
 * and three trailing zeros.
 * NOTE(review): presumably 64 is the transform radix and the integer group
 * is a set of operation counts -- confirm against the ct_desc declaration,
 * which is not visible in this chunk.
 */
static const ct_desc desc = { 64, "t2fv_64", twinstr, &GENUS, {467, 198, 52, 0}, 0, 0, 0 };
/*
 * Registration entry point for this codelet: hands the planner `p`, the
 * t2fv_64 function and its descriptor `desc` to X(kdft_dit_register).
 */
void X(codelet_t2fv_64) (planner *p) { X(kdft_dit_register) (p, t2fv_64, &desc);}
#endif /* HAVE_FMA */
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -