⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 n1_20.c

📁 快速fft变换
💻 C
📖 第 1 页 / 共 2 页
字号:
/* * Copyright (c) 2003, 2007-8 Matteo Frigo * Copyright (c) 2003, 2007-8 Massachusetts Institute of Technology * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA * *//* This file was automatically generated --- DO NOT EDIT *//* Generated on Sat Nov 15 20:37:12 EST 2008 */#include "codelet-dft.h"#ifdef HAVE_FMA/* Generated by: ../../../genfft/gen_notw -fma -reorder-insns -schedule-for-pipeline -compact -variables 4 -pipeline-latency 4 -n 20 -name n1_20 -include n.h *//* * This function contains 208 FP additions, 72 FP multiplications, * (or, 136 additions, 0 multiplications, 72 fused multiply/add), * 86 stack variables, 4 constants, and 80 memory accesses */#include "n.h"static void n1_20(const R *ri, const R *ii, R *ro, R *io, stride is, stride os, INT v, INT ivs, INT ovs){     DK(KP951056516, +0.951056516295153572116439333379382143405698634);     DK(KP559016994, +0.559016994374947424102293417182819058860154590);     DK(KP618033988, +0.618033988749894848204586834365638117720309180);     DK(KP250000000, +0.250000000000000000000000000000000000000000000);     INT i;     for (i = v; i > 0; i = i - 1, ri = ri + ivs, ii = ii + ivs, ro = ro + ovs, io = io + ovs, MAKE_VOLATILE_STRIDE(is), MAKE_VOLATILE_STRIDE(os)) {	  E T1Y, T1Z, T1W, T1V;	  {	       E T1d, TP, TD, T7, T3b, T2N, T2f, T1R, T2U, TB, T2P, T2A, T3d, T37, T3j;	       E TJ, T2n, T1b, T1T, T1y, T2b, T2h, T1j, T2V, Tm, T2O, T2H, T3c, T34, T1e;	       E T1f, T3i, TG, T2m, T10, T1S, T1J, T28, T2g;	       {		    E T4, T1N, T3, T2L, TN, T5, T1O, T1P, T1h, T1i;		    {			 E T1, T2, TL, TM;			 T1 = ri[0];			 T2 = ri[WS(is, 10)];			 TL = ii[0];			 TM = ii[WS(is, 10)];			 T4 = ri[WS(is, 5)];			 T1N = T1 - T2;			 T3 = T1 + T2;			 T2L = TL + TM;			 TN = TL - TM;			 T5 = ri[WS(is, 15)];			 T1O = ii[WS(is, 5)];			 T1P = ii[WS(is, 15)];		    }		    {			 E T1o, Tp, T2u, T13, T14, Ts, T2v, T1r, Tx, T1t, Tw, T2x, T18, Ty, T1u;			 E T1v;			 {			      E Tq, Tr, T1p, T1q;			      {				   E Tn, To, T11, T12;				   Tn = ri[WS(is, 8)];				   {					E TO, T6, T2M, T1Q;					TO = T4 - T5;					T6 = T4 + T5;					T2M = T1O + T1P;					T1Q = T1O - T1P;					T1d = TO + TN;					TP = TN - TO;					TD = T3 + T6;					T7 = T3 - T6;					T3b = T2L + T2M;					T2N = T2L - T2M;					T2f = T1N + T1Q;					T1R = T1N - T1Q;					To = ri[WS(is, 18)];				   }				   T11 = ii[WS(is, 8)];				   T12 = ii[WS(is, 18)];				   Tq = ri[WS(is, 13)];				   T1o = Tn - To;				   Tp = Tn + To;				   T2u = T11 + T12;				   T13 = T11 - T12;				   Tr = ri[WS(is, 3)];				   T1p = ii[WS(is, 13)];				   T1q = ii[WS(is, 3)];			      }			      {				   E Tu, Tv, T16, T17;				   Tu = ri[WS(is, 12)];				   T14 = Tq - Tr;				   Ts = Tq + Tr;				   T2v = T1p + T1q;				   T1r = T1p - T1q;				   Tv = ri[WS(is, 2)];				   T16 = ii[WS(is, 12)];				   T17 = ii[WS(is, 2)];				   Tx = ri[WS(is, 17)];				   T1t = Tu - Tv;				   Tw = Tu + Tv;				   T2x = T16 + T17;				   T18 = T16 - T17;				   Ty = ri[WS(is, 7)];				   T1u = ii[WS(is, 17)];				   T1v = ii[WS(is, 7)];			      }			 }			 {			      E TH, T19, T1w, TI;			      {				   E Tt, T2w, T35, TA, T2z, T36, Tz, T2y;				   TH = Tp + Ts;				   Tt = Tp - Ts;				   T19 = Tx - Ty;				   Tz = Tx + Ty;				   T2y = T1u + T1v;				   T1w = T1u - T1v;				   T2w = T2u - T2v;				   T35 = T2u + T2v;				   TI = Tw + Tz;				   TA = Tw - Tz;				   T2z = T2x - T2y;				   T36 = T2x + T2y;				   T2U = Tt - TA;				   TB = Tt + TA;				   T2P = T2w + T2z;				   T2A = T2w - T2z;				   T3d = T35 + T36;				   T37 = T35 - T36;			      }			      {				   E T1s, T29, T1x, T2a, T15, T1a;				   T15 = T13 - T14;				   T1h = T14 + T13;				   T1i = T19 + T18;				   T1a = T18 - T19;				   T1s = T1o - T1r;				   T29 = T1o + T1r;				   T3j = TH - TI;				   TJ = TH + TI;				   T1x = T1t - T1w;				   T2a = T1t + T1w;				   T2n = T15 - T1a;				   T1b = T15 + T1a;				   T1T = T1s + T1x;				   T1y = T1s - T1x;				   T2b = T29 - T2a;				   T2h = T29 + T2a;			      }			 }		    }		    {			 E Ta, T1z, T2B, TS, TT, Td, T2C, T1C, Ti, T1E, Th, T2E, TX, Tj, T1F;			 E T1G;			 {			      E Tb, Tc, T1A, T1B;			      {				   E TQ, TR, T8, T9;				   T8 = ri[WS(is, 4)];				   T9 = ri[WS(is, 14)];				   T1j = T1h + T1i;				   T1Y = T1h - T1i;				   TQ = ii[WS(is, 4)];				   TR = ii[WS(is, 14)];				   Ta = T8 + T9;				   T1z = T8 - T9;				   Tb = ri[WS(is, 9)];				   T2B = TQ + TR;				   TS = TQ - TR;				   Tc = ri[WS(is, 19)];				   T1A = ii[WS(is, 9)];				   T1B = ii[WS(is, 19)];			      }			      {				   E Tf, Tg, TV, TW;				   Tf = ri[WS(is, 16)];				   TT = Tb - Tc;				   Td = Tb + Tc;				   T2C = T1A + T1B;				   T1C = T1A - T1B;				   Tg = ri[WS(is, 6)];				   TV = ii[WS(is, 16)];				   TW = ii[WS(is, 6)];				   Ti = ri[WS(is, 1)];				   T1E = Tf - Tg;				   Th = Tf + Tg;				   T2E = TV + TW;				   TX = TV - TW;				   Tj = ri[WS(is, 11)];				   T1F = ii[WS(is, 1)];				   T1G = ii[WS(is, 11)];			      }			 }			 {			      E TE, TY, T1H, TF;			      {				   E Te, T2D, T32, Tl, T2G, T33, Tk, T2F;				   TE = Ta + Td;				   Te = Ta - Td;				   TY = Ti - Tj;				   Tk = Ti + Tj;				   T2F = T1F + T1G;				   T1H = T1F - T1G;				   T2D = T2B - T2C;				   T32 = T2B + T2C;				   TF = Th + Tk;				   Tl = Th - Tk;				   T2G = T2E - T2F;				   T33 = T2E + T2F;				   T2V = Te - Tl;				   Tm = Te + Tl;				   T2O = T2D + T2G;				   T2H = T2D - T2G;				   T3c = T32 + T33;				   T34 = T32 - T33;			      }			      {				   E T1D, T26, T1I, T27, TU, TZ;				   TU = TS - TT;				   T1e = TT + TS;				   T1f = TY + TX;				   TZ = TX - TY;				   T1D = T1z - T1C;				   T26 = T1z + T1C;				   T3i = TE - TF;				   TG = TE + TF;				   T1I = T1E - T1H;				   T27 = T1E + T1H;				   T2m = TU - TZ;				   T10 = TU + TZ;				   T1S = T1D + T1I;				   T1J = T1D - T1I;				   T28 = T26 - T27;				   T2g = T26 + T27;			      }			 }		    }	       }	       {		    E T1g, T3g, T3f, T2S, T2R, T2k, T2j;		    {			 E T2s, T2r, TC, T2Q;			 T2s = Tm - TB;			 TC = Tm + TB;			 T1g = T1e + T1f;			 T1Z = T1e - T1f;			 T2r = FNMS(KP250000000, TC, T7);			 ro[WS(os, 10)] = T7 + TC;			 T2Q = T2O + T2P;			 T2S = T2O - T2P;			 {			      E T2K, T2I, T2t, T2J;			      T2K = FMA(KP618033988, T2A, T2H);			      T2I = FNMS(KP618033988, T2H, T2A);			      T2t = FNMS(KP559016994, T2s, T2r);			      T2J = FMA(KP559016994, T2s, T2r);			      ro[WS(os, 18)] = FMA(KP951056516, T2I, T2t);			      ro[WS(os, 2)] = FNMS(KP951056516, T2I, T2t);			      ro[WS(os, 6)] = FMA(KP951056516, T2K, T2J);			      ro[WS(os, 14)] = FNMS(KP951056516, T2K, T2J);			      T2R = FNMS(KP250000000, T2Q, T2N);			 }			 io[WS(os, 10)] = T2N + T2Q;		    }		    {			 E T30, T2Z, TK, T3e;			 TK = TG + TJ;			 T30 = TG - TJ;			 {			      E T2T, T2X, T2Y, T2W;			      T2T = FNMS(KP559016994, T2S, T2R);			      T2X = FMA(KP559016994, T2S, T2R);			      T2Y = FMA(KP618033988, T2U, T2V);			      T2W = FNMS(KP618033988, T2V, T2U);			      io[WS(os, 14)] = FMA(KP951056516, T2Y, T2X);			      io[WS(os, 6)] = FNMS(KP951056516, T2Y, T2X);			      io[WS(os, 18)] = FNMS(KP951056516, T2W, T2T);			      io[WS(os, 2)] = FMA(KP951056516, T2W, T2T);			      T2Z = FNMS(KP250000000, TK, TD);			 }			 ro[0] = TD + TK;			 T3e = T3c + T3d;			 T3g = T3c - T3d;			 {			      E T31, T39, T3a, T38;			      T31 = FMA(KP559016994, T30, T2Z);			      T39 = FNMS(KP559016994, T30, T2Z);			      T3a = FNMS(KP618033988, T34, T37);			      T38 = FMA(KP618033988, T37, T34);			      ro[WS(os, 8)] = FMA(KP951056516, T3a, T39);			      ro[WS(os, 12)] = FNMS(KP951056516, T3a, T39);			      ro[WS(os, 16)] = FMA(KP951056516, T38, T31);			      ro[WS(os, 4)] = FNMS(KP951056516, T38, T31);			      T3f = FNMS(KP250000000, T3e, T3b);			 }			 io[0] = T3b + T3e;		    }		    {			 E T24, T23, T1c, T2i;			 T1c = T10 + T1b;			 T24 = T10 - T1b;			 {			      E T3h, T3l, T3m, T3k;			      T3h = FMA(KP559016994, T3g, T3f);			      T3l = FNMS(KP559016994, T3g, T3f);			      T3m = FNMS(KP618033988, T3i, T3j);			      T3k = FMA(KP618033988, T3j, T3i);			      io[WS(os, 12)] = FMA(KP951056516, T3m, T3l);			      io[WS(os, 8)] = FNMS(KP951056516, T3m, T3l);			      io[WS(os, 16)] = FNMS(KP951056516, T3k, T3h);			      io[WS(os, 4)] = FMA(KP951056516, T3k, T3h);			      T23 = FNMS(KP250000000, T1c, TP);			 }			 io[WS(os, 5)] = TP + T1c;			 T2i = T2g + T2h;			 T2k = T2g - T2h;			 {			      E T25, T2d, T2e, T2c;			      T25 = FMA(KP559016994, T24, T23);			      T2d = FNMS(KP559016994, T24, T23);			      T2e = FNMS(KP618033988, T28, T2b);			      T2c = FMA(KP618033988, T2b, T28);			      io[WS(os, 17)] = FMA(KP951056516, T2e, T2d);			      io[WS(os, 13)] = FNMS(KP951056516, T2e, T2d);			      io[WS(os, 9)] = FMA(KP951056516, T2c, T25);			      io[WS(os, 1)] = FNMS(KP951056516, T2c, T25);			      T2j = FNMS(KP250000000, T2i, T2f);			 }			 ro[WS(os, 5)] = T2f + T2i;		    }		    {			 E T1m, T1l, T1k, T1U;			 T1k = T1g + T1j;			 T1m = T1g - T1j;			 {			      E T2l, T2p, T2q, T2o;			      T2l = FMA(KP559016994, T2k, T2j);			      T2p = FNMS(KP559016994, T2k, T2j);			      T2q = FNMS(KP618033988, T2m, T2n);			      T2o = FMA(KP618033988, T2n, T2m);			      ro[WS(os, 17)] = FNMS(KP951056516, T2q, T2p);			      ro[WS(os, 13)] = FMA(KP951056516, T2q, T2p);			      ro[WS(os, 9)] = FNMS(KP951056516, T2o, T2l);			      ro[WS(os, 1)] = FMA(KP951056516, T2o, T2l);			      T1l = FNMS(KP250000000, T1k, T1d);			 }			 io[WS(os, 15)] = T1d + T1k;			 T1U = T1S + T1T;			 T1W = T1S - T1T;			 {			      E T1n, T1L, T1M, T1K;			      T1n = FNMS(KP559016994, T1m, T1l);			      T1L = FMA(KP559016994, T1m, T1l);			      T1M = FMA(KP618033988, T1y, T1J);			      T1K = FNMS(KP618033988, T1J, T1y);			      io[WS(os, 19)] = FMA(KP951056516, T1M, T1L);			      io[WS(os, 11)] = FNMS(KP951056516, T1M, T1L);			      io[WS(os, 7)] = FMA(KP951056516, T1K, T1n);

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -