📄 n1k7_14.s
字号:
/* * Copyright (c) 2003 Matteo Frigo * Copyright (c) 2003 Massachusetts Institute of Technology * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA * *//* This file was automatically generated --- DO NOT EDIT *//* Generated on Sat Jul 5 21:50:59 EDT 2003 */#include "config.h"/* $$$-mode: VECTGRADE_FULL succeeded (590 steps) *//* Generated by: /homee/stevenj/cvs/fftw3.0.1/genfft-k7/gen_notw -no-randomized-cse -n 14 -name n1k7_14 *//* * Generator Id's : * $Id: algsimp.ml,v 1.3 2003/03/15 20:29:42 stevenj Exp $ * $Id: fft.ml,v 1.3 2003/03/15 20:29:43 stevenj Exp $ * $Id: gen_notw.ml,v 1.11 2003/04/18 01:21:45 athena Exp $ *//* The following asm code is Copyright (c) 2000-2001 Stefan Kral */.section .rodata .balign 64KP781831482KN781831482: .float +0.781831482468029808708444526674057750232334519, -0.781831482468029808708444526674057750232334519KP433883739KN433883739: .float +0.433883739117558120475768332848358754609990728, -0.433883739117558120475768332848358754609990728KP974927912KN974927912: .float +0.974927912181823607018131682993931217232785801, -0.974927912181823607018131682993931217232785801KP900968867KP900968867: .float +0.900968867902419126236102319507445051165919162, +0.900968867902419126236102319507445051165919162KP623489801KP623489801: .float +0.623489801858733530525004884004239810632274731, +0.623489801858733530525004884004239810632274731KP222520933KP222520933: .float +0.222520933956314404288902564496794759466355569, +0.222520933956314404288902564496794759466355569.text.text .balign 64n1k7_14: subl $268, %esp femms movl %ebx, 264(%esp) movl 288(%esp), %edx movl 292(%esp), %ebx movl %esi, 260(%esp) movl %edi, 256(%esp) movl 272(%esp), %eax movl %ebp, 252(%esp) movl 280(%esp), %ecx sall $2, 300(%esp) leal (,%edx,4), %edx sall $2, 304(%esp) leal (,%ebx,4), %ebx .p2align 4,,7.L0: /* promise simd cell size = 8 */ leal (%edx,%edx,2), %esi movq (%eax), %mm1 movq (%eax,%edx,4), %mm3 leal (%edx,%esi,2), %edi movq (%eax,%esi), %mm6 leal (%edx,%edx,4), %esi leal (%edi,%edx,4), %ebp movq (%eax,%edi), %mm0 movq (%eax,%esi,2), %mm7 movq %mm1, %mm2 movq %mm3, %mm4 leal (%edx,%edx,8), %esi movq (%eax,%ebp), %mm5 leal (%ebp,%edx,2), %edi leal (%edx,%edx,2), %ebp pfsub %mm0, %mm2 pfadd %mm0, %mm1 movq %mm7, %mm0 pfadd %mm6, %mm7 pfadd %mm5, %mm3 movq %mm2, 8(%esp) pfsub %mm5, %mm4 pfsub %mm6, %mm0 movq %mm1, 0(%esp) movq %mm3, %mm2 pfsubr %mm7, %mm3 movq %mm4, %mm6 pfadd %mm0, %mm4 pfadd %mm7, %mm2 pswapd %mm3, %mm3 pfsub %mm0, %mm6 movq %mm3, %mm5 movq %mm3, %mm1 pfmul KP781831482KN781831482, %mm3 movq %mm4, 80(%esp) pfmul KP433883739KN433883739, %mm1 movq %mm2, 72(%esp) pswapd %mm6, %mm6 pfmul KP974927912KN974927912, %mm5 movq %mm6, %mm7 movq %mm6, %mm0 pfmul KP781831482KN781831482, %mm6 movq %mm3, 16(%esp) movq %mm4, %mm3 pfmul KP433883739KN433883739, %mm7 pfmul KP974927912KN974927912, %mm0 pfmul KP900968867KP900968867, %mm3 movq %mm1, 88(%esp) movq %mm4, %mm1 pfmul KP623489801KP623489801, %mm4 movq %mm5, 96(%esp) movq %mm2, %mm5 pfmul KP222520933KP222520933, %mm1 pfmul KP222520933KP222520933, %mm5 movq %mm3, 24(%esp) movq %mm2, %mm3 pfmul KP900968867KP900968867, %mm2 movq %mm4, 32(%esp) pfmul KP623489801KP623489801, %mm3 movq %mm1, 40(%esp) movq %mm5, 48(%esp) movq (%eax,%ebp,2), %mm4 movq (%eax,%edi), %mm1 leal (%edx,%edx,4), %edi movq %mm4, %mm5 movq %mm2, 56(%esp) movq (%eax,%edx,8), %mm2 pfsub %mm1, %mm5 movq %mm3, 64(%esp) movq (%eax,%edx), %mm3 pfadd %mm1, %mm4 movq %mm2, %mm1 pfsub %mm3, %mm2 pfadd %mm3, %mm1 movq %mm5, %mm3 pfadd %mm2, %mm5 pfsub %mm2, %mm3 movq %mm5, %mm2 movq %mm5, 120(%esp) movq %mm3, 104(%esp) movq %mm5, %mm3 pfmul KP623489801KP623489801, %mm5 pfmul KP222520933KP222520933, %mm2 pfmul KP900968867KP900968867, %mm3 movq %mm5, 176(%esp) movq %mm2, 112(%esp) movq %mm3, 168(%esp) movq %mm4, %mm3 pfadd %mm1, %mm4 pfsubr %mm1, %mm3 movq %mm4, 144(%esp) movq (%eax,%esi), %mm1 movq %mm4, %mm2 movq %mm4, %mm5 pfmul KP900968867KP900968867, %mm4 pfmul KP222520933KP222520933, %mm5 movq %mm3, 128(%esp) pfmul KP623489801KP623489801, %mm2 movq %mm4, 160(%esp) movq (%eax,%edx,2), %mm3 movq (%eax,%ebp,4), %mm4 leal (%ebx,%ebx,2), %ebp movq %mm5, 152(%esp) movq %mm3, %mm5 pfadd %mm1, %mm3 movq %mm2, 136(%esp) movq (%eax,%edi), %mm2 leal (%ebx,%ebp,2), %esi pfsub %mm1, %mm5 /* simd data load/store barrier */ leal (%ebx,%ebp,4), %edi movq %mm4, %mm1 leal (%esi,%ebx,4), %ebp addl 300(%esp), %eax pfsub %mm2, %mm1 pfadd %mm2, %mm4 movq %mm5, %mm2 pfsub %mm1, %mm5 pfadd %mm1, %mm2 movq %mm3, %mm1 pfadd %mm4, %mm3 pfsub %mm4, %mm1 pswapd %mm5, %mm5 movq %mm5, %mm4 pswapd %mm1, %mm1 pfmul KP974927912KN974927912, %mm4 pfsub %mm7, %mm4 movq %mm5, %mm7 pfmul KP433883739KN433883739, %mm5 pfmul KP781831482KN781831482, %mm7 movq %mm4, 208(%esp) movq %mm1, %mm4 pfmul KP781831482KN781831482, %mm4 pfsub %mm6, %mm5 movq %mm2, %mm6 pfadd %mm7, %mm0 movq %mm1, %mm7 pfmul KP974927912KN974927912, %mm1 pfmul KP623489801KP623489801, %mm6 pfmul KP433883739KN433883739, %mm7 movq %mm5, 216(%esp) movq %mm2, %mm5 pfsub 96(%esp), %mm4 pfmul KP222520933KP222520933, %mm5 pfadd 88(%esp), %mm1 pfsub 168(%esp), %mm6 pfadd 16(%esp), %mm7 movq %mm4, 184(%esp) movq %mm3, %mm4 pfsubr 176(%esp), %mm5 pfmul KP623489801KP623489801, %mm4 movq %mm1, 192(%esp) movq %mm3, %mm1 pfmul KP222520933KP222520933, %mm1 movq %mm7, 200(%esp) movq %mm2, %mm7 pfadd 120(%esp), %mm2 pfmul KP900968867KP900968867, %mm7 pfsub 160(%esp), %mm4 pfsubr 136(%esp), %mm1 pfadd 112(%esp), %mm7 movq %mm4, 224(%esp) movq %mm3, %mm4 pfadd 144(%esp), %mm3 pfmul KP900968867KP900968867, %mm4 movq %mm1, 232(%esp) movq 8(%esp), %mm1 pfadd 152(%esp), %mm4 movq %mm4, 240(%esp) movq 80(%esp), %mm4 pfadd %mm1, %mm4 pfadd %mm4, %mm2 movq %mm1, %mm4 pfsub 40(%esp), %mm4 movq %mm2, (%ecx,%esi) movq 104(%esp), %mm2 leal (%ebx,%ebx,2), %esi pswapd %mm2, %mm2 pfadd %mm4, %mm6 movq %mm2, %mm4 pfmul KP433883739KN433883739, %mm4 pfadd %mm4, %mm0 movq %mm6, %mm4 pfsub %mm0, %mm6 pfadd %mm0, %mm4 movq %mm1, %mm0 pfadd 32(%esp), %mm1 pfsub 24(%esp), %mm0 movq %mm6, (%ecx,%edi) movq %mm2, %mm6 pfmul KP974927912KN974927912, %mm2 movq %mm4, (%ecx,%ebx) leal (%ebx,%ebx,4), %edi pfmul KP781831482KN781831482, %mm6 pfsubr %mm1, %mm7 movq 72(%esp), %mm1 pfadd %mm0, %mm5 pfadd 216(%esp), %mm2 pfsubr 208(%esp), %mm6 movq %mm7, %mm4 movq %mm5, %mm0 pfsub %mm2, %mm7 pfadd %mm2, %mm4 movq 0(%esp), %mm2 pfsub %mm6, %mm0 pfadd %mm6, %mm5 movq %mm7, (%ecx,%ebp) movq 128(%esp), %mm7 leal (%ebx,%ebx,8), %ebp movq %mm2, %mm6 movq %mm4, (%ecx,%esi) pfadd %mm2, %mm1 movq %mm0, (%ecx,%edi) movq %mm2, %mm0 pfsub 56(%esp), %mm2 pfadd 64(%esp), %mm6 movq %mm5, (%ecx,%ebp) pswapd %mm7, %mm7 pfsub 48(%esp), %mm0 pfadd %mm1, %mm3 movq %mm7, %mm4 movq %mm7, %mm5 pfmul KP781831482KN781831482, %mm7 pfmul KP974927912KN974927912, %mm4 pfadd 232(%esp), %mm2 pfmul KP433883739KN433883739, %mm5 pfsub 240(%esp), %mm6 pfadd 224(%esp), %mm0 pfadd 192(%esp), %mm7 pfsubr 200(%esp), %mm4 pfsubr 184(%esp), %mm5 movq %mm3, (%ecx) movq %mm6, %mm1 movq %mm0, %mm3 pfsub %mm4, %mm1 pfadd %mm4, %mm6 movq %mm2, %mm4 pfsub %mm5, %mm3 pfadd %mm5, %mm0 pfsub %mm7, %mm2 movq %mm1, (%ecx,%ebx,4) pfadd %mm7, %mm4 movq %mm6, (%ecx,%edi,2) movq %mm3, (%ecx,%esi,2) movq %mm0, (%ecx,%ebx,8) movq %mm2, (%ecx,%esi,4) movq %mm4, (%ecx,%ebx,2) addl 304(%esp), %ecx decl 296(%esp) jnz .L0 femms movl 264(%esp), %ebx movl 260(%esp), %esi movl 256(%esp), %edi movl 252(%esp), %ebp addl $268, %esp ret .section .rodatanam: .string "n1k7_14" .align 4desc: .long 14 .long nam .double 74 .double 36 .double 0 .double 0 .long fftwf_kdft_k7_mgenus .long 0 .long 0 .long 0 .long 0.text .align 4.globl fftwf_codelet_n1k7_14fftwf_codelet_n1k7_14: subl $12,%esp addl $-4,%esp pushl $desc pushl $n1k7_14 pushl 28(%esp) call fftwf_kdft_register addl $16,%esp addl $12,%esp ret
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -