📄 n1k7i_16.s
字号:
/*
 * Copyright (c) 2003 Matteo Frigo
 * Copyright (c) 2003 Massachusetts Institute of Technology
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 *
 */

/* This file was automatically generated --- DO NOT EDIT */
/* Generated on Sat Jul  5 21:51:34 EDT 2003 */

#include "config.h"

/* cheap-mode: VECTGRADE_FULL succeeded. (330 steps) */
/* Generated by: /homee/stevenj/cvs/fftw3.0.1/genfft-k7/gen_notw -no-randomized-cse -n 16 -sign 1 -name n1k7i_16 */

/*
 * Generator Id's :
 * $Id: algsimp.ml,v 1.3 2003/03/15 20:29:42 stevenj Exp $
 * $Id: fft.ml,v 1.3 2003/03/15 20:29:43 stevenj Exp $
 * $Id: gen_notw.ml,v 1.11 2003/04/18 01:21:45 athena Exp $
 */

/* The following asm code is Copyright (c) 2000-2001 Stefan Kral */

/*
 * Syntax: GNU as, AT&T operand order (op src, dst), 32-bit x86.
 * The file is run through the C preprocessor first (see the #include above),
 * so comments use C block-comment form only.
 */

/*
 * Packed single-precision constants and sign masks.  Each entry is one
 * 8-byte quantity used as a memory operand of a 64-bit MMX/3DNow! instruction.
 *   KP707106781KP707106781 : (0.7071..., 0.7071...)   ~ sqrt(1/2) in both lanes
 *   KP382683432KP923879532 : (0.3826..., 0.9238...)   low lane, high lane
 *   KP923879532KP382683432 : (0.9238..., 0.3826...)   low lane, high lane
 *   chs_lo                 : sign bit set in the low 32-bit lane only
 *   chs_hi                 : sign bit set in the high 32-bit lane only
 * pxor with chs_lo / chs_hi flips the sign of one float of a packed pair.
 */
.section .rodata
        .balign 64
KP707106781KP707106781: .float +0.707106781186547524400844362104849039284835938, +0.707106781186547524400844362104849039284835938
chs_lo: .long 0x80000000, 0x00000000
KP382683432KP923879532: .float +0.382683432365089771728459984030398866761344562, +0.923879532511286756128183189396788286822416626
KP923879532KP382683432: .float +0.923879532511286756128183189396788286822416626, +0.382683432365089771728459984030398866761344562
chs_hi: .long 0x00000000, 0x80000000

/*
 * n1k7i_16 -- generated size-16, sign +1, no-twiddle kernel (see the
 * "Generated by" line above), written with 3DNow! / Extended 3DNow!
 * instructions (pfadd, pfsub, pfsubr, pfmul, pfacc, pfnacc, pfpnacc, pswapd).
 *
 * Calling convention: all arguments are read from the stack.  The function
 * lowers %esp by 132, so the return address sits at 132(%esp) and the
 * 4-byte argument slots start at 136(%esp):
 *
 *   136(%esp)  arg 1   never read by this code
 *   140(%esp)  arg 2   input base pointer          -> %eax
 *   144(%esp)  arg 3   never read by this code
 *   148(%esp)  arg 4   output base pointer         -> %ebx
 *   152(%esp)  arg 5   input element stride        -> %ecx (multiplied by 4)
 *   156(%esp)  arg 6   output element stride       -> %esi (multiplied by 4)
 *   160(%esp)  arg 7   loop count, decremented in place
 *   164(%esp)  arg 8   per-iteration input step  (multiplied by 4 in place)
 *   168(%esp)  arg 9   per-iteration output step (multiplied by 4 in place)
 *
 * NOTE(review): this layout presumably corresponds to FFTW's
 * (ri, ii, ro, io, is, os, v, ivs, ovs) kernel signature -- confirm against
 * the C prototype expected by fftwf_kdft_register.
 *
 * Local frame:
 *     0..111(%esp)  fourteen 8-byte spill slots for %mm temporaries
 *   116(%esp) saved %ebp   120(%esp) saved %edi
 *   124(%esp) saved %esi   128(%esp) saved %ebx
 *
 * Register roles inside the loop:
 *   %eax = input pointer, first half      %edx = %eax + 8 * %ecx
 *   %ebx = output pointer, first half     %edi = %ebx + 8 * %esi
 *   %ecx = input stride in bytes          %esi = output stride in bytes
 *   %ebp = scratch for 3x / 5x / 7x stride multiples
 *
 * Each iteration loads sixteen 8-byte elements (%eax + k*%ecx and
 * %edx + k*%ecx, k = 0..7) and stores sixteen 8-byte elements
 * (%ebx + k*%esi and %edi + k*%esi, k = 0..7).
 *
 * The loop is bottom-tested (decl / jnz), so the body always executes at
 * least once; the count in arg 7 must be non-zero on entry.
 *
 * Clobbers: %eax, %ecx, %edx, %mm0-%mm7, flags, and the argument slots at
 * 160/164/168(%esp).  %ebx, %esi, %edi and %ebp are restored before return.
 * femms is issued on entry and on exit.
 *
 * The instruction order below is the generator's schedule; do not reorder.
 */
.text
        .balign 64
n1k7i_16:
        subl $132, %esp
        femms
        movl %esi, 124(%esp)                    /* save %esi */
        movl 152(%esp), %ecx                    /* arg 5: input stride */
        movl 156(%esp), %esi                    /* arg 6: output stride */
        movl %ebx, 128(%esp)                    /* save %ebx */
        movl 140(%esp), %eax                    /* arg 2: input base */
        movl 148(%esp), %ebx                    /* arg 4: output base */
        movl %edi, 120(%esp)                    /* save %edi */
        sall $2, 164(%esp)                      /* arg 8 *= 4, in place */
        leal (,%ecx,4), %ecx                    /* %ecx *= 4 */
        movl %ebp, 116(%esp)                    /* save %ebp */
        sall $2, 168(%esp)                      /* arg 9 *= 4, in place */
        leal (,%esi,4), %esi                    /* %esi *= 4 */
        leal (%eax,%ecx,8), %edx                /* %edx = second half of the inputs */
        leal (%ebx,%esi,8), %edi                /* %edi = second half of the outputs */
        .p2align 4,,7
.L0:
        /* promise simd cell size = 8 */
        movq (%eax), %mm1
        movq (%edx), %mm0
        movq (%edx,%ecx,4), %mm3
        movq (%eax,%ecx,4), %mm4
        leal (%ecx,%ecx,2), %ebp                /* %ebp = 3 * %ecx */
        movq (%edx,%ecx,2), %mm7
        movq %mm1, %mm2
        pfadd %mm0, %mm1
        movq %mm4, %mm5
        pfsub %mm3, %mm4
        pfsub %mm0, %mm2
        movq (%eax,%ecx,2), %mm0
        pfadd %mm3, %mm5
        movq %mm1, %mm6
        movq %mm4, 24(%esp)
        movq %mm2, 0(%esp)
        movq (%eax,%ebp,2), %mm4                /* offset 6 * %ecx */
        movq (%edx,%ebp,2), %mm2                /* offset 6 * %ecx */
        movq %mm0, %mm3
        pfsub %mm5, %mm1
        leal (%ecx,%ecx,4), %ebp                /* %ebp = 5 * %ecx */
        pfadd %mm5, %mm6
        pfsub %mm7, %mm0
        movq %mm2, %mm5
        pfsub %mm4, %mm2
        pfadd %mm7, %mm3
        movq %mm1, 32(%esp)
        pfadd %mm4, %mm5
        movq %mm6, 56(%esp)
        movq (%edx,%ecx), %mm4
        movq (%eax,%ecx), %mm6
        pswapd %mm2, %mm7
        movq %mm3, %mm1
        pfpnacc %mm0, %mm7
        pfpnacc %mm2, %mm0
        movq %mm6, %mm2
        pfsubr %mm5, %mm3
        pfadd %mm5, %mm1
        movq %mm7, %mm5
        pfsub %mm4, %mm6
        pfnacc %mm0, %mm7
        pfacc %mm5, %mm0
        movq %mm3, 40(%esp)
        movq (%edx,%ebp), %mm5                  /* offset 5 * %ecx */
        movq (%eax,%ebp), %mm3                  /* offset 5 * %ecx */
        leal (%ecx,%ecx,2), %ebp                /* %ebp = 3 * %ecx */
        movq %mm1, 48(%esp)
        movq %mm6, 64(%esp)
        pfadd %mm4, %mm2
        pfmul KP707106781KP707106781, %mm7
        leal (%ecx,%ebp,2), %ebp                /* %ebp = 7 * %ecx */
        pfmul KP707106781KP707106781, %mm0
        movq (%eax,%ebp), %mm1                  /* offset 7 * %ecx */
        movq (%edx,%ebp), %mm6                  /* offset 7 * %ecx */
        leal (%ecx,%ecx,2), %ebp                /* %ebp = 3 * %ecx */
        movq %mm3, %mm4
        pfadd %mm5, %mm3
        pfsub %mm5, %mm4
        movq %mm7, 8(%esp)
        movq (%edx,%ebp), %mm7                  /* offset 3 * %ecx */
        movq %mm6, %mm5
        movq %mm0, 16(%esp)
        movq (%eax,%ebp), %mm0                  /* offset 3 * %ecx */
        pfsub %mm1, %mm6
        pfadd %mm1, %mm5
        /* simd data load/store barrier */
        leal (%esi,%esi,2), %ebp                /* %ebp = 3 * %esi */
        pswapd %mm4, %mm4
        addl 164(%esp), %eax                    /* advance input pointers for the next pass */
        addl 164(%esp), %edx
        movq %mm0, %mm1
        pfsub %mm7, %mm0
        pswapd %mm6, %mm6
        pxor chs_lo, %mm4                       /* negate low lane */
        pfadd %mm7, %mm1
        movq %mm5, %mm7
        pxor chs_lo, %mm0                       /* negate low lane */
        pfsub %mm1, %mm7
        pfadd %mm1, %mm5
        movq %mm6, %mm1
        pfadd %mm0, %mm6
        pfsub %mm0, %mm1
        movq %mm6, %mm0
        pfmul KP382683432KP923879532, %mm6
        pfmul KP923879532KP382683432, %mm0
        movq %mm6, 80(%esp)
        movq %mm2, %mm6
        pfadd %mm3, %mm2
        movq %mm0, 72(%esp)
        movq %mm1, %mm0
        pfmul KP382683432KP923879532, %mm1
        pfsub %mm3, %mm6
        pswapd %mm7, %mm3
        pfmul KP923879532KP382683432, %mm0
        pfpnacc %mm6, %mm3
        movq %mm1, 88(%esp)
        movq 64(%esp), %mm1
        pfpnacc %mm7, %mm6
        movq %mm2, %mm7
        pfadd %mm5, %mm2
        movq %mm0, 104(%esp)
        pfsubr %mm5, %mm7
        movq 56(%esp), %mm5
        movq %mm1, %mm0
        pfsub %mm4, %mm1
        pfadd %mm4, %mm0
        movq 48(%esp), %mm4
        pswapd %mm7, %mm7
        movq %mm1, 96(%esp)
        movq %mm5, %mm1
        pxor chs_hi, %mm7                       /* negate high lane */
        pfadd %mm4, %mm5
        pfsub %mm4, %mm1
        movq %mm5, %mm4
        pfsub %mm2, %mm5
        pfadd %mm2, %mm4
        movq %mm3, %mm2
        pfnacc %mm6, %mm3
        movq %mm5, (%edi)
        movq 40(%esp), %mm5
        pfacc %mm2, %mm6
        pswapd %mm0, %mm2
        pfmul KP923879532KP382683432, %mm0
        movq %mm4, (%ebx)
        movq %mm1, %mm4
        pfadd %mm7, %mm1
        pfmul KP707106781KP707106781, %mm3
        pfsub %mm7, %mm4
        pswapd %mm5, %mm5
        movq 32(%esp), %mm7
        pfmul KP707106781KP707106781, %mm6
        pxor chs_hi, %mm5                       /* negate high lane */
        pfmul KP923879532KP382683432, %mm2
        pfpnacc 88(%esp), %mm0
        movq %mm1, (%ebx,%esi,4)
        movq %mm7, %mm1
        movq %mm4, (%edi,%esi,4)
        pfadd %mm5, %mm1
        pfsub %mm5, %mm7
        movq %mm1, %mm5
        pfadd %mm6, %mm1
        movq %mm7, %mm4
        pfsub %mm3, %mm7
        pfsub %mm6, %mm5
        pfadd %mm3, %mm4
        movq 104(%esp), %mm3
        movq %mm1, (%ebx,%esi,2)
        movq 24(%esp), %mm1
        movq %mm7, (%edi,%ebp,2)                /* offset 6 * %esi */
        movq 0(%esp), %mm7
        movq %mm5, (%edi,%esi,2)
        pfpnacc %mm2, %mm3
        movq 16(%esp), %mm2
        movq %mm4, (%ebx,%ebp,2)                /* offset 6 * %esi */
        pswapd %mm1, %mm1
        leal (%esi,%esi,4), %ebp                /* %ebp = 5 * %esi */
        movq %mm7, %mm4
        pxor chs_lo, %mm1                       /* negate low lane */
        movq %mm3, %mm6
        pfnacc %mm0, %mm3
        pfacc %mm6, %mm0
        movq 96(%esp), %mm6
        pfadd %mm1, %mm7
        pfsub %mm1, %mm4
        pswapd %mm6, %mm1
        pfmul KP382683432KP923879532, %mm6
        movq %mm7, %mm5
        pfsub %mm2, %mm7
        pfmul KP382683432KP923879532, %mm1
        pfadd %mm2, %mm5
        movq %mm7, %mm2
        pfadd %mm3, %mm7
        pfpnacc 72(%esp), %mm6
        pfsub %mm3, %mm2
        movq %mm5, %mm3
        pfadd %mm0, %mm5
        movq %mm7, (%ebx,%ebp)                  /* offset 5 * %esi */
        movq 80(%esp), %mm7
        pfsub %mm0, %mm3
        movq %mm4, %mm0
        movq %mm2, (%edi,%ebp)                  /* offset 5 * %esi */
        movq 8(%esp), %mm2
        leal (%esi,%esi,2), %ebp                /* %ebp = 3 * %esi */
        movq %mm5, (%ebx,%esi)
        pfpnacc %mm1, %mm7
        movq %mm3, (%edi,%esi)
        pfadd %mm2, %mm4
        pfsub %mm2, %mm0
        movq %mm7, %mm5
        pfnacc %mm6, %mm7
        pfacc %mm5, %mm6
        movq %mm4, %mm2
        movq %mm0, %mm3
        pfadd %mm7, %mm0
        pfsub %mm7, %mm3
        pfsub %mm6, %mm2
        pfadd %mm6, %mm4
        movq %mm2, (%edi,%ebp)                  /* offset 3 * %esi */
        movq %mm4, (%ebx,%ebp)                  /* offset 3 * %esi */
        leal (%esi,%esi,2), %ebp                /* %ebp = 3 * %esi */
        leal (%esi,%ebp,2), %ebp                /* %ebp = 7 * %esi */
        movq %mm3, (%edi,%ebp)                  /* offset 7 * %esi */
        movq %mm0, (%ebx,%ebp)                  /* offset 7 * %esi */
        addl 168(%esp), %ebx                    /* advance output pointers for the next pass */
        addl 168(%esp), %edi
        decl 160(%esp)                          /* one pass done; loop while the count is non-zero */
        jnz .L0
        femms
        movl 128(%esp), %ebx                    /* restore saved registers */
        movl 124(%esp), %esi
        movl 120(%esp), %edi
        movl 116(%esp), %ebp
        addl $132, %esp
        ret

/*
 * Descriptor handed to fftwf_kdft_register together with the kernel address.
 * Layout as emitted: size (16), pointer to the name string, four doubles,
 * a pointer to fftwf_kdft_k7_pgenus, then four zero words.
 * NOTE(review): the doubles 72 / 12 / 0 / 0 are presumably operation counts
 * and the trailing words stride constraints -- confirm against the
 * descriptor struct declared in the FFTW sources.
 */
.section .rodata
nam:
        .string "n1k7i_16"
        .align 4
desc:
        .long 16
        .long nam
        .double 72
        .double 12
        .double 0
        .double 0
        .long fftwf_kdft_k7_pgenus
        .long 0
        .long 0
        .long 0
        .long 0

/*
 * fftwf_codelet_n1k7i_16 -- registration stub.
 *
 * Takes one 4-byte stack argument and forwards it:
 *     fftwf_kdft_register(<caller's arg 1>, n1k7i_16, &desc)
 *
 * Stack bookkeeping: %esp is lowered by 12 + 4 bytes, then three arguments
 * are pushed right-to-left.  Just before the third push %esp is 24 bytes
 * below its entry value, so 28(%esp) addresses the caller's first argument.
 * After the call, 16 bytes (three arguments plus the 4-byte pad) and then
 * the initial 12 bytes are released.
 */
.text
        .align 4
.globl fftwf_codelet_n1k7i_16
fftwf_codelet_n1k7i_16:
        subl $12,%esp
        addl $-4,%esp
        pushl $desc
        pushl $n1k7i_16
        pushl 28(%esp)                          /* caller's first argument */
        call fftwf_kdft_register
        addl $16,%esp
        addl $12,%esp
        ret
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -