📄 f1k7i_8.s
字号:
/* * Copyright (c) 2003 Matteo Frigo * Copyright (c) 2003 Massachusetts Institute of Technology * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA * *//* This file was automatically generated --- DO NOT EDIT *//* Generated on Sat Jul 5 21:53:21 EDT 2003 */#include "config.h"/* cheap-mode: VECTGRADE_FULL succeeded. (136 steps) *//* Generated by: /homee/stevenj/cvs/fftw3.0.1/genfft-k7/gen_twiddle -no-randomized-cse -dif -n 8 -sign 1 -name f1k7i_8 *//* * Generator Id's : * $Id: algsimp.ml,v 1.3 2003/03/15 20:29:42 stevenj Exp $ * $Id: fft.ml,v 1.3 2003/03/15 20:29:43 stevenj Exp $ * $Id: gen_twiddle.ml,v 1.13 2003/04/18 01:21:45 athena Exp $ *//* The following asm code is Copyright (c) 2000-2001 Stefan Kral */.section .rodata .balign 64chs_lo: .long 0x80000000, 0x00000000chs_hi: .long 0x00000000, 0x80000000KP707106781KP707106781: .float +0.707106781186547524400844362104849039284835938, +0.707106781186547524400844362104849039284835938.text.text .balign 64f1k7i_8: subl $60, %esp femms movl %ebx, 56(%esp) movl 76(%esp), %edx movl 84(%esp), %ebx movl 68(%esp), %ecx movl %esi, 52(%esp) movl 72(%esp), %eax movl %edi, 48(%esp) movl 80(%esp), %esi movl %ebp, 44(%esp) leal (,%edx,4), %edx leal (,%ebx,4), %ebx .p2align 4,,7.L0: /* promise simd cell size = 8 */ movq (%ecx,%edx,4), %mm0 movq (%ecx), %mm1 leal (%edx,%edx,2), %edi movq (%ecx,%edx,2), %mm4 leal (%edx,%edx,4), %ebp movq (%ecx,%edx), %mm7 movq (%ecx,%edi,2), %mm3 movq (%ecx,%ebp), %mm6 movq %mm1, %mm2 pfsub %mm0, %mm1 movq %mm4, %mm5 pfadd %mm0, %mm2 movq %mm7, %mm0 pfsub %mm3, %mm5 pfadd %mm3, %mm4 movq (%ecx,%edi), %mm3 leal (%ebp,%edx,2), %edi movq %mm1, 0(%esp) pfsub %mm6, %mm7 leal (%edx,%edx,2), %ebp movq (%ecx,%edi), %mm1 pfadd %mm6, %mm0 movq %mm5, 8(%esp) movq %mm2, %mm5 leal (%edx,%ebp,2), %edi pfadd %mm4, %mm2 leal (%edx,%edx,4), %ebp pfsub %mm4, %mm5 movq %mm1, %mm6 pfsub %mm3, %mm1 movq %mm0, %mm4 pfadd %mm3, %mm6 movq %mm7, %mm3 pfpnacc %mm1, %mm3 pswapd %mm1, %mm1 pfadd %mm6, %mm0 pfsubr %mm6, %mm4 movq 8(%esp), %mm6 pfpnacc %mm7, %mm1 movq %mm2, %mm7 pfadd %mm0, %mm2 pfsub %mm0, %mm7 pswapd %mm6, %mm6 movq 0(%esp), %mm0 pswapd %mm4, %mm4 pxor chs_lo, %mm6 movq %mm2, 16(%esp) pxor chs_hi, %mm4 movq %mm0, %mm2 pfadd %mm6, %mm2 pfsub %mm6, %mm0 movq %mm1, %mm6 pfnacc %mm3, %mm1 pfacc %mm6, %mm3 pswapd %mm7, %mm6 pfmul KP707106781KP707106781, %mm1 pfmul KP707106781KP707106781, %mm3 movq %mm1, 24(%esp) movq 24(%eax), %mm1 pfmul %mm1, %mm7 pfmul %mm1, %mm6 movq %mm5, %mm1 pfadd %mm4, %mm5 pfsub %mm4, %mm1 movq 8(%eax), %mm4 pfpnacc %mm6, %mm7 pswapd %mm5, %mm6 pfmul %mm4, %mm5 pfmul %mm4, %mm6 pswapd %mm1, %mm4 pfpnacc %mm6, %mm5 movq 40(%eax), %mm6 pfmul %mm6, %mm1 pfmul %mm6, %mm4 movq %mm2, %mm6 pfsub %mm3, %mm2 pfadd %mm3, %mm6 movq 32(%eax), %mm3 pfpnacc %mm4, %mm1 pswapd %mm2, %mm4 pfmul %mm3, %mm2 pfmul %mm3, %mm4 pswapd %mm6, %mm3 pfpnacc %mm4, %mm2 movq (%eax), %mm4 pfmul %mm4, %mm6 pfmul %mm4, %mm3 movq 24(%esp), %mm4 pfpnacc %mm3, %mm6 movq %mm0, %mm3 pfadd %mm4, %mm0 pfsub %mm4, %mm3 movq %mm0, 32(%esp) movq 48(%eax), %mm4 pswapd %mm3, %mm0 pfmul %mm4, %mm3 pfmul %mm4, %mm0 movq 16(%eax), %mm4 /* simd data load/store barrier */ movq %mm7, (%ecx,%edx,4) movq 32(%esp), %mm7 addl $56, %eax movq %mm6, (%ecx,%edx) movq %mm2, (%ecx,%ebp) movq 16(%esp), %mm2 pfpnacc %mm0, %mm3 movq %mm5, (%ecx,%edx,2) pswapd %mm7, %mm6 pfmul %mm4, %mm7 pfmul %mm4, %mm6 movq %mm2, (%ecx) movq %mm3, (%ecx,%edi) leal (%edx,%edx,2), %edi movq %mm1, (%ecx,%edi,2) pfpnacc %mm6, %mm7 movq %mm7, (%ecx,%edi) addl %ebx, %ecx decl %esi jnz .L0 femms movl 56(%esp), %ebx movl 52(%esp), %esi movl 48(%esp), %edi movl 44(%esp), %ebp addl $60, %esp ret .section .rodatanam: .string "f1k7i_8" .align 4twinstr: .byte 4 .byte 0 .value 8 .byte 3 .byte 1 .value 0 .align 4desc: .long 8 .long nam .long twinstr .zero 4 .double 33 .double 16 .double 0 .double 0 .long fftwf_kdft_ct_k7_pgenus .long 0 .long 0 .long 0.text .align 4.globl fftwf_codelet_f1k7i_8fftwf_codelet_f1k7i_8: subl $12,%esp movl 16(%esp),%eax addl $-4,%esp pushl $desc pushl $f1k7i_8 pushl %eax call fftwf_kdft_dif_register addl $16,%esp addl $12,%esp ret
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -