📄 t1k7_15.s
字号:
/* * Copyright (c) 2003, 2006 Matteo Frigo * Copyright (c) 2003, 2006 Massachusetts Institute of Technology * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA * *//* This file was automatically generated --- DO NOT EDIT *//* Generated on Fri Jan 27 20:12:12 EST 2006 */#include "config.h"/* cheap-mode: VECTGRADE_FULL succeeded. (207 steps) *//* Generated by: ../../../genfft-k7/gen_twiddle -no-randomized-cse -n 15 -name t1k7_15 *//* * Generator Id's : * $Id: algsimp.ml,v 1.4 2006-01-05 03:04:27 stevenj Exp $ * $Id: fft.ml,v 1.4 2006-01-05 03:04:27 stevenj Exp $ * $Id: gen_twiddle.ml,v 1.14 2005-12-24 21:08:49 athena Exp $ *//* The following asm code is Copyright (c) 2000-2001 Stefan Kral */.section .rodata .balign 64KP500000000KP500000000: .float +0.500000000000000000000000000000000000000000000, +0.500000000000000000000000000000000000000000000KP866025403KP866025403: .float +0.866025403784438646763723170752936183471402627, +0.866025403784438646763723170752936183471402627KN866025403KN866025403: .float -0.866025403784438646763723170752936183471402627, -0.866025403784438646763723170752936183471402627KP951056516KP587785252: .float +0.951056516295153572116439333379382143405698634, +0.587785252292473129168705954639072768597652438KP587785252KP951056516: .float +0.587785252292473129168705954639072768597652438, +0.951056516295153572116439333379382143405698634chs_lo: .long 0x80000000, 0x00000000KP250000000KP250000000: .float +0.250000000000000000000000000000000000000000000, +0.250000000000000000000000000000000000000000000KP559016994KP559016994: .float +0.559016994374947424102293417182819058860154590, +0.559016994374947424102293417182819058860154590.text.text .balign 64t1k7_15: subl $204, %esp femms movl %ebx, 200(%esp) movl 220(%esp), %edx movl 228(%esp), %ebx movl %esi, 196(%esp) movl %edi, 192(%esp) movl 208(%esp), %ecx movl %ebp, 188(%esp) movl 216(%esp), %eax movl 224(%esp), %esi leal (,%edx,4), %edx leal (,%ebx,4), %ebx .p2align 4,,7.L0: /* promise simd cell size = 8 */ leal (%edx,%edx,4), %edi movq 72(%eax), %mm0 movq 32(%eax), %mm3 leal (%edx,%edx,8), %ebp movq 64(%eax), %mm6 movq (%ecx,%edi,2), %mm1 movq (%ecx,%edi), %mm4 leal (%edx,%edx,2), %edi movq (%ecx,%ebp), %mm7 leal (%edi,%edx,8), %ebp pswapd %mm1, %mm2 pswapd %mm4, %mm5 pfmul %mm0, %mm1 pfmul %mm3, %mm4 pfmul %mm0, %mm2 pswapd %mm7, %mm0 pfmul %mm3, %mm5 movq 40(%eax), %mm3 pfmul %mm6, %mm7 pfacc %mm1, %mm4 movq (%ecx,%edi,2), %mm1 pfmul %mm6, %mm0 pfnacc %mm2, %mm5 movq %mm4, %mm2 pswapd %mm1, %mm6 pfmul %mm3, %mm1 pswapd %mm2, %mm2 pfacc %mm5, %mm4 pfmul %mm3, %mm6 movq 16(%eax), %mm3 pfnacc %mm2, %mm5 movq (%ecx,%edi), %mm2 pfacc %mm7, %mm1 movq %mm4, 16(%esp) pfmul KP500000000KP500000000, %mm4 pfnacc %mm0, %mm6 movq 88(%eax), %mm0 pswapd %mm2, %mm7 pfmul %mm3, %mm2 pfmul KP866025403KP866025403, %mm5 pfmul %mm3, %mm7 movq %mm6, 32(%esp) movq %mm4, 8(%esp) movq (%ecx,%edi,4), %mm3 movq 24(%eax), %mm4 pswapd %mm3, %mm6 pfmul %mm0, %mm3 movq %mm5, 0(%esp) movq (%ecx,%edx,4), %mm5 pfmul %mm0, %mm6 pfacc %mm3, %mm2 movq 80(%eax), %mm3 pswapd %mm5, %mm0 pfmul %mm4, %mm5 pfnacc %mm6, %mm7 movq (%ecx,%ebp), %mm6 leal (%edi,%edx,4), %ebp pfmul %mm4, %mm0 movq %mm2, 40(%esp) movq %mm7, 24(%esp) movq 104(%eax), %mm2 movq (%ecx,%ebp,2), %mm7 pswapd %mm6, %mm4 pfmul %mm3, %mm6 pfmul %mm3, %mm4 pswapd %mm7, %mm3 pfmul %mm2, %mm7 pfmul %mm2, %mm3 movq (%eax), %mm2 pfacc %mm5, %mm7 movq (%ecx,%edx), %mm5 pfnacc %mm0, %mm3 pswapd %mm5, %mm0 pfmul %mm2, %mm5 pfmul %mm2, %mm0 movq %mm3, 56(%esp) movq 48(%eax), %mm3 pfacc %mm5, %mm6 movq (%ecx,%ebp), %mm5 leal (%edx,%edi,4), %ebp leal (%edx,%edx,8), %edi pfnacc %mm0, %mm4 movq %mm6, %mm2 pfnacc %mm7, %mm6 pswapd %mm5, %mm0 pfmul %mm3, %mm5 pfacc %mm7, %mm2 movq %mm4, 64(%esp) movq (%ecx,%edx,8), %mm7 movq 56(%eax), %mm4 pfmul %mm3, %mm0 pfmul KN866025403KN866025403, %mm6 pswapd %mm7, %mm3 movq %mm2, 72(%esp) movq 8(%eax), %mm2 pfmul %mm4, %mm7 pfmul %mm4, %mm3 movq %mm6, 48(%esp) movq (%ecx,%edx,2), %mm4 pswapd %mm4, %mm6 pfmul %mm2, %mm4 pfmul %mm2, %mm6 movq 96(%eax), %mm2 addl $112, %eax pfacc %mm5, %mm4 movq (%ecx,%ebp), %mm5 leal (%edx,%edx,2), %ebp pfnacc %mm0, %mm6 pswapd %mm5, %mm0 pfmul %mm2, %mm5 pfmul %mm2, %mm0 movq 72(%esp), %mm2 pfacc %mm5, %mm7 movq %mm1, %mm5 pfnacc %mm0, %mm3 pfadd %mm2, %mm1 pfmul KP500000000KP500000000, %mm2 movq %mm7, %mm0 pfnacc %mm4, %mm7 pfacc %mm4, %mm0 movq 40(%esp), %mm4 pfmul KN866025403KN866025403, %mm7 pfsub %mm2, %mm5 movq %mm4, %mm2 pfadd %mm0, %mm4 pfmul KP500000000KP500000000, %mm0 pfsub %mm0, %mm2 movq %mm1, %mm0 pfnacc %mm4, %mm1 pfacc %mm0, %mm4 movq %mm3, %mm0 pfnacc %mm6, %mm3 pfacc %mm6, %mm0 movq %mm2, %mm6 movq %mm4, 112(%esp) movq 64(%esp), %mm4 pfmul KP866025403KP866025403, %mm3 pfsub %mm3, %mm2 pfadd %mm3, %mm6 movq %mm2, 88(%esp) movq 56(%esp), %mm3 movq %mm4, %mm2 pfnacc %mm3, %mm4 movq %mm6, 80(%esp) pfacc %mm3, %mm2 movq %mm5, %mm3 pfmul KP866025403KP866025403, %mm4 movq %mm2, %mm6 pfmul KP500000000KP500000000, %mm6 pfadd %mm4, %mm3 pfsub %mm4, %mm5 movq %mm3, 96(%esp) movq %mm5, 104(%esp) movq 32(%esp), %mm4 movq %mm4, %mm3 movq %mm0, %mm5 pfsub %mm6, %mm4 pfadd %mm2, %mm3 pfmul KP500000000KP500000000, %mm5 movq 24(%esp), %mm2 movq %mm2, %mm6 pfadd %mm0, %mm6 movq %mm3, %mm0 pfsub %mm5, %mm2 pfnacc %mm6, %mm3 movq %mm2, %mm5 pfsub %mm7, %mm2 pfacc %mm0, %mm6 movq %mm1, %mm0 pfmul KP951056516KP587785252, %mm1 pfadd %mm7, %mm5 pswapd %mm3, %mm7 pfmul KP587785252KP951056516, %mm0 movq %mm2, 136(%esp) movq 48(%esp), %mm2 pfmul KP587785252KP951056516, %mm7 movq %mm5, 128(%esp) movq %mm4, %mm5 pfmul KP587785252KP951056516, %mm3 pfadd %mm2, %mm4 pfsub %mm2, %mm5 movq 112(%esp), %mm2 pfnacc %mm1, %mm7 movq %mm4, 120(%esp) movq (%ecx), %mm4 pfacc %mm0, %mm3 movq %mm2, %mm1 pfacc %mm6, %mm2 /* simd data load/store barrier */ pfnacc %mm6, %mm1 movq %mm4, %mm0 pfsub 8(%esp), %mm4 pxor chs_lo, %mm3 movq %mm2, %mm6 pfadd 16(%esp), %mm0 pfmul KP250000000KP250000000, %mm6 pfmul KP559016994KP559016994, %mm1 movq %mm4, 144(%esp) movq %mm0, %mm4 pfsub %mm6, %mm0 pfadd %mm2, %mm4 movq %mm0, %mm6 pfsub %mm1, %mm0 movq %mm4, (%ecx) pfadd %mm1, %mm6 movq 104(%esp), %mm1 movq %mm0, %mm4 pfadd %mm7, %mm0 movq %mm6, %mm2 pfadd %mm3, %mm6 pfsub %mm7, %mm4 movq %mm1, %mm7 pfsub %mm3, %mm2 movq 88(%esp), %mm3 movq %mm0, (%ecx,%ebp,4) movq %mm5, %mm0 movq %mm6, (%ecx,%edi) movq 136(%esp), %mm6 leal (%edx,%edx,4), %edi movq %mm4, (%ecx,%ebp) pfnacc %mm3, %mm1 movq %mm2, (%ecx,%ebp,2) leal (%edi,%edx,2), %ebp pfacc %mm7, %mm3 movq 80(%esp), %mm7 pfnacc %mm6, %mm5 pfacc %mm0, %mm6 movq 96(%esp), %mm0 movq %mm1, %mm2 pfmul KP951056516KP587785252, %mm1 pswapd %mm5, %mm4 pfmul KP587785252KP951056516, %mm2 pfmul KP587785252KP951056516, %mm5 pfmul KP587785252KP951056516, %mm4 pfacc %mm2, %mm5 movq %mm7, %mm2 pfnacc %mm1, %mm4 pfacc %mm0, %mm7 pfnacc %mm0, %mm2 movq 128(%esp), %mm0 pxor chs_lo, %mm5 movq %mm4, 152(%esp) movq 120(%esp), %mm4 pswapd %mm2, %mm1 pfmul KP951056516KP587785252, %mm2 movq %mm5, 160(%esp) movq %mm0, %mm5 pfnacc %mm4, %mm0 pfmul KP951056516KP587785252, %mm1 pfacc %mm4, %mm5 movq %mm0, %mm4 pfmul KP951056516KP587785252, %mm0 pfmul KP587785252KP951056516, %mm4 pfacc %mm2, %mm0 movq 144(%esp), %mm2 pfnacc %mm1, %mm4 movq 0(%esp), %mm1 pxor chs_lo, %mm0 movq %mm0, 168(%esp) movq %mm2, %mm0 pfsub %mm1, %mm2 pfadd %mm1, %mm0 movq %mm3, %mm1 pfnacc %mm6, %mm3 pfacc %mm6, %mm1 movq %mm7, %mm6 pfacc %mm5, %mm7 pfnacc %mm5, %mm6 pfmul KP559016994KP559016994, %mm3 movq %mm1, %mm5 pfmul KP250000000KP250000000, %mm5 pfmul KP559016994KP559016994, %mm6 movq %mm3, 176(%esp) movq %mm2, %mm3 pfadd %mm1, %mm2 movq %mm0, %mm1 pfadd %mm7, %mm0 pfmul KP250000000KP250000000, %mm7 pfsub %mm5, %mm3 movq %mm6, %mm5 movq %mm2, (%ecx,%edi) movq %mm0, (%ecx,%edi,2) movq 168(%esp), %mm0 pfsub %mm7, %mm1 pfsubr %mm1, %mm6 pfadd %mm1, %mm5 movq 176(%esp), %mm1 movq %mm6, %mm2 pfsub %mm4, %mm6 movq %mm5, %mm7 pfsub %mm0, %mm5 pfadd %mm4, %mm2 movq %mm3, %mm4 pfsub %mm1, %mm3 pfadd %mm1, %mm4 movq 160(%esp), %mm1 movq %mm5, (%ecx,%edx) movq 152(%esp), %mm5 pfadd %mm0, %mm7 movq %mm2, (%ecx,%ebp) leal (%edi,%edx,8), %ebp movq %mm3, %mm2 movq %mm4, %mm0 movq %mm6, (%ecx,%ebp) pfsub %mm1, %mm4 leal (%edi,%edx,2), %ebp pfadd %mm5, %mm2 movq %mm7, (%ecx,%edx,4) pfsub %mm5, %mm3 pfadd %mm1, %mm0 leal (%ebp,%edx,4), %edi movq %mm4, (%ecx,%edi) movq %mm2, (%ecx,%edx,2) movq %mm3, (%ecx,%edx,8) movq %mm0, (%ecx,%ebp,2) addl %ebx, %ecx decl %esi jnz .L0 femms movl 200(%esp), %ebx movl 196(%esp), %esi movl 192(%esp), %edi movl 188(%esp), %ebp addl $204, %esp ret .section .rodatanam: .string "t1k7_15" .align 4twinstr: .byte 4 .byte 0 .value 15 .byte 3 .byte 1 .value 0 .align 4desc: .long 15 .long nam .long twinstr .long fftwf_kdft_ct_k7_mgenus .double 92 .double 56 .double 0 .double 0 .long 0 .long 0 .long 0.text .align 4.globl fftwf_codelet_t1k7_15fftwf_codelet_t1k7_15: subl $12,%esp movl 16(%esp),%eax addl $-4,%esp pushl $desc pushl $t1k7_15 pushl %eax call fftwf_kdft_dit_register addl $16,%esp addl $12,%esp ret
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -