⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 t1k7_16.s

📁 fftw-3.0.1
💻 S
字号:
/*
 * Copyright (c) 2003 Matteo Frigo
 * Copyright (c) 2003 Massachusetts Institute of Technology
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 *
 */

/* This file was automatically generated --- DO NOT EDIT */
/* Generated on Sat Jul  5 21:52:01 EDT 2003 */

#include "config.h"

/* cheap-mode: VECTGRADE_FULL succeeded. (192 steps) */
/* Generated by: /homee/stevenj/cvs/fftw3.0.1/genfft-k7/gen_twiddle -no-randomized-cse -n 16 -name t1k7_16 */

/*
 * Generator Id's : 
 * $Id: algsimp.ml,v 1.3 2003/03/15 20:29:42 stevenj Exp $
 * $Id: fft.ml,v 1.3 2003/03/15 20:29:43 stevenj Exp $
 * $Id: gen_twiddle.ml,v 1.13 2003/04/18 01:21:45 athena Exp $
 */

/* The following asm code is Copyright (c) 2000-2001 Stefan Kral */

/*
 * Syntax: GNU as, AT&T operand order (source, destination), 32-bit x86.
 * The file is run through the C preprocessor (see the #include above), so
 * only C-style comments are used.
 */

/*
 * Packed single-precision constant pairs, used as memory operands of pfmul
 * in the loop below.  Each label names the two floats it holds, low element
 * first.
 */
.section .rodata
	.balign 64
KP707106781KP707106781: .float +0.707106781186547524400844362104849039284835938, +0.707106781186547524400844362104849039284835938
KP923879532KP382683432: .float +0.923879532511286756128183189396788286822416626, +0.382683432365089771728459984030398866761344562
KP382683432KP923879532: .float +0.382683432365089771728459984030398866761344562, +0.923879532511286756128183189396788286822416626

/*
 * t1k7_16
 *
 * File-local routine (no .globl); its address is handed to
 * fftwf_kdft_dit_register by fftwf_codelet_t1k7_16 at the end of this file.
 * It works in the MMX registers with 3DNow! instructions (femms, pfmul,
 * pfadd, pfsub, pfacc, pfnacc, pfpnacc, pswapd).
 *
 * Stack arguments, as read after the 180-byte frame has been reserved
 * (the first argument sits at 184(%esp) = 180 + 4-byte return address):
 *   184(%esp) -> %ecx  data base pointer.  Each iteration loads the 16
 *                      quadwords at (%ecx + k*%edx), k = 0..15, and stores
 *                      16 quadwords back to the same addresses.
 *   188(%esp)          never read by this routine.
 *   192(%esp) -> %eax  table pointer.  Each iteration reads the 15 quadwords
 *                      at 0..112(%eax) and then advances %eax by 120 bytes.
 *   196(%esp) -> %edx  multiplied by 4 on entry; byte step between the 16
 *                      data quadwords.
 *   200(%esp) -> %esi  iteration count, decremented once per pass.
 *   204(%esp) -> %ebx  multiplied by 4 on entry; added to %ecx after every
 *                      pass.
 * NOTE(review): presumably these are (ri, ii, W, iostride, m, dist) of an
 * FFTW twiddle codelet with strides counted in floats -- confirm against the
 * prototype expected by fftwf_kdft_dit_register.
 *
 * Frame layout:
 *   0..159(%esp)    quadword scratch slots for spilled %mm registers
 *   164..176(%esp)  saved %ebp, %edi, %esi, %ebx (restored before ret)
 *
 * The loop condition is evaluated only after the body (decl/jnz), so the
 * body always executes at least once; a count of 0 is not special-cased.
 * %eax, %ecx, %edx and %mm0-%mm7 are overwritten; femms is executed on
 * entry and again before returning.
 */
.text
	.balign 64
t1k7_16:
	subl $180, %esp
	femms 
	movl %ebx, 176(%esp)
	movl 196(%esp), %edx
	movl 204(%esp), %ebx
	movl 184(%esp), %ecx
	movl %esi, 172(%esp)
	movl 192(%esp), %eax
	movl %edi, 168(%esp)
	movl 200(%esp), %esi
	movl %ebp, 164(%esp)
	leal (,%edx,4), %edx
	leal (,%ebx,4), %ebx
	.p2align 4,,7
.L0:
	/* promise simd cell size = 8 */ 
	/* %edi and %ebp are recomputed throughout as small multiples of %edx
	   to address the individual data quadwords. */
	movq (%ecx,%edx), %mm1
	leal (%edx,%edx,8), %edi
	leal (%edx,%edx,2), %ebp
	movq (%eax), %mm0
	movq 64(%eax), %mm3
	movq (%ecx,%edi), %mm4
	movq 16(%eax), %mm6
	movq (%ecx,%ebp), %mm7
	leal (%ebp,%edx,8), %edi
	leal (%edx,%edx,4), %ebp
	pswapd %mm1, %mm2
	pfmul %mm0, %mm1
	pfmul %mm0, %mm2
	pswapd %mm4, %mm5
	pswapd %mm7, %mm0
	pfmul %mm3, %mm4
	pfmul %mm6, %mm7
	pfmul %mm3, %mm5
	movq 80(%eax), %mm3
	pfmul %mm6, %mm0
	movq (%ecx,%edi), %mm6
	leal (%ebp,%edx,8), %edi
	pfacc %mm4, %mm1
	pfnacc %mm5, %mm2
	movq 32(%eax), %mm5
	movq %mm6, %mm4
	pfmul %mm3, %mm6
	pswapd %mm4, %mm4
	pfacc %mm6, %mm7
	pfmul %mm3, %mm4
	movq (%ecx,%ebp), %mm3
	leal (%edi,%edx,2), %ebp
	movq %mm7, 8(%esp)
	movq (%ecx,%edi), %mm7
	pfnacc %mm4, %mm0
	pswapd %mm3, %mm6
	movq 96(%eax), %mm4
	pfmul %mm5, %mm3
	leal (%edx,%edx,2), %edi
	pfmul %mm5, %mm6
	pswapd %mm7, %mm5
	movq %mm0, 0(%esp)
	movq 112(%eax), %mm0
	pfmul %mm4, %mm7
	pfmul %mm4, %mm5
	movq (%ecx,%ebp), %mm4
	leal (%edx,%edi,2), %ebp
	pfacc %mm7, %mm3
	pswapd %mm4, %mm7
	pfnacc %mm5, %mm6
	movq 48(%eax), %mm5
	pfmul %mm0, %mm4
	pfmul %mm0, %mm7
	movq %mm6, 16(%esp)
	movq (%ecx,%ebp), %mm0
	pswapd %mm0, %mm6
	pfmul %mm5, %mm0
	pfmul %mm5, %mm6
	movq %mm2, %mm5
	pfnacc %mm3, %mm2
	pfacc %mm0, %mm4
	movq %mm1, %mm0
	pfnacc %mm6, %mm7
	movq %mm2, 32(%esp)
	movq 16(%esp), %mm6
	movq 0(%esp), %mm2
	pfacc %mm3, %mm0
	movq %mm4, %mm3
	pfacc %mm6, %mm5
	pfnacc %mm6, %mm1
	movq 8(%esp), %mm6
	pfnacc %mm2, %mm4
	movq %mm5, 24(%esp)
	movq %mm7, %mm5
	pfacc %mm2, %mm7
	pfacc %mm6, %mm3
	movq %mm0, %mm2
	pfnacc %mm6, %mm5
	movq 32(%esp), %mm6
	pfacc %mm3, %mm0
	pfnacc %mm7, %mm3
	movq %mm3, 40(%esp)
	movq %mm1, %mm3
	pfpnacc %mm6, %mm1
	pfpnacc %mm3, %mm6
	movq %mm1, 64(%esp)
	movq 24(%esp), %mm3
	movq %mm4, %mm1
	pfpnacc %mm5, %mm4
	pfnacc %mm3, %mm2
	movq %mm6, 56(%esp)
	movq 56(%eax), %mm6
	pfacc %mm7, %mm3
	movq (%ecx,%edx,8), %mm7
	pfpnacc %mm1, %mm5
	movq %mm4, 72(%esp)
	movq %mm2, 104(%esp)
	movq 24(%eax), %mm2
	pswapd %mm7, %mm1
	movq %mm3, 112(%esp)
	pfmul %mm6, %mm7
	movq %mm5, 48(%esp)
	movq (%ecx,%edx,4), %mm3
	movq (%ecx,%edi,4), %mm5
	pfmul %mm6, %mm1
	movq 88(%eax), %mm6
	leal (%edx,%edx,4), %edi
	pswapd %mm3, %mm4
	pfmul %mm2, %mm3
	pfpnacc %mm7, %mm1
	pswapd %mm5, %mm7
	pfmul %mm6, %mm5
	pfmul %mm2, %mm4
	movq 8(%eax), %mm2
	pfmul %mm6, %mm7
	movq %mm1, 80(%esp)
	movq (%ecx,%edx,2), %mm6
	pfacc %mm5, %mm3
	movq 72(%eax), %mm5
	pfnacc %mm7, %mm4
	pswapd %mm6, %mm1
	pfmul %mm2, %mm6
	pfmul %mm2, %mm1
	movq (%ecx,%edi,2), %mm2
	leal (%edx,%edx,4), %edi
	pswapd %mm4, %mm7
	pfnacc %mm3, %mm7
	pfacc %mm4, %mm3
	pswapd %mm2, %mm4
	pfmul %mm5, %mm2
	pfmul %mm5, %mm4
	movq %mm7, 88(%esp)
	movq %mm3, 96(%esp)
	movq 104(%eax), %mm7
	movq (%ecx,%ebp,2), %mm3
	leal (%edx,%edx,2), %ebp
	pfacc %mm2, %mm6
	movq 40(%eax), %mm2
	/* Last read through %eax in this pass: step past the 15 quadwords
	   (0..112) consumed above. */
	addl $120, %eax
	pfnacc %mm4, %mm1
	movq (%ecx,%ebp,2), %mm4
	leal (%edx,%edx,2), %ebp
	pswapd %mm3, %mm5
	pfmul %mm7, %mm3
	pfmul %mm7, %mm5
	pswapd %mm4, %mm7
	pfmul %mm2, %mm4
	pfmul %mm2, %mm7
	movq %mm1, %mm2
	pfnacc %mm6, %mm1
	pfacc %mm4, %mm3
	movq 112(%esp), %mm4
	pfnacc %mm7, %mm5
	movq %mm0, %mm7
	pswapd %mm7, %mm7
	pfacc %mm3, %mm6
	pfnacc %mm5, %mm3
	pfacc %mm5, %mm2
	movq %mm1, %mm5
	pfacc %mm4, %mm0
	pfnacc %mm7, %mm4
	movq 104(%esp), %mm7
	pfpnacc %mm3, %mm1
	pfpnacc %mm5, %mm3
	movq %mm1, 128(%esp)
	movq 40(%esp), %mm5
	movq %mm5, %mm1
	movq %mm3, 120(%esp)
	pswapd %mm6, %mm3
	pfacc %mm2, %mm6
	pfpnacc %mm7, %mm1
	pswapd %mm7, %mm7
	pfnacc %mm3, %mm2
	movq 80(%esp), %mm3
	pfpnacc %mm5, %mm7
	pswapd %mm3, %mm3
	movq %mm7, %mm5
	pfnacc %mm1, %mm7
	pfacc %mm5, %mm1
	movq (%ecx), %mm5
	/* simd data load/store barrier */ 
	/* From here on the data quadwords are only written, not read. */
	pfmul KP707106781KP707106781, %mm7
	pfmul KP707106781KP707106781, %mm1
	movq %mm7, 136(%esp)
	movq %mm5, %mm7
	pfsub %mm3, %mm5
	pfadd %mm3, %mm7
	movq %mm5, 144(%esp)
	movq 96(%esp), %mm3
	movq %mm7, %mm5
	pfadd %mm3, %mm7
	pfsub %mm3, %mm5
	movq %mm7, %mm3
	pfsub %mm6, %mm7
	pfadd %mm6, %mm3
	movq %mm5, %mm6
	pfsub %mm2, %mm5
	pfadd %mm2, %mm6
	movq %mm3, %mm2
	pfadd %mm0, %mm3
	pfsub %mm0, %mm2
	movq %mm6, %mm0
	pfadd %mm1, %mm6
	movq %mm3, (%ecx)
	movq %mm7, %mm3
	pfsub %mm1, %mm0
	pfsub %mm4, %mm7
	movq 136(%esp), %mm1
	pfadd %mm4, %mm3
	movq 72(%esp), %mm4
	movq %mm2, (%ecx,%edx,8)
	movq %mm6, (%ecx,%edx,2)
	movq 64(%esp), %mm6
	movq %mm5, %mm2
	movq %mm0, (%ecx,%edi,2)
	leal (%ebp,%edx,4), %edi
	pfsub %mm1, %mm5
	movq %mm7, (%ecx,%ebp,4)
	movq 56(%esp), %mm7
	movq %mm3, (%ecx,%edx,4)
	movq 48(%esp), %mm3
	pfadd %mm1, %mm2
	movq %mm4, %mm1
	pswapd %mm6, %mm6
	pfmul KP923879532KP382683432, %mm4
	movq %mm6, %mm0
	pfmul KP382683432KP923879532, %mm1
	pfmul KP923879532KP382683432, %mm6
	movq %mm5, (%ecx,%edi,2)
	pswapd %mm3, %mm3
	movq %mm7, %mm5
	pfmul KP382683432KP923879532, %mm0
	movq %mm2, (%ecx,%ebp,2)
	leal (%edi,%edx,8), %ebp
	movq %mm3, %mm2
	pfmul KP923879532KP382683432, %mm7
	pfmul KP382683432KP923879532, %mm5
	pfmul KP382683432KP923879532, %mm3
	pfmul KP923879532KP382683432, %mm2
	pfpnacc %mm6, %mm1
	movq 120(%esp), %mm6
	pfpnacc %mm4, %mm0
	movq 128(%esp), %mm4
	pfpnacc %mm3, %mm7
	movq 144(%esp), %mm3
	pfpnacc %mm5, %mm2
	movq %mm6, %mm5
	pfacc %mm4, %mm6
	pfnacc %mm5, %mm4
	movq %mm2, 152(%esp)
	movq 88(%esp), %mm5
	movq %mm3, %mm2
	pfmul KP707106781KP707106781, %mm6
	pfmul KP707106781KP707106781, %mm4
	pfadd %mm5, %mm2
	pfsub %mm5, %mm3
	movq %mm2, %mm5
	pfsub %mm4, %mm2
	pfadd %mm4, %mm5
	movq %mm3, %mm4
	pfsub %mm6, %mm3
	pfadd %mm6, %mm4
	movq %mm0, %mm6
	pfnacc %mm1, %mm0
	pfacc %mm6, %mm1
	movq %mm2, %mm6
	pfsub %mm0, %mm6
	pfadd %mm0, %mm2
	movq %mm5, %mm0
	pfadd %mm1, %mm5
	pfsub %mm1, %mm0
	movq 152(%esp), %mm1
	movq %mm6, (%ecx,%ebp)
	movq %mm7, %mm6
	leal (%edi,%edx,4), %ebp
	movq %mm2, (%ecx,%edi)
	movq %mm3, %mm2
	leal (%edx,%edx,2), %edi
	pfnacc %mm1, %mm7
	movq %mm0, (%ecx,%ebp)
	movq %mm4, %mm0
	pfacc %mm6, %mm1
	leal (%edx,%edi,4), %ebp
	movq %mm5, (%ecx,%edi)
	leal (%edx,%edx,4), %edi
	pfsub %mm7, %mm2
	pfadd %mm7, %mm3
	pfsub %mm1, %mm0
	pfadd %mm1, %mm4
	movq %mm2, (%ecx,%ebp)
	leal (%edx,%edx,8), %ebp
	movq %mm3, (%ecx,%edi)
	movq %mm0, (%ecx,%ebp)
	movq %mm4, (%ecx,%edx)
	addl %ebx, %ecx		/* move the data pointer on by the scaled 6th argument */
	decl %esi
	jnz .L0
	femms 
	movl 176(%esp), %ebx
	movl 172(%esp), %esi
	movl 168(%esp), %edi
	movl 164(%esp), %ebp
	addl $180, %esp
	ret 

/*
 * Read-only descriptor data passed to fftwf_kdft_dit_register below.
 * nam is the NUL-terminated name string; desc references nam, twinstr and
 * the external symbol fftwf_kdft_ct_k7_mgenus.
 * NOTE(review): the field-by-field meaning of twinstr and desc is defined by
 * FFTW's C headers, which are not visible here -- consult them before
 * changing any value.
 */
.section .rodata
nam:
	.string "t1k7_16"
	.align 4
twinstr:
	.byte 4
	.byte 0
	.value 16
	.byte 3
	.byte 1
	.value 0
	.align 4
desc:
	.long 16
	.long nam
	.long twinstr
	.zero 4
	.double 87
	.double 42
	.double 0
	.double 0
	.long fftwf_kdft_ct_k7_mgenus
	.long 0
	.long 0
	.long 0

/*
 * fftwf_codelet_t1k7_16 (exported)
 *
 * Takes one stack argument and forwards it:
 *   fftwf_kdft_dit_register(<arg>, t1k7_16, desc)
 * Arguments are pushed right to left; the caller-side cleanup removes the
 * three pushed words plus the 4 bytes reserved by `addl $-4`.
 * NOTE(review): the 12- and 4-byte adjustments look like padding that keeps
 * the stack 16-byte aligned at the call -- confirm before altering them.
 * Whatever fftwf_kdft_dit_register leaves in %eax is returned unchanged.
 */
.text
	.align 4
.globl fftwf_codelet_t1k7_16
fftwf_codelet_t1k7_16:
	subl $12,%esp
	movl 16(%esp),%eax	/* first argument: 12-byte frame + return address */
	addl $-4,%esp
	pushl $desc
	pushl $t1k7_16
	pushl %eax
	call fftwf_kdft_dit_register
	addl $16,%esp
	addl $12,%esp
	ret

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -