⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 t1k7_64.s

📁 fftw-3.0.1
💻 S
📖 第 1 页 / 共 3 页
字号:
/* * Copyright (c) 2003 Matteo Frigo * Copyright (c) 2003 Massachusetts Institute of Technology * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA * *//* This file was automatically generated --- DO NOT EDIT *//* Generated on Sat Jul  5 21:52:11 EDT 2003 */#include "config.h"/* cheap-mode: VECTGRADE_FULL succeeded. (1024 steps) *//* Generated by: /homee/stevenj/cvs/fftw3.0.1/genfft-k7/gen_twiddle -no-randomized-cse -n 64 -name t1k7_64 *//* * Generator Id's :  * $Id: algsimp.ml,v 1.3 2003/03/15 20:29:42 stevenj Exp $ * $Id: fft.ml,v 1.3 2003/03/15 20:29:43 stevenj Exp $ * $Id: gen_twiddle.ml,v 1.13 2003/04/18 01:21:45 athena Exp $ *//* CHImovopt_applicable: new! *//* CHImovopt_applicable: new! *//* CHImovopt_applicable: new! *//* CHImovopt_applicable: new! *//* CHImovopt_applicable: new! *//* CHImovopt_applicable: new! 
*//* The following asm code is Copyright (c) 2000-2001 Stefan Kral */

/*
 * Read-only constant table.
 *
 * Each label names a pair of single-precision values (8 bytes), laid out
 * so that the label can be used directly as a 64-bit memory operand of a
 * packed 3DNow! instruction (e.g. "pfmul KP707106781KP707106781, %mm3"
 * later in this file).  The label spells the leading digits of the two
 * values in storage order.  The table starts on a 64-byte boundary.
 *
 * The trig identities given below are numerical observations about the
 * literals (they match cos/sin of odd multiples of pi/32, pi/16, pi/8 and
 * pi/4); the literals themselves are authoritative.
 */
.section .rodata
	.balign 64
/* { cos(pi/4), cos(pi/4) } */
KP707106781KP707106781: .float +0.707106781186547524400844362104849039284835938, +0.707106781186547524400844362104849039284835938
/* { cos(pi/8), sin(pi/8) } */
KP923879532KP382683432: .float +0.923879532511286756128183189396788286822416626, +0.382683432365089771728459984030398866761344562
/* { sin(pi/8), cos(pi/8) } */
KP382683432KP923879532: .float +0.382683432365089771728459984030398866761344562, +0.923879532511286756128183189396788286822416626
/* { sin(3pi/16), cos(3pi/16) } */
KP555570233KP831469612: .float +0.555570233019602224742830813948532874374937191, +0.831469612302545237078788377617905756738560812
/* { sin(pi/16), cos(pi/16) } */
KP195090322KP980785280: .float +0.195090322016128267848284868477022240927691618, +0.980785280403230449126182236134239036973933731
/* { cos(3pi/16), sin(3pi/16) } */
KP831469612KP555570233: .float +0.831469612302545237078788377617905756738560812, +0.555570233019602224742830813948532874374937191
/* { cos(pi/16), sin(pi/16) } */
KP980785280KP195090322: .float +0.980785280403230449126182236134239036973933731, +0.195090322016128267848284868477022240927691618
/* { cos(pi/32), sin(pi/32) } */
KP995184726KP098017140: .float +0.995184726672196886244836953109479921575474869, +0.098017140329560601994195563888641845861136673
/* { sin(7pi/32), cos(7pi/32) } */
KP634393284KP773010453: .float +0.634393284163645498215171613225493370675687095, +0.773010453362736960810906609758469800971041293
/* { cos(5pi/32), sin(5pi/32) } */
KP881921264KP471396736: .float +0.881921264348355029712756863660388349508442621, +0.471396736825997648556387625905254377657460319
/* { sin(3pi/32), cos(3pi/32) } */
KP290284677KP956940335: .float +0.290284677254462367636192375817395274691476278, +0.956940335732208864935797886980269969482849206
/* { cos(3pi/32), sin(3pi/32) } */
KP956940335KP290284677: .float +0.956940335732208864935797886980269969482849206, +0.290284677254462367636192375817395274691476278
/* { sin(5pi/32), cos(5pi/32) } */
KP471396736KP881921264: .float +0.471396736825997648556387625905254377657460319, +0.881921264348355029712756863660388349508442621
/* { sin(pi/32), cos(pi/32) } */
KP098017140KP995184726: .float +0.098017140329560601994195563888641845861136673, +0.995184726672196886244836953109479921575474869
/* { cos(7pi/32), sin(7pi/32) } */
KP773010453KP634393284: .float +0.773010453362736960810906609758469800971041293, +0.634393284163645498215171613225493370675687095
.text
.text
	.balign 64
/*
 * t1k7_64 -- machine-generated routine (see the generator comment at the
 * top of the file: gen_twiddle -n 64 -name t1k7_64).  32-bit x86, AT&T
 * syntax, using 3DNow! packed single-precision instructions on the MMX
 * registers (pswapd, pfmul, pfadd, pfsub, pfacc, pfnacc, pfpnacc).
 *
 * Only the opening of the routine is reproduced in this span; the
 * instruction stream continues on the following lines, and the loop
 * back-edge, epilogue and return are not visible from here.
 *
 * Prologue, as written below:
 *   - reserves a 1476-byte frame; the low part of it is used as 8-byte
 *     spill slots (0(%esp), 8(%esp), ...);
 *   - stores %ebx, %esi, %edi, %ebp at 1472/1468/1464/1460(%esp);
 *   - %ecx = dword at 1480(%esp), %eax = dword at 1488(%esp),
 *     %edx = 4 * dword at 1492(%esp), %ebx = %ecx + 32 * %edx;
 *   - the dword at 1500(%esp) is multiplied by 4 in place.
 * NOTE(review): with the return address at 1476(%esp) these would be stack
 * arguments 1, 3, 4 and 6 of a cdecl call -- presumably two data pointers'
 * base, a twiddle-table pointer, a stride and a distance; confirm against
 * the C prototype, which is not part of this file excerpt.
 */
t1k7_64:
	subl $1476, %esp
	/* femms: 3DNow! fast clear of the MMX state before using %mm0-%mm7 */
	femms
	movl 1492(%esp), %edx
	movl 1480(%esp), %ecx
	movl %ebx, 1472(%esp)
	movl 1488(%esp), %eax
	movl %esi, 1468(%esp)
	movl %edi, 1464(%esp)
	/* %edx *= 4 (no base register, index scaled by 4) */
	leal (,%edx,4), %edx
	movl %ebp, 1460(%esp)
	/* %ebx = %ecx + 32 * %edx */
	movl %edx, %ebx
	sall $5, %ebx
	addl %ecx, %ebx
	sall $2, 1500(%esp)
	/* align the label below to 16 bytes, but only if that costs at most 7 bytes of padding */
	.p2align 4,,7
/*
 * From here on the code loads 8-byte values from %ecx and %ebx plus
 * multiples of %edx (the multiples are built with leal into %esi, %edi and
 * %ebp), multiplies them by 8-byte operands read at fixed offsets from
 * %eax, combines the products with pfacc/pfnacc/pfpnacc, and spills
 * intermediate results to the stack frame.  The instruction order is the
 * generator's schedule and must not be rearranged.
 */
.L0:
	/* promise simd cell size = 8 */
	movq (%ebx), %mm1
	movq 248(%eax), %mm0
	leal (%edx,%edx,2), %esi
	movq 496(%eax), %mm3
	movq 240(%eax), %mm6
	leal (%esi,%esi,4), %edi
	leal (%edx,%edx,2), %esi
	pswapd %mm1, %mm2
	pfmul %mm0, %mm1
	leal (%edx,%edi,2), %ebp
	leal (%esi,%esi,8), %edi
	pfmul %mm0, %mm2
	movq (%ebx,%ebp), %mm4
	movq (%ecx,%ebp), %mm7
	leal (%esi,%edx,8), %ebp
	leal (%ebp,%edx,4), %esi
	pfpnacc %mm1, %mm2
	movq (%ecx), %mm1
	pswapd %mm4, %mm5
	pswapd %mm7, %mm0
	pfmul %mm3, %mm4
	pfmul %mm3, %mm5
	pfmul %mm6, %mm0
	movq %mm1, %mm3
	pswapd %mm2, %mm2
	pfmul %mm6, %mm7
	movq 336(%eax), %mm6
	pfsub %mm2, %mm1
	pfadd %mm2, %mm3
	movq (%ebx,%ebp), %mm2
	pfnacc %mm0, %mm5
	pfacc %mm7, %mm4
	movq %mm1, 0(%esp)
	movq 464(%eax), %mm7
	movq (%ebx,%edi), %mm1
	pswapd %mm2, %mm0
	pfmul %mm6, %mm2
	movq %mm3, 8(%esp)
	movq %mm5, 16(%esp)
	movq 208(%eax), %mm5
	pfmul %mm6, %mm0
	movq (%ecx,%edi), %mm6
	leal (%edx,%edx,2), %edi
	pswapd %mm1, %mm3
	pfmul %mm7, %mm1
	pfmul %mm7, %mm3
	pswapd %mm6, %mm7
	pfmul %mm5, %mm6
	pfmul %mm5, %mm7
	movq 80(%eax), %mm5
	pfacc %mm6, %mm1
	movq (%ecx,%ebp), %mm6
	leal (%edx,%edi,2), %ebp
	leal (%esi,%edx,8), %edi
	pfnacc %mm7, %mm3
	pswapd %mm6, %mm7
	pfmul %mm5, %mm6
	movq %mm1, 32(%esp)
	pfmul %mm5, %mm7
	movq %mm3, 48(%esp)
	movq (%ecx,%esi), %mm5
	movq 112(%eax), %mm3
	pfacc %mm2, %mm6
	pswapd %mm5, %mm2
	pfnacc %mm0, %mm7
	movq 368(%eax), %mm0
	pfmul %mm3, %mm5
	pfmul %mm3, %mm2
	movq (%ebx,%esi), %mm3
	pfacc %mm6, %mm1
	movq %mm6, 24(%esp)
	leal (%edx,%edx,2), %esi
	movq %mm7, 40(%esp)
	movq 48(%eax), %mm7
	pswapd %mm3, %mm6
	pfmul %mm0, %mm3
	movq %mm1, 56(%esp)
	movq (%ecx,%ebp), %mm1
	pfmul %mm0, %mm6
	pfacc %mm3, %mm5
	movq 176(%eax), %mm3
pswapd %mm1, %mm0	pfmul %mm7, %mm1	pfnacc %mm6, %mm2	movq (%ecx,%edi), %mm6	pfmul %mm7, %mm0	movq %mm5, 64(%esp)	movq %mm2, 72(%esp)	movq 304(%eax), %mm5	movq (%ebx,%ebp), %mm2	pswapd %mm6, %mm7	pfmul %mm3, %mm6	leal (%edx,%edx), %ebp	pfmul %mm3, %mm7	pswapd %mm2, %mm3	pfmul %mm5, %mm2	pfmul %mm5, %mm3	movq 432(%eax), %mm5	pfacc %mm2, %mm1	movq (%ebx,%edi), %mm2	leal (%esi,%ebp,8), %edi	pfnacc %mm3, %mm0	pswapd %mm2, %mm3	pfmul %mm5, %mm2	movq %mm1, 88(%esp)	pfmul %mm5, %mm3	movq %mm0, 112(%esp)	movq (%ecx,%esi), %mm0	movq 16(%eax), %mm5	pfacc %mm6, %mm2	pfnacc %mm7, %mm3	pswapd %mm0, %mm6	movq 400(%eax), %mm7	pfmul %mm5, %mm0	pfacc %mm2, %mm1	movq %mm2, 96(%esp)	movq (%ebx,%edi), %mm2	pfmul %mm5, %mm6	movq %mm3, 104(%esp)	movq %mm1, 80(%esp)	movq 272(%eax), %mm3	movq (%ebx,%esi), %mm1	pswapd %mm2, %mm5	pfmul %mm7, %mm2	leal (%edx,%edx,4), %esi	pfmul %mm7, %mm5	leal (%edi,%esi,2), %ebp	pswapd %mm1, %mm7	pfmul %mm3, %mm1	pfmul %mm3, %mm7	movq 144(%eax), %mm3	pfacc %mm1, %mm0	movq (%ecx,%edi), %mm1	leal (%esi,%edx,8), %edi	pfnacc %mm7, %mm6	leal (%edi,%edx,4), %esi	pswapd %mm1, %mm7	pfmul %mm3, %mm1	movq %mm0, 128(%esp)	pfmul %mm3, %mm7	movq 72(%esp), %mm3	pfacc %mm2, %mm1	movq %mm4, %mm2	pfnacc %mm5, %mm7	movq 16(%esp), %mm5	pfnacc %mm3, %mm4	pfacc %mm1, %mm0	movq %mm1, 120(%esp)	movq %mm7, 136(%esp)	movq 64(%esp), %mm7	movq %mm5, %mm1	pfacc %mm3, %mm5	movq %mm6, %mm3	pfnacc 120(%esp), %mm6	pfnacc %mm7, %mm1	pfacc %mm7, %mm2	movq %mm5, 184(%esp)	movq 56(%esp), %mm7	movq %mm4, %mm5	pfpnacc %mm1, %mm4	movq %mm6, 168(%esp)	movq 40(%esp), %mm6	pfpnacc %mm5, %mm1	movq %mm0, %mm5	pfacc %mm7, %mm5	movq %mm4, 144(%esp)	movq %mm1, 152(%esp)	movq %mm5, 160(%esp)	movq 136(%esp), %mm4	movq 128(%esp), %mm1	movq 32(%esp), %mm5	pfacc %mm4, %mm3	pfnacc %mm4, %mm1	movq 48(%esp), %mm4	pfnacc %mm6, %mm5	movq %mm1, 176(%esp)	movq %mm4, %mm1	pfnacc 24(%esp), %mm4	pfacc %mm6, %mm1	movq %mm5, 200(%esp)	movq 112(%esp), %mm5	movq %mm3, %mm6	pfnacc %mm0, %mm3	pfacc %mm1, %mm6	movq %mm4, 
192(%esp)	movq %mm5, %mm0	pfnacc %mm1, %mm7	movq 104(%esp), %mm4	movq 96(%esp), %mm1	pfnacc 88(%esp), %mm5	pfacc %mm4, %mm0	pfnacc %mm4, %mm1	movq %mm2, %mm4	movq %mm5, 216(%esp)	movq 80(%esp), %mm5	pfnacc %mm0, %mm2	movq %mm1, 208(%esp)	movq 184(%esp), %mm1	pfacc %mm5, %mm4	pswapd %mm5, %mm5	movq %mm2, 224(%esp)	movq %mm1, %mm2	pfnacc %mm5, %mm1	movq %mm3, %mm5	pfpnacc %mm7, %mm3	pfacc %mm0, %mm2	movq %mm4, %mm0	pfpnacc %mm5, %mm7	movq %mm1, 232(%esp)	movq 160(%esp), %mm1	pfnacc %mm6, %mm4	movq %mm2, %mm5	pfacc %mm6, %mm2	movq 224(%esp), %mm6	pfacc %mm1, %mm0	movq %mm4, 296(%esp)	pswapd %mm1, %mm1	movq %mm3, %mm4	pfnacc %mm7, %mm3	pfnacc %mm1, %mm5	movq %mm2, 344(%esp)	movq 208(%esp), %mm2	pfacc %mm4, %mm7	movq 232(%esp), %mm4	movq %mm6, %mm1	movq %mm0, 304(%esp)	movq 216(%esp), %mm0	pfmul KP707106781KP707106781, %mm3	movq %mm5, 288(%esp)	pfmul KP707106781KP707106781, %mm7	pfacc %mm4, %mm6	movq %mm0, %mm5	pfpnacc %mm2, %mm0	pfnacc %mm4, %mm1	movq 200(%esp), %mm4	pfpnacc %mm5, %mm2	movq %mm3, 256(%esp)	movq %mm6, 248(%esp)	movq 192(%esp), %mm3	movq %mm0, %mm5	movq %mm7, 240(%esp)	movq 176(%esp), %mm6	movq %mm4, %mm7	pfnacc %mm2, %mm0	movq %mm1, 280(%esp)	pfacc %mm5, %mm2	movq 168(%esp), %mm5	pfpnacc %mm3, %mm4	movq %mm6, %mm1	pfpnacc %mm7, %mm3	pfmul KP707106781KP707106781, %mm0	pfpnacc %mm5, %mm6	pfmul KP707106781KP707106781, %mm2	pfpnacc %mm1, %mm5	pswapd %mm3, %mm7	pfmul KP923879532KP382683432, %mm3	pfmul KP923879532KP382683432, %mm7	pswapd %mm6, %mm6	movq %mm5, %mm1	pfmul KP382683432KP923879532, %mm5	movq %mm0, 264(%esp)	pswapd %mm4, %mm0	movq %mm2, 272(%esp)	movq %mm6, %mm2	pfmul KP923879532KP382683432, %mm1	pfmul KP382683432KP923879532, %mm2	pfmul KP382683432KP923879532, %mm0	pfmul KP382683432KP923879532, %mm4	pfpnacc %mm5, %mm7	pfmul KP923879532KP382683432, %mm6	movq (%eax), %mm5	pfpnacc %mm3, %mm1	movq %mm7, 328(%esp)	movq (%ecx,%edx), %mm3	pfpnacc %mm0, %mm2	movq 256(%eax), %mm7	movq (%ebx,%edx), %mm0	pfpnacc %mm6, %mm4	movq %mm1, 336(%esp)	pswapd %mm3, 
%mm6	pfmul %mm5, %mm3	movq %mm2, 320(%esp)	pfmul %mm5, %mm6	movq (%ebx,%ebp), %mm2	pswapd %mm0, %mm1	pfmul %mm7, %mm0	movq %mm4, 312(%esp)	movq 480(%eax), %mm4	pfmul %mm7, %mm1	movq 352(%eax), %mm7	pswapd %mm2, %mm5	pfacc %mm0, %mm3	movq (%ebx,%edi), %mm0	pfmul %mm4, %mm2	pfnacc %mm1, %mm6	movq 224(%eax), %mm1	pfmul %mm4, %mm5	movq %mm3, 352(%esp)	movq (%ecx,%ebp), %mm3	pswapd %mm0, %mm4	pfmul %mm7, %mm0	leal (%esi,%edx,8), %ebp	pfmul %mm7, %mm4	pswapd %mm3, %mm7	pfmul %mm1, %mm3	pfmul %mm1, %mm7	movq 96(%eax), %mm1	pfacc %mm3, %mm2	movq (%ecx,%edi), %mm3	leal (%edx,%edx,8), %edi	pfnacc %mm7, %mm5	pswapd %mm3, %mm7	pfmul %mm1, %mm3	pfmul %mm1, %mm7	movq %mm5, %mm1	pfacc %mm0, %mm3	movq %mm2, %mm0	pfnacc %mm4, %mm7	movq 384(%eax), %mm4	pfacc %mm3, %mm2	pfnacc %mm3, %mm5	movq (%ebx,%esi), %mm3	pfacc %mm7, %mm1	pfnacc %mm7, %mm0	movq %mm2, 384(%esp)	movq (%ecx,%esi), %mm2	leal (%edx,%edx,4), %esi	movq %mm5, 360(%esp)	pswapd %mm3, %mm7	movq %mm1, 376(%esp)	movq 128(%eax), %mm5	movq (%ebx,%ebp), %mm1	pfmul %mm4, %mm3	movq %mm0, 368(%esp)	pfmul %mm4, %mm7	movq 448(%eax), %mm4	pswapd %mm2, %mm0	pfmul %mm5, %mm2	pfmul %mm5, %mm0	pswapd %mm1, %mm5	pfmul %mm4, %mm1	pfmul %mm4, %mm5	movq (%ecx,%ebp), %mm4	leal (%edx,%esi,4), %ebp	pfacc %mm3, %mm2	movq 192(%eax), %mm3	pfnacc %mm7, %mm0	pswapd %mm4, %mm7	pfmul %mm3, %mm4	movq %mm2, 440(%esp)	movq 64(%eax), %mm2	pfmul %mm3, %mm7	movq %mm0, 400(%esp)	movq (%ecx,%edi), %mm0	pfacc %mm4, %mm1	movq 320(%eax), %mm4	pfnacc %mm7, %mm5	movq (%ebx,%edi), %mm7	pswapd %mm0, %mm3	pfmul %mm2, %mm0	leal (%edx,%edx), %edi	pfmul %mm2, %mm3	movq %mm1, 424(%esp)	pswapd %mm7, %mm2	pfmul %mm4, %mm7	movq %mm5, 392(%esp)	pfmul %mm4, %mm2	movq 32(%eax), %mm4	pfacc %mm7, %mm0	movq (%ecx,%esi), %mm7	pfnacc %mm2, %mm3	movq %mm0, %mm5	pfacc %mm1, %mm0	pswapd %mm7, %mm2	movq 416(%eax), %mm1	pfmul %mm4, %mm7	pfnacc %mm3, %mm5	movq %mm3, 432(%esp)	movq (%ebx,%ebp), %mm3	pfmul %mm4, %mm2	movq %mm0, 416(%esp)	movq %mm5, 408(%esp)	movq 288(%eax), %mm0	movq 
(%ebx,%esi), %mm5	pswapd %mm3, %mm4	pfmul %mm1, %mm3	leal (%edx,%edx,2), %esi	pfmul %mm1, %mm4	pswapd %mm5, %mm1	pfmul %mm0, %mm5	pfmul %mm0, %mm1	movq 160(%eax), %mm0	pfacc %mm5, %mm7	movq (%ecx,%ebp), %mm5	leal (%edx,%edx,4), %ebp	pfnacc %mm1, %mm2	pswapd %mm5, %mm1	pfmul %mm0, %mm5	pfmul %mm0, %mm1	movq %mm2, %mm0	pfacc %mm3, %mm5	movq %mm7, %mm3	pfnacc %mm4, %mm1	movq 440(%esp), %mm4	pfnacc %mm5, %mm2	pfacc %mm5, %mm3	movq %mm6, %mm5	pfnacc %mm1, %mm7	pfacc %mm1, %mm0	movq %mm2, 448(%esp)	movq 400(%esp), %mm1	movq 352(%esp), %mm2	pfnacc %mm4, %mm6	movq %mm7, 456(%esp)	pfacc %mm1, %mm5	movq %mm2, %mm7	pfnacc %mm1, %mm2	movq %mm3, %mm1	pfnacc %mm0, %mm1	pfacc %mm4, %mm7	movq %mm6, %mm4	pfpnacc %mm2, %mm6	pfpnacc %mm4, %mm2	movq %mm1, 496(%esp)	movq %mm6, 472(%esp)	movq 384(%esp), %mm4	movq 376(%esp), %mm1	movq 432(%esp), %mm6	pfacc %mm4, %mm3	movq %mm2, 464(%esp)	movq 392(%esp), %mm2	pfnacc %mm1, %mm4	pfacc %mm1, %mm0	movq 424(%esp), %mm1	pfacc %mm2, %mm6	movq %mm4, 480(%esp)	movq %mm7, %mm4	pfnacc %mm2, %mm1	movq 416(%esp), %mm2	pfnacc %mm6, %mm4	pfacc %mm2, %mm7	movq %mm1, 488(%esp)	pswapd %mm2, %mm2	movq %mm5, %mm1	pfacc %mm6, %mm5	pfnacc %mm2, %mm1	movq %mm7, %mm6	pfnacc %mm0, %mm7	movq %mm5, %mm2	pfacc %mm3, %mm6	pswapd %mm3, %mm3	pfacc %mm0, %mm2	movq %mm1, %mm0	pfnacc %mm3, %mm5	movq %mm7, 504(%esp)	movq 480(%esp), %mm3	movq 496(%esp), %mm7	pfnacc %mm4, %mm1	pfacc %mm0, %mm4	movq %mm6, 616(%esp)	movq %mm2, 656(%esp)	movq 488(%esp), %mm6	movq 408(%esp), %mm2	movq %mm3, %mm0	movq %mm5, 512(%esp)	movq %mm1, 560(%esp)	pfpnacc %mm7, %mm0	pswapd %mm7, %mm7	movq %mm6, %mm5	movq %mm4, 528(%esp)	movq 456(%esp), %mm4	pfpnacc %mm3, %mm7	movq 448(%esp), %mm3	pfpnacc %mm2, %mm5	pswapd %mm2, %mm2	movq %mm0, %mm1	pfpnacc %mm6, %mm2	movq %mm4, %mm6	pfacc %mm7, %mm1	pfnacc %mm7, %mm0	movq %mm5, %mm7	pfpnacc %mm3, %mm4	pfnacc %mm2, %mm5	pfmul KP707106781KP707106781, %mm1	pfpnacc %mm6, %mm3	movq 368(%esp), %mm6	pfmul KP707106781KP707106781, %mm0	pfacc %mm7, %mm2	pswapd %mm4, 
%mm4	pfmul KP707106781KP707106781, %mm5	movq %mm3, %mm7	pfmul KP923879532KP382683432, %mm3	pfmul KP707106781KP707106781, %mm2	movq %mm1, 520(%esp)	movq %mm0, 552(%esp)	movq 360(%esp), %mm1	movq %mm6, %mm0	pfmul KP382683432KP923879532, %mm7	movq %mm5, 536(%esp)	movq %mm4, %mm5	pfmul KP382683432KP923879532, %mm4	pfpnacc %mm1, %mm6	pfpnacc %mm0, %mm1	movq %mm2, 544(%esp)	pfmul KP923879532KP382683432, %mm5	movq %mm6, %mm2	pfmul KP382683432KP923879532, %mm6	pswapd %mm1, %mm1	pfmul KP923879532KP382683432, %mm2	movq %mm1, %mm0	pfmul KP382683432KP923879532, %mm1	pfmul KP923879532KP382683432, %mm0	pfpnacc %mm5, %mm6	movq 120(%eax), %mm5	pfpnacc %mm2, %mm4	movq (%ecx,%edi,8), %mm2	pfpnacc %mm1, %mm3	movq (%ebx,%edi,8), %mm1	leal (%ebp,%edx,2), %edi	movq %mm6, 576(%esp)	movq 376(%eax), %mm6	pfpnacc %mm7, %mm0	movq %mm4, 568(%esp)	pswapd %mm2, %mm7	pfmul %mm5, %mm2	pswapd %mm1, %mm4	movq %mm3, 584(%esp)	pfmul %mm5, %mm7	movq (%ecx,%edx,8), %mm5	pfmul %mm6, %mm4	movq %mm0, 600(%esp)	movq 56(%eax), %mm0	pfmul %mm6, %mm1	movq 312(%eax), %mm6

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -