📄 t1k7i_64.s
字号:
/* * Copyright (c) 2003, 2006 Matteo Frigo * Copyright (c) 2003, 2006 Massachusetts Institute of Technology * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA * *//* This file was automatically generated --- DO NOT EDIT *//* Generated on Fri Jan 27 20:13:41 EST 2006 */#include "config.h"/* cheap-mode: VECTGRADE_FULL succeeded. (1024 steps) *//* Generated by: ../../../genfft-k7/gen_twiddle -no-randomized-cse -n 64 -sign 1 -name t1k7i_64 *//* * Generator Id's : * $Id: algsimp.ml,v 1.4 2006-01-05 03:04:27 stevenj Exp $ * $Id: fft.ml,v 1.4 2006-01-05 03:04:27 stevenj Exp $ * $Id: gen_twiddle.ml,v 1.14 2005-12-24 21:08:49 athena Exp $ *//* The following asm code is Copyright (c) 2000-2001 Stefan Kral */.section .rodata .balign 64KP707106781KP707106781: .float +0.707106781186547524400844362104849039284835938, +0.707106781186547524400844362104849039284835938KP382683432KP923879532: .float +0.382683432365089771728459984030398866761344562, +0.923879532511286756128183189396788286822416626KP923879532KP382683432: .float +0.923879532511286756128183189396788286822416626, +0.382683432365089771728459984030398866761344562KP831469612KP555570233: .float +0.831469612302545237078788377617905756738560812, +0.555570233019602224742830813948532874374937191KP195090322KP980785280: .float +0.195090322016128267848284868477022240927691618, +0.980785280403230449126182236134239036973933731KP555570233KP831469612: .float +0.555570233019602224742830813948532874374937191, +0.831469612302545237078788377617905756738560812KP980785280KP195090322: .float +0.980785280403230449126182236134239036973933731, +0.195090322016128267848284868477022240927691618KP634393284KP773010453: .float +0.634393284163645498215171613225493370675687095, +0.773010453362736960810906609758469800971041293KP098017140KP995184726: .float +0.098017140329560601994195563888641845861136673, +0.995184726672196886244836953109479921575474869KP773010453KP634393284: .float +0.773010453362736960810906609758469800971041293, +0.634393284163645498215171613225493370675687095KP995184726KP098017140: .float +0.995184726672196886244836953109479921575474869, +0.098017140329560601994195563888641845861136673KP881921264KP471396736: .float +0.881921264348355029712756863660388349508442621, +0.471396736825997648556387625905254377657460319KP471396736KP881921264: .float +0.471396736825997648556387625905254377657460319, +0.881921264348355029712756863660388349508442621KP290284677KP956940335: .float +0.290284677254462367636192375817395274691476278, +0.956940335732208864935797886980269969482849206KP956940335KP290284677: .float +0.956940335732208864935797886980269969482849206, +0.290284677254462367636192375817395274691476278.text.text .balign 64t1k7i_64: subl $1308, %esp femms movl 1324(%esp), %edx movl 1316(%esp), %ecx movl %ebx, 1304(%esp) movl 1320(%esp), %eax movl %esi, 1300(%esp) movl %edi, 1296(%esp) leal (,%edx,4), %edx movl %ebp, 1292(%esp) movl %edx, %ebx sall $5, %ebx addl %ecx, %ebx sall $2, 1332(%esp) .p2align 4,,7.L0: /* promise simd cell size = 8 */ movq (%ebx), %mm1 leal (%edx,%edx), %esi movq 248(%eax), %mm0 movq 376(%eax), %mm3 leal (%edx,%edx,2), %edi movq 120(%eax), %mm6 movq (%ebx,%esi,8), %mm4 movq (%ecx,%esi,8), %mm7 leal (%edi,%edx,4), %ebp pswapd %mm1, %mm2 pfmul %mm0, %mm1 leal (%ebp,%edx,8), %esi pfmul %mm0, %mm2 pswapd %mm4, %mm5 pfmul %mm3, %mm4 pswapd %mm7, %mm0 pfmul %mm6, %mm7 pfmul %mm3, %mm5 movq (%ecx), %mm3 pfmul %mm6, %mm0 pfpnacc %mm2, %mm1 pfnacc %mm4, %mm7 movq 312(%eax), %mm4 movq %mm3, %mm6 pfacc %mm5, %mm0 movq (%ebx,%edx,8), %mm5 pfadd %mm1, %mm3 movq %mm7, %mm2 pfsub %mm1, %mm6 pfacc %mm0, %mm2 pswapd %mm5, %mm1 pswapd %mm0, %mm0 pfmul %mm4, %mm5 pfmul %mm4, %mm1 movq %mm6, 8(%esp) movq (%ecx,%edx,8), %mm4 pfnacc %mm7, %mm0 movq 56(%eax), %mm7 movq %mm3, %mm6 pfsub %mm2, %mm3 pfadd %mm2, %mm6 pswapd %mm4, %mm2 pfmul %mm7, %mm4 movq %mm0, 0(%esp) movq %mm3, 16(%esp) movq 184(%eax), %mm0 pfmul %mm7, %mm2 movq %mm6, 56(%esp) movq (%ecx,%edi,8), %mm3 movq 440(%eax), %mm6 pfnacc %mm5, %mm4 movq (%ebx,%edi,8), %mm5 leal (%edx,%esi,2), %edi pfacc %mm1, %mm2 pswapd %mm3, %mm7 leal (%ebp,%edx,4), %esi pfmul %mm0, %mm3 pfmul %mm0, %mm7 pswapd %mm5, %mm1 pfmul %mm6, %mm5 movq %mm4, %mm0 pfmul %mm6, %mm1 pfnacc %mm2, %mm0 pfnacc %mm3, %mm5 pfacc %mm7, %mm1 movq %mm0, %mm6 movq 304(%eax), %mm7 pfacc %mm5, %mm4 pfnacc %mm1, %mm5 pfacc %mm2, %mm1 movq (%ebx,%ebp), %mm2 movq %mm4, %mm3 pfpnacc %mm5, %mm6 pswapd %mm5, %mm5 pfacc %mm1, %mm4 pfnacc %mm3, %mm1 pswapd %mm2, %mm3 pfpnacc %mm0, %mm5 pfmul %mm7, %mm2 movq 48(%eax), %mm0 pfmul %mm7, %mm3 movq %mm6, 32(%esp) movq %mm4, 48(%esp) movq (%ecx,%ebp), %mm7 movq 240(%eax), %mm4 leal (%edx,%edx), %ebp movq %mm1, 40(%esp) movq %mm5, 24(%esp) movq (%ecx,%edi), %mm1 pswapd %mm7, %mm6 pfmul %mm0, %mm7 pfmul %mm0, %mm6 movq 496(%eax), %mm0 pswapd %mm1, %mm5 pfmul %mm4, %mm1 pfnacc %mm2, %mm7 movq (%ebx,%edi), %mm2 pfmul %mm4, %mm5 leal (%esi,%ebp,8), %edi leal (%esi,%edx,4), %ebp pfacc %mm3, %mm6 movq 336(%eax), %mm3 pswapd %mm2, %mm4 pfmul %mm0, %mm2 movq %mm7, 64(%esp) movq %mm6, 72(%esp) movq (%ebx,%esi), %mm7 pfmul %mm0, %mm4 movq 464(%eax), %mm0 pfnacc %mm1, %mm2 movq (%ebx,%edi), %mm1 pswapd %mm7, %mm6 pfmul %mm3, %mm7 pfacc %mm5, %mm4 pfmul %mm3, %mm6 movq %mm2, 80(%esp) movq 80(%eax), %mm3 movq (%ecx,%esi), %mm2 pswapd %mm1, %mm5 pfmul %mm0, %mm1 leal (%ebp,%edx,8), %esi pfmul %mm0, %mm5 pswapd %mm2, %mm0 pfmul %mm3, %mm2 pfmul %mm3, %mm0 movq 208(%eax), %mm3 pfnacc %mm7, %mm2 movq (%ecx,%edi), %mm7 leal (%ebp,%edx,4), %edi pfacc %mm6, %mm0 pswapd %mm7, %mm6 pfmul %mm3, %mm7 pfmul %mm3, %mm6 pfnacc %mm7, %mm1 pfacc %mm6, %mm5 movq 112(%eax), %mm6 movq %mm1, %mm3 pfnacc %mm0, %mm1 movq %mm5, %mm7 pfacc %mm0, %mm5 movq (%ecx,%ebp), %mm0 pfacc %mm2, %mm3 pfnacc %mm2, %mm7 movq %mm1, 88(%esp) movq %mm5, 104(%esp) movq 368(%eax), %mm2 movq (%ebx,%ebp), %mm5 pswapd %mm0, %mm1 pfmul %mm6, %mm0 movq %mm3, 112(%esp) leal (%edx,%edx,2), %ebp movq %mm7, 96(%esp) movq (%ecx,%esi), %mm7 pfmul %mm6, %mm1 movq 176(%eax), %mm6 pswapd %mm5, %mm3 pfmul %mm2, %mm5 pfmul %mm2, %mm3 pswapd %mm7, %mm2 pfmul %mm6, %mm7 pfmul %mm6, %mm2 movq (%ebx,%esi), %mm6 pfnacc %mm5, %mm0 movq 432(%eax), %mm5 leal (%ebp,%edx,4), %esi pfacc %mm3, %mm1 pswapd %mm6, %mm3 movq %mm0, 152(%esp) movq 400(%eax), %mm0 pfmul %mm5, %mm6 pfmul %mm5, %mm3 movq %mm1, 144(%esp) movq (%ebx,%edi), %mm5 pfnacc %mm7, %mm6 movq 16(%eax), %mm7 pfacc %mm2, %mm3 movq (%ecx,%ebp), %mm2 pswapd %mm5, %mm1 pfmul %mm0, %mm5 pfmul %mm0, %mm1 movq %mm6, 128(%esp) pswapd %mm2, %mm0 pfnacc %mm3, %mm6 movq %mm3, 136(%esp) pfmul %mm7, %mm2 movq 144(%eax), %mm3 pfmul %mm7, %mm0 movq (%ecx,%edi), %mm7 leal (%edx,%edx,4), %edi movq %mm6, 120(%esp) pswapd %mm7, %mm6 pfmul %mm3, %mm7 pfmul %mm3, %mm6 movq 272(%eax), %mm3 pfnacc %mm5, %mm7 movq (%ebx,%ebp), %mm5 pfacc %mm1, %mm6 pswapd %mm5, %mm1 pfmul %mm3, %mm5 pfmul %mm3, %mm1 pfnacc %mm5, %mm2 pfacc %mm1, %mm0 movq 144(%esp), %mm1 movq %mm2, %mm3 pfnacc %mm6, %mm2 movq %mm0, %mm5 pfacc %mm7, %mm3 pfacc %mm6, %mm0 movq %mm4, %mm6 pfnacc %mm7, %mm5 movq %mm2, 160(%esp) movq 80(%esp), %mm7 pfacc %mm1, %mm4 movq %mm5, 168(%esp) movq 152(%esp), %mm5 movq %mm7, %mm2 pfnacc %mm1, %mm7 movq %mm3, %mm1 pfnacc %mm0, %mm3 pfnacc %mm5, %mm6 pfacc %mm5, %mm2 movq %mm3, 192(%esp) movq 112(%esp), %mm3 movq %mm6, %mm5 pfpnacc %mm7, %mm6 pfpnacc %mm5, %mm7 movq 104(%esp), %mm5 pfacc %mm3, %mm1 movq %mm6, 176(%esp) movq 64(%esp), %mm6 pfnacc %mm5, %mm3 movq %mm7, 184(%esp) movq 72(%esp), %mm7 pfacc %mm5, %mm0 movq %mm1, 208(%esp) movq 136(%esp), %mm5 movq %mm6, %mm1 pfacc 128(%esp), %mm6 movq %mm3, 200(%esp) pfnacc %mm7, %mm1 movq %mm4, %mm3 pfacc %mm7, %mm5 movq %mm2, %mm7 pfnacc %mm6, %mm3 pfacc %mm5, %mm4 pfacc %mm6, %mm7 movq 208(%esp), %mm6 pfnacc %mm5, %mm2 movq %mm4, %mm5 pfnacc %mm6, %mm4 pfacc %mm0, %mm5 pswapd %mm0, %mm0 movq %mm4, 216(%esp) movq %mm7, %mm4 pfnacc %mm0, %mm7 movq %mm5, 320(%esp) movq 200(%esp), %mm5 movq %mm3, %mm0 pfacc %mm6, %mm4 movq 192(%esp), %mm6 pfnacc %mm2, %mm3 pfacc %mm0, %mm2 movq %mm7, 224(%esp) movq 120(%esp), %mm7 pswapd %mm5, %mm0 movq %mm4, 312(%esp) pfpnacc %mm6, %mm0 movq %mm3, 272(%esp) pfpnacc %mm5, %mm6 pswapd %mm7, %mm4 movq %mm2, 256(%esp) movq 96(%esp), %mm2 pfpnacc %mm1, %mm4 pfpnacc %mm7, %mm1 movq 88(%esp), %mm7 movq %mm6, %mm3 pfacc %mm0, %mm6 pfnacc %mm0, %mm3 movq %mm2, %mm0 movq %mm1, %mm5 pfacc %mm4, %mm1 pfmul KP707106781KP707106781, %mm6 pfpnacc %mm7, %mm2 pfnacc %mm5, %mm4 pfmul KP707106781KP707106781, %mm3 pfpnacc %mm0, %mm7 pfmul KP707106781KP707106781, %mm1 movq %mm2, %mm5 pfmul KP382683432KP923879532, %mm2 pfmul KP707106781KP707106781, %mm4 movq %mm6, 232(%esp) movq 168(%esp), %mm6 pswapd %mm7, %mm7 pfmul KP923879532KP382683432, %mm5 movq %mm3, 264(%esp) movq 160(%esp), %mm3 movq %mm7, %mm0 movq %mm1, 248(%esp) pfmul KP923879532KP382683432, %mm7 movq %mm6, %mm1 pfmul KP382683432KP923879532, %mm0 movq %mm4, 240(%esp) pfpnacc %mm3, %mm6 pfpnacc %mm1, %mm3 pswapd %mm6, %mm4 pfmul KP382683432KP923879532, %mm6 pswapd %mm3, %mm1 pfmul KP923879532KP382683432, %mm3 pfmul KP382683432KP923879532, %mm4 pfmul KP923879532KP382683432, %mm1 pfpnacc %mm6, %mm2 movq 88(%eax), %mm6 pfpnacc %mm0, %mm3 movq (%ecx,%ebp,4), %mm0 pfpnacc %mm5, %mm4 pfpnacc %mm1, %mm7 movq %mm2, 288(%esp) movq 344(%eax), %mm1 movq (%ebx,%ebp,4), %mm2 leal (%edx,%edx,8), %ebp movq %mm3, 296(%esp) pswapd %mm0, %mm5 pfmul %mm6, %mm0 movq %mm4, 280(%esp) movq %mm7, 304(%esp) movq 280(%eax), %mm4 movq (%ebx,%edx,4), %mm7 pfmul %mm6, %mm5 pswapd %mm2, %mm3 pfmul %mm1, %mm2 pfmul %mm1, %mm3 movq 24(%eax), %mm1 pswapd %mm7, %mm6 pfmul %mm4, %mm7 pfnacc %mm2, %mm0 movq (%ecx,%edx,4), %mm2 pfmul %mm4, %mm6 pfacc %mm3, %mm5 movq 216(%eax), %mm3 pswapd %mm2, %mm4 pfmul %mm1, %mm2 movq %mm0, 328(%esp) movq (%ecx,%esi,4), %mm0 pfmul %mm1, %mm4 movq %mm5, 344(%esp) movq 472(%eax), %mm5 pfnacc %mm7, %mm2 movq (%ebx,%esi,4), %mm7 leal (%ebp,%edx,4), %esi pswapd %mm0, %mm1 pfmul %mm3, %mm0 pfacc %mm6, %mm4 pfmul %mm3, %mm1 movq 408(%eax), %mm3 pswapd %mm7, %mm6 pfmul %mm5, %mm7 pfmul %mm5, %mm6 movq (%ebx,%edi,4), %mm5 pfnacc %mm0, %mm7 pswapd %mm5, %mm0 pfacc %mm1, %mm6 movq 152(%eax), %mm1 pfmul %mm3, %mm5 pfmul %mm3, %mm0 movq (%ecx,%edi,4), %mm3 leal (%edx,%edx), %edi movq %mm6, 336(%esp) pswapd %mm3, %mm6 pfmul %mm1, %mm3 pfmul %mm1, %mm6 movq %mm4, %mm1 pfnacc %mm5, %mm3 movq %mm2, %mm5 pfacc %mm0, %mm6 movq 328(%esp), %mm0 pfnacc %mm3, %mm4 pfacc %mm3, %mm5 movq %mm7, %mm3 pfnacc %mm6, %mm2 pfacc %mm6, %mm1 movq %mm4, %mm6 pfacc %mm0, %mm3 movq %mm5, 376(%esp) pfpnacc %mm2, %mm4 pfpnacc %mm6, %mm2 movq %mm1, 368(%esp) movq 344(%esp), %mm1 pswapd %mm4, %mm5 pfmul KP382683432KP923879532, %mm4 pswapd %mm2, %mm6 pfmul KP923879532KP382683432, %mm2 pfnacc %mm1, %mm7 pfmul KP382683432KP923879532, %mm5 pfmul KP923879532KP382683432, %mm6 movq %mm2, 360(%esp) movq %mm6, 352(%esp) movq 336(%esp), %mm2 movq %mm2, %mm6 pfnacc %mm0, %mm2 movq %mm7, %mm0 pfacc %mm1, %mm6 pfpnacc %mm2, %mm7 pfpnacc %mm0, %mm2 movq %mm7, 400(%esp) movq 376(%esp), %mm0 movq %mm2, %mm1 pfmul KP382683432KP923879532, %mm2 movq %mm0, %mm7 pfacc %mm3, %mm0 pfmul KP923879532KP382683432, %mm1 pfnacc %mm6, %mm3 movq %mm0, 432(%esp) movq 320(%eax), %mm0 pfpnacc %mm4, %mm2 movq (%ebx,%ebp), %mm4 pfpnacc %mm1, %mm5 pswapd %mm4, %mm1 movq %mm2, 384(%esp) pfmul %mm0, %mm4 movq %mm5, 392(%esp) movq 368(%esp), %mm2 pfmul %mm0, %mm1 movq 64(%eax), %mm5 movq (%ecx,%ebp), %mm0 leal (%esi,%edi,8), %ebp pfnacc %mm2, %mm7 pfacc %mm2, %mm6 pswapd %mm0, %mm2 pfmul %mm5, %mm0 pfmul %mm5, %mm2 movq %mm7, %mm5 movq %mm6, 424(%esp) movq 256(%eax), %mm6 pfnacc %mm4, %mm0 movq (%ebx,%edx), %mm4 pfpnacc %mm3, %mm5 pswapd %mm3, %mm3 pfacc %mm1, %mm2 pfpnacc %mm7, %mm3 movq %mm0, 440(%esp) movq (%eax), %mm7 movq (%ecx,%edx), %mm0 pswapd %mm4, %mm1 pfmul %mm6, %mm4 movq %mm5, 408(%esp) pfmul %mm6, %mm1 movq %mm2, 448(%esp) movq %mm3, 416(%esp) movq (%ebx,%esi), %mm2 movq 352(%eax), %mm6 pswapd %mm0, %mm5 pfmul %mm7, %mm0 pfmul %mm7, %mm5 pswapd %mm2, %mm3 movq 480(%eax), %mm7 pfmul %mm6, %mm2 pfnacc %mm4, %mm0 movq (%ebx,%ebp), %mm4 pfmul %mm6, %mm3 pfacc %mm1, %mm5 movq %mm0, 456(%esp) movq 96(%eax), %mm1 movq (%ecx,%esi), %mm0 pswapd %mm4, %mm6 pfmul %mm7, %mm4 leal (%edx,%edi,8), %esi pfmul %mm7, %mm6 leal (%esi,%edx,8), %edi pswapd %mm0, %mm7 pfmul %mm1, %mm0 pfmul %mm1, %mm7 movq 224(%eax), %mm1 pfnacc %mm2, %mm0 movq (%ecx,%ebp), %mm2 leal (%esi,%edx,4), %ebp pfacc %mm3, %mm7 pswapd %mm2, %mm3 pfmul %mm1, %mm2 pfmul %mm1, %mm3 pfnacc %mm2, %mm4 pfacc %mm3, %mm6 movq 128(%eax), %mm3 movq %mm4, %mm1 pfnacc %mm7, %mm4 movq %mm6, %mm2 pfacc %mm7, %mm6 movq (%ecx,%esi), %mm7 pfacc %mm0, %mm1 pfnacc %mm0, %mm2 movq %mm4, 464(%esp) movq %mm6, 480(%esp) movq 384(%eax), %mm0 movq (%ebx,%esi), %mm6 pswapd %mm7, %mm4 pfmul %mm3, %mm7 movq %mm1, 488(%esp) leal (%edx,%edx,4), %esi movq %mm2, 472(%esp) movq (%ecx,%edi), %mm2 pfmul %mm3, %mm4 movq 192(%eax), %mm3 pswapd %mm6, %mm1 pfmul %mm0, %mm6 pfmul %mm0, %mm1 pswapd %mm2, %mm0 pfmul %mm3, %mm2 pfmul %mm3, %mm0 movq (%ebx,%edi), %mm3 pfnacc %mm6, %mm7 movq 448(%eax), %mm6 leal (%edx,%edx,8), %edi pfacc %mm1, %mm4 pswapd %mm3, %mm1 movq %mm7, 528(%esp) movq 416(%eax), %mm7 pfmul %mm6, %mm3 pfmul %mm6, %mm1 movq %mm4, 520(%esp) movq (%ebx,%ebp), %mm6
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -