/* * Copyright (c) 2003 Matteo Frigo * Copyright (c) 2003 Massachusetts Institute of Technology * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA * */ /* This file was automatically generated --- DO NOT EDIT */ /* Generated on Sat Jul 5 21:51:51 EDT 2003 */ #include "config.h" /* cheap-mode: VECTGRADE_FULL succeeded. (134 steps) */ /* Generated by: /homee/stevenj/cvs/fftw3.0.1/genfft-k7/gen_twiddle -no-randomized-cse -n 9 -name t1k7_9 */ /* * Generator Id's : * $Id: algsimp.ml,v 1.3 2003/03/15 20:29:42 stevenj Exp $ * $Id: fft.ml,v 1.3 2003/03/15 20:29:43 stevenj Exp $ * $Id: gen_twiddle.ml,v 1.13 2003/04/18 01:21:45 athena Exp $ */ /* The following asm code is Copyright (c) 2000-2001 Stefan Kral */ .section .rodata .balign 64 KP500000000KP500000000: .float +0.500000000000000000000000000000000000000000000, +0.500000000000000000000000000000000000000000000 KP866025403KP866025403: .float +0.866025403784438646763723170752936183471402627, +0.866025403784438646763723170752936183471402627 KN866025403KN866025403: .float -0.866025403784438646763723170752936183471402627, -0.866025403784438646763723170752936183471402627 KN984807753KP342020143: .float -0.984807753012208059366743024589523013670643252, +0.342020143325668733044099614682259580763083368 KP173648177KN939692620: .float +0.173648177666930348851716626769314796000375677, -0.939692620785908384054109277324731469936208134 KP984807753KP342020143: .float +0.984807753012208059366743024589523013670643252, +0.342020143325668733044099614682259580763083368 KP173648177KP939692620: .float +0.173648177666930348851716626769314796000375677, +0.939692620785908384054109277324731469936208134 KP766044443KP173648177: .float +0.766044443118978035202392650555416673935832457, +0.173648177666930348851716626769314796000375677 KP642787609KP984807753: .float +0.642787609686539326322643409907263432907559884, +0.984807753012208059366743024589523013670643252 .text .text .balign 64 t1k7_9: subl $76, %esp femms movl %ebx, 72(%esp) movl 92(%esp), %edx movl 100(%esp), %ebx movl %esi, 68(%esp) movl %edi, 64(%esp) movl 80(%esp), %ecx movl %ebp, 60(%esp) movl 88(%esp), %eax movl 96(%esp), %esi leal (,%edx,4), %edx leal (,%ebx,4), %ebx .p2align 4,,7 .L0: /* promise simd cell size = 8 */ leal (%edx,%edx,2), %edi movq 16(%eax), %mm0 movq 40(%eax), %mm3 movq (%ecx,%edx), %mm7 movq (%ecx,%edi), %mm1 movq (%ecx,%edi,2), %mm4 leal (%edi,%edx,4), %ebp movq (%eax), %mm6 leal (%edx,%edx,4), %edi pswapd %mm1, %mm2 pswapd %mm4, %mm5 pfmul %mm0, %mm1 pfmul %mm3, %mm4 pfmul %mm0, %mm2 pswapd %mm7, %mm0 pfmul %mm3, %mm5 pfmul %mm6, %mm7 pfacc %mm4, %mm1 pfmul %mm6, %mm0 movq (%ecx,%edx,2), %mm6 movq 8(%eax), %mm4 pfnacc %mm5, %mm2 movq %mm1, %mm3 pswapd %mm6, %mm5 pfmul %mm4, %mm6 pswapd %mm3, %mm3 pfacc %mm2, %mm1 pfmul %mm4, %mm5 movq (%ecx,%edx,4), %mm4 pfnacc %mm3, %mm2 movq 24(%eax), %mm3 pfacc %mm6, %mm7 movq %mm1, 16(%esp) pfmul KP500000000KP500000000, %mm1 pfnacc %mm5, %mm0 pswapd %mm4, %mm6 pfmul KP866025403KP866025403, %mm2 movq 56(%eax), %mm5 pfmul %mm3, %mm4 pfmul %mm3, %mm6 movq %mm0, 24(%esp) movq %mm1, 8(%esp) movq %mm2, 0(%esp) movq (%ecx,%edx,8), %mm3 movq 48(%eax), %mm0 movq (%ecx,%ebp), %mm2 pswapd %mm3, %mm1 pfmul %mm5, %mm3 leal (%edx,%edx,2), %ebp pfmul %mm5, %mm1 pswapd %mm2, %mm5 pfmul %mm0, %mm2 pfmul %mm0, %mm5 movq 32(%eax), %mm0 addl $64, %eax pfacc %mm2, %mm4 movq (%ecx,%edi), %mm2 leal (%ebp,%edx,4), %edi pfnacc %mm5, %mm6 pswapd %mm2, %mm5 pfmul %mm0, %mm2 pfmul %mm0, %mm5 movq %mm4, %mm0 pfacc %mm3, %mm2 movq %mm6, %mm3 pfnacc %mm1, %mm5 movq %mm7, %mm1 pfacc %mm2, %mm4 pfnacc %mm2, %mm0 pfacc %mm5, %mm3 pfnacc %mm5, %mm6 pfadd %mm4, %mm7 pfmul KP500000000KP500000000, %mm4 pfmul KN866025403KN866025403, %mm0 movq %mm3, %mm2 pfmul KP866025403KP866025403, %mm6 pfmul KP500000000KP500000000, %mm2 pfsub %mm4, %mm1 movq 24(%esp), %mm4 movq %mm1, %mm5 pfadd %mm6, %mm1 pfsub %mm6, %mm5 movq %mm4, %mm6 pfsub %mm2, %mm4 pfadd %mm3, %mm6 movq %mm0, %mm3 movq %mm1, 32(%esp) pswapd %mm7, %mm1 movq %mm5, %mm2 pfmul KN984807753KP342020143, %mm5 pfadd %mm4, %mm3 pfsubr %mm4, %mm0 pfmul KP173648177KN939692620, %mm2 movq (%ecx), %mm4 pfacc %mm6, %mm7 /* simd data load/store barrier */ pfnacc %mm1, %mm6 movq %mm3, 40(%esp) movq %mm4, %mm1 pfadd 16(%esp), %mm4 movq %mm5, 48(%esp) movq %mm7, %mm3 pfmul KP866025403KP866025403, %mm6 pfsub 8(%esp), %mm1 pfmul KP500000000KP500000000, %mm3 movq %mm4, %mm5 pfadd %mm7, %mm5 movq %mm0, %mm7 pfmul KP984807753KP342020143, %mm0 pfsub %mm3, %mm4 pfmul KP173648177KP939692620, %mm7 movq %mm5, (%ecx) movq 0(%esp), %mm5 movq %mm4, %mm3 pfsub %mm6, %mm4 pfadd %mm2, %mm0 movq %mm1, %mm2 pfadd %mm6, %mm3 movq 32(%esp), %mm6 pfadd 48(%esp), %mm7 pfadd %mm5, %mm2 movq %mm4, (%ecx,%ebp,2) pfsub %mm5, %mm1 movq 40(%esp), %mm5 movq %mm3, (%ecx,%ebp) pswapd %mm0, %mm3 movq %mm6, %mm4 pfmul KP766044443KP173648177, %mm6 leal (%edx,%edx,4), %ebp pfmul KP642787609KP984807753, %mm4 pfpnacc %mm7, %mm3 pfpnacc %mm0, %mm7 movq %mm5, %mm0 pfmul KP766044443KP173648177, %mm5 pfmul KP642787609KP984807753, %mm0 pswapd %mm3, %mm3 pswapd %mm7, %mm7 pfmul KP866025403KP866025403, %mm3 pfsub %mm4, %mm5 pfadd %mm0, %mm6 movq %mm1, %mm0 pfadd %mm7, %mm1 pfmul KP500000000KP500000000, %mm7 pswapd %mm6, %mm4 pfacc %mm5, %mm6 movq %mm1, (%ecx,%edx,2) pfnacc %mm4, %mm5 movq %mm2, %mm4 pfsub %mm7, %mm0 pfadd %mm6, %mm2 pfmul KP500000000KP500000000, %mm6 pfmul KP866025403KP866025403, %mm5 movq %mm0, %mm1 pfadd %mm3, %mm0 movq %mm2, (%ecx,%edx) pfsub %mm3, %mm1 pfsub %mm6, %mm4 movq %mm0, (%ecx,%ebp) movq %mm1, (%ecx,%edx,8) movq %mm4, %mm2 pfadd %mm5, %mm4 pfsub %mm5, %mm2 movq %mm4, (%ecx,%edx,4) movq %mm2, (%ecx,%edi) addl %ebx, %ecx decl %esi jnz .L0 femms movl 72(%esp), %ebx movl 68(%esp), %esi movl 64(%esp), %edi movl 60(%esp), %ebp addl $76, %esp ret .section .rodata nam: .string "t1k7_9" .align 4 twinstr: .byte 4 .byte 0 .value 9 .byte 3 .byte 1 .value 0 .align 4 desc: .long 9 .long nam .long twinstr .zero 4 .double 48 .double 36 .double 0 .double 0 .long fftwf_kdft_ct_k7_mgenus .long 0 .long 0 .long 0 .text .align 4 .globl fftwf_codelet_t1k7_9 fftwf_codelet_t1k7_9: subl $12,%esp movl 16(%esp),%eax addl $-4,%esp pushl $desc pushl $t1k7_9 pushl %eax call fftwf_kdft_dit_register addl $16,%esp addl $12,%esp ret