ref: 4f9a9087f16b92662389be3dc0589629359ac8a4
dir: /libfaad/fftw/fni_16.c/
/* * Copyright (c) 1997-1999 Massachusetts Institute of Technology * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA * */ /* This file was automatically generated --- DO NOT EDIT */ /* Generated on Sun Nov 7 20:44:15 EST 1999 */ #include <fftw-int.h> #include <fftw.h> /* Generated by: ./genfft -magic-alignment-check -magic-twiddle-load-all -magic-variables 4 -magic-loopi -notwiddleinv 16 */ /* * This function contains 144 FP additions, 24 FP multiplications, * (or, 136 additions, 16 multiplications, 8 fused multiply/add), * 46 stack variables, and 64 memory accesses */ static const fftw_real K382683432 = FFTW_KONST(+0.382683432365089771728459984030398866761344562); static const fftw_real K923879532 = FFTW_KONST(+0.923879532511286756128183189396788286822416626); static const fftw_real K707106781 = FFTW_KONST(+0.707106781186547524400844362104849039284835938); /* * Generator Id's : * $Id: fni_16.c,v 1.1 2002/04/07 21:26:04 menno Exp $ * $Id: fni_16.c,v 1.1 2002/04/07 21:26:04 menno Exp $ * $Id: fni_16.c,v 1.1 2002/04/07 21:26:04 menno Exp $ */ void fftwi_no_twiddle_16(const fftw_complex *input, fftw_complex *output, int istride, int ostride) { fftw_real tmp7; fftw_real tmp129; fftw_real tmp38; fftw_real tmp115; fftw_real tmp49; fftw_real tmp95; fftw_real tmp83; fftw_real tmp105; fftw_real tmp29; fftw_real tmp123; fftw_real tmp73; fftw_real tmp101; fftw_real tmp78; fftw_real tmp102; fftw_real tmp126; fftw_real tmp141; fftw_real tmp14; fftw_real tmp116; fftw_real tmp45; fftw_real tmp130; fftw_real tmp52; fftw_real tmp84; fftw_real tmp55; fftw_real tmp85; fftw_real tmp22; fftw_real tmp118; fftw_real tmp62; fftw_real tmp98; fftw_real tmp67; fftw_real tmp99; fftw_real tmp121; fftw_real tmp140; ASSERT_ALIGNED_DOUBLE; { fftw_real tmp3; fftw_real tmp81; fftw_real tmp34; fftw_real tmp48; fftw_real tmp6; fftw_real tmp47; fftw_real tmp37; fftw_real tmp82; ASSERT_ALIGNED_DOUBLE; { fftw_real tmp1; fftw_real tmp2; fftw_real tmp32; fftw_real tmp33; ASSERT_ALIGNED_DOUBLE; tmp1 = c_re(input[0]); tmp2 = c_re(input[8 * istride]); tmp3 = tmp1 + tmp2; tmp81 = tmp1 - tmp2; tmp32 = c_im(input[0]); tmp33 = c_im(input[8 * istride]); tmp34 = tmp32 + tmp33; tmp48 = tmp32 - tmp33; } { fftw_real tmp4; fftw_real tmp5; fftw_real tmp35; fftw_real tmp36; ASSERT_ALIGNED_DOUBLE; tmp4 = c_re(input[4 * istride]); tmp5 = c_re(input[12 * istride]); tmp6 = tmp4 + tmp5; tmp47 = tmp4 - tmp5; tmp35 = c_im(input[4 * istride]); tmp36 = c_im(input[12 * istride]); tmp37 = tmp35 + tmp36; tmp82 = tmp35 - tmp36; } tmp7 = tmp3 + tmp6; tmp129 = tmp3 - tmp6; tmp38 = tmp34 + tmp37; tmp115 = tmp34 - tmp37; tmp49 = tmp47 + tmp48; tmp95 = tmp48 - tmp47; tmp83 = tmp81 - tmp82; tmp105 = tmp81 + tmp82; } { fftw_real tmp25; fftw_real tmp74; fftw_real tmp72; fftw_real tmp124; fftw_real tmp28; fftw_real tmp69; fftw_real tmp77; fftw_real tmp125; ASSERT_ALIGNED_DOUBLE; { fftw_real tmp23; fftw_real tmp24; fftw_real tmp70; fftw_real tmp71; ASSERT_ALIGNED_DOUBLE; tmp23 = c_re(input[15 * istride]); tmp24 = c_re(input[7 * istride]); tmp25 = tmp23 + tmp24; tmp74 = tmp23 - tmp24; tmp70 = c_im(input[15 * istride]); tmp71 = c_im(input[7 * istride]); tmp72 = tmp70 - tmp71; tmp124 = tmp70 + tmp71; } { fftw_real tmp26; fftw_real tmp27; fftw_real tmp75; fftw_real tmp76; ASSERT_ALIGNED_DOUBLE; tmp26 = c_re(input[3 * istride]); tmp27 = c_re(input[11 * istride]); tmp28 = tmp26 + tmp27; tmp69 = tmp26 - tmp27; tmp75 = c_im(input[3 * istride]); tmp76 = c_im(input[11 * istride]); tmp77 = tmp75 - tmp76; tmp125 = tmp75 + tmp76; } tmp29 = tmp25 + tmp28; tmp123 = tmp25 - tmp28; tmp73 = tmp69 + tmp72; tmp101 = tmp72 - tmp69; tmp78 = tmp74 - tmp77; tmp102 = tmp74 + tmp77; tmp126 = tmp124 - tmp125; tmp141 = tmp124 + tmp125; } { fftw_real tmp10; fftw_real tmp50; fftw_real tmp41; fftw_real tmp51; fftw_real tmp13; fftw_real tmp54; fftw_real tmp44; fftw_real tmp53; ASSERT_ALIGNED_DOUBLE; { fftw_real tmp8; fftw_real tmp9; fftw_real tmp39; fftw_real tmp40; ASSERT_ALIGNED_DOUBLE; tmp8 = c_re(input[2 * istride]); tmp9 = c_re(input[10 * istride]); tmp10 = tmp8 + tmp9; tmp50 = tmp8 - tmp9; tmp39 = c_im(input[2 * istride]); tmp40 = c_im(input[10 * istride]); tmp41 = tmp39 + tmp40; tmp51 = tmp39 - tmp40; } { fftw_real tmp11; fftw_real tmp12; fftw_real tmp42; fftw_real tmp43; ASSERT_ALIGNED_DOUBLE; tmp11 = c_re(input[14 * istride]); tmp12 = c_re(input[6 * istride]); tmp13 = tmp11 + tmp12; tmp54 = tmp11 - tmp12; tmp42 = c_im(input[14 * istride]); tmp43 = c_im(input[6 * istride]); tmp44 = tmp42 + tmp43; tmp53 = tmp42 - tmp43; } tmp14 = tmp10 + tmp13; tmp116 = tmp10 - tmp13; tmp45 = tmp41 + tmp44; tmp130 = tmp44 - tmp41; tmp52 = tmp50 + tmp51; tmp84 = tmp50 - tmp51; tmp55 = tmp53 - tmp54; tmp85 = tmp54 + tmp53; } { fftw_real tmp18; fftw_real tmp63; fftw_real tmp61; fftw_real tmp119; fftw_real tmp21; fftw_real tmp58; fftw_real tmp66; fftw_real tmp120; ASSERT_ALIGNED_DOUBLE; { fftw_real tmp16; fftw_real tmp17; fftw_real tmp59; fftw_real tmp60; ASSERT_ALIGNED_DOUBLE; tmp16 = c_re(input[istride]); tmp17 = c_re(input[9 * istride]); tmp18 = tmp16 + tmp17; tmp63 = tmp16 - tmp17; tmp59 = c_im(input[istride]); tmp60 = c_im(input[9 * istride]); tmp61 = tmp59 - tmp60; tmp119 = tmp59 + tmp60; } { fftw_real tmp19; fftw_real tmp20; fftw_real tmp64; fftw_real tmp65; ASSERT_ALIGNED_DOUBLE; tmp19 = c_re(input[5 * istride]); tmp20 = c_re(input[13 * istride]); tmp21 = tmp19 + tmp20; tmp58 = tmp19 - tmp20; tmp64 = c_im(input[5 * istride]); tmp65 = c_im(input[13 * istride]); tmp66 = tmp64 - tmp65; tmp120 = tmp64 + tmp65; } tmp22 = tmp18 + tmp21; tmp118 = tmp18 - tmp21; tmp62 = tmp58 + tmp61; tmp98 = tmp61 - tmp58; tmp67 = tmp63 - tmp66; tmp99 = tmp63 + tmp66; tmp121 = tmp119 - tmp120; tmp140 = tmp119 + tmp120; } { fftw_real tmp15; fftw_real tmp30; fftw_real tmp31; fftw_real tmp46; ASSERT_ALIGNED_DOUBLE; tmp15 = tmp7 + tmp14; tmp30 = tmp22 + tmp29; c_re(output[8 * ostride]) = tmp15 - tmp30; c_re(output[0]) = tmp15 + tmp30; tmp31 = tmp22 - tmp29; tmp46 = tmp38 - tmp45; c_im(output[4 * ostride]) = tmp31 + tmp46; c_im(output[12 * ostride]) = tmp46 - tmp31; } { fftw_real tmp139; fftw_real tmp142; fftw_real tmp143; fftw_real tmp144; ASSERT_ALIGNED_DOUBLE; tmp139 = tmp38 + tmp45; tmp142 = tmp140 + tmp141; c_im(output[8 * ostride]) = tmp139 - tmp142; c_im(output[0]) = tmp139 + tmp142; tmp143 = tmp7 - tmp14; tmp144 = tmp141 - tmp140; c_re(output[12 * ostride]) = tmp143 - tmp144; c_re(output[4 * ostride]) = tmp143 + tmp144; } { fftw_real tmp117; fftw_real tmp131; fftw_real tmp128; fftw_real tmp132; fftw_real tmp122; fftw_real tmp127; ASSERT_ALIGNED_DOUBLE; tmp117 = tmp115 - tmp116; tmp131 = tmp129 + tmp130; tmp122 = tmp118 - tmp121; tmp127 = tmp123 + tmp126; tmp128 = K707106781 * (tmp122 - tmp127); tmp132 = K707106781 * (tmp122 + tmp127); c_im(output[14 * ostride]) = tmp117 - tmp128; c_im(output[6 * ostride]) = tmp117 + tmp128; c_re(output[10 * ostride]) = tmp131 - tmp132; c_re(output[2 * ostride]) = tmp131 + tmp132; } { fftw_real tmp133; fftw_real tmp137; fftw_real tmp136; fftw_real tmp138; fftw_real tmp134; fftw_real tmp135; ASSERT_ALIGNED_DOUBLE; tmp133 = tmp116 + tmp115; tmp137 = tmp129 - tmp130; tmp134 = tmp118 + tmp121; tmp135 = tmp126 - tmp123; tmp136 = K707106781 * (tmp134 + tmp135); tmp138 = K707106781 * (tmp135 - tmp134); c_im(output[10 * ostride]) = tmp133 - tmp136; c_im(output[2 * ostride]) = tmp133 + tmp136; c_re(output[14 * ostride]) = tmp137 - tmp138; c_re(output[6 * ostride]) = tmp137 + tmp138; } { fftw_real tmp57; fftw_real tmp89; fftw_real tmp92; fftw_real tmp94; fftw_real tmp87; fftw_real tmp93; fftw_real tmp80; fftw_real tmp88; ASSERT_ALIGNED_DOUBLE; { fftw_real tmp56; fftw_real tmp90; fftw_real tmp91; fftw_real tmp86; fftw_real tmp68; fftw_real tmp79; ASSERT_ALIGNED_DOUBLE; tmp56 = K707106781 * (tmp52 + tmp55); tmp57 = tmp49 + tmp56; tmp89 = tmp49 - tmp56; tmp90 = (K923879532 * tmp67) - (K382683432 * tmp62); tmp91 = (K382683432 * tmp73) + (K923879532 * tmp78); tmp92 = tmp90 - tmp91; tmp94 = tmp90 + tmp91; tmp86 = K707106781 * (tmp84 + tmp85); tmp87 = tmp83 - tmp86; tmp93 = tmp83 + tmp86; tmp68 = (K923879532 * tmp62) + (K382683432 * tmp67); tmp79 = (K923879532 * tmp73) - (K382683432 * tmp78); tmp80 = tmp68 + tmp79; tmp88 = tmp79 - tmp68; } c_im(output[9 * ostride]) = tmp57 - tmp80; c_im(output[ostride]) = tmp57 + tmp80; c_re(output[13 * ostride]) = tmp87 - tmp88; c_re(output[5 * ostride]) = tmp87 + tmp88; c_im(output[13 * ostride]) = tmp89 - tmp92; c_im(output[5 * ostride]) = tmp89 + tmp92; c_re(output[9 * ostride]) = tmp93 - tmp94; c_re(output[ostride]) = tmp93 + tmp94; } { fftw_real tmp97; fftw_real tmp109; fftw_real tmp112; fftw_real tmp114; fftw_real tmp107; fftw_real tmp113; fftw_real tmp104; fftw_real tmp108; ASSERT_ALIGNED_DOUBLE; { fftw_real tmp96; fftw_real tmp110; fftw_real tmp111; fftw_real tmp106; fftw_real tmp100; fftw_real tmp103; ASSERT_ALIGNED_DOUBLE; tmp96 = K707106781 * (tmp84 - tmp85); tmp97 = tmp95 + tmp96; tmp109 = tmp95 - tmp96; tmp110 = (K382683432 * tmp99) - (K923879532 * tmp98); tmp111 = (K923879532 * tmp101) + (K382683432 * tmp102); tmp112 = tmp110 - tmp111; tmp114 = tmp110 + tmp111; tmp106 = K707106781 * (tmp55 - tmp52); tmp107 = tmp105 - tmp106; tmp113 = tmp105 + tmp106; tmp100 = (K382683432 * tmp98) + (K923879532 * tmp99); tmp103 = (K382683432 * tmp101) - (K923879532 * tmp102); tmp104 = tmp100 + tmp103; tmp108 = tmp103 - tmp100; } c_im(output[11 * ostride]) = tmp97 - tmp104; c_im(output[3 * ostride]) = tmp97 + tmp104; c_re(output[15 * ostride]) = tmp107 - tmp108; c_re(output[7 * ostride]) = tmp107 + tmp108; c_im(output[15 * ostride]) = tmp109 - tmp112; c_im(output[7 * ostride]) = tmp109 + tmp112; c_re(output[11 * ostride]) = tmp113 - tmp114; c_re(output[3 * ostride]) = tmp113 + tmp114; } } fftw_codelet_desc fftwi_no_twiddle_16_desc = { "fftwi_no_twiddle_16", (void (*)()) fftwi_no_twiddle_16, 16, FFTW_BACKWARD, FFTW_NOTW, 364, 0, (const int *) 0, };