From 30755b92afeae5a5a32860b4f4297180f6d3398d Mon Sep 17 00:00:00 2001 From: John Glover Date: Mon, 18 Oct 2010 17:32:05 +0100 Subject: Moved project over to Git --- sndobj/rfftw/fhb_9.c | 564 +++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 564 insertions(+) create mode 100644 sndobj/rfftw/fhb_9.c (limited to 'sndobj/rfftw/fhb_9.c') diff --git a/sndobj/rfftw/fhb_9.c b/sndobj/rfftw/fhb_9.c new file mode 100644 index 0000000..6451692 --- /dev/null +++ b/sndobj/rfftw/fhb_9.c @@ -0,0 +1,564 @@ +/* + * Copyright (c) 1997-1999 Massachusetts Institute of Technology + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA + * + */ + +/* This file was automatically generated --- DO NOT EDIT */ +/* Generated on Sun Nov 7 20:45:14 EST 1999 */ + +#include +#include + +/* Generated by: ./genfft -magic-alignment-check -magic-twiddle-load-all -magic-variables 4 -magic-loopi -hc2hc-backward 9 */ + +/* + * This function contains 183 FP additions, 122 FP multiplications, + * (or, 130 additions, 69 multiplications, 53 fused multiply/add), + * 43 stack variables, and 72 memory accesses + */ +static const fftw_real K663413948 = FFTW_KONST(+0.663413948168938396205421319635891297216863310); +static const fftw_real K556670399 = FFTW_KONST(+0.556670399226419366452912952047023132968291906); +static const fftw_real K296198132 = FFTW_KONST(+0.296198132726023843175338011893050938967728390); +static const fftw_real K150383733 = FFTW_KONST(+0.150383733180435296639271897612501926072238258); +static const fftw_real K813797681 = FFTW_KONST(+0.813797681349373692844693217248393223289101568); +static const fftw_real K852868531 = FFTW_KONST(+0.852868531952443209628250963940074071936020296); +static const fftw_real K939692620 = FFTW_KONST(+0.939692620785908384054109277324731469936208134); +static const fftw_real K342020143 = FFTW_KONST(+0.342020143325668733044099614682259580763083368); +static const fftw_real K984807753 = FFTW_KONST(+0.984807753012208059366743024589523013670643252); +static const fftw_real K173648177 = FFTW_KONST(+0.173648177666930348851716626769314796000375677); +static const fftw_real K300767466 = FFTW_KONST(+0.300767466360870593278543795225003852144476517); +static const fftw_real K1_705737063 = FFTW_KONST(+1.705737063904886419256501927880148143872040591); +static const fftw_real K642787609 = FFTW_KONST(+0.642787609686539326322643409907263432907559884); +static const fftw_real K766044443 = FFTW_KONST(+0.766044443118978035202392650555416673935832457); +static const fftw_real K1_326827896 = FFTW_KONST(+1.326827896337876792410842639271782594433726619); +static const fftw_real K1_113340798 = FFTW_KONST(+1.113340798452838732905825904094046265936583811); +static const fftw_real K500000000 = FFTW_KONST(+0.500000000000000000000000000000000000000000000); +static const fftw_real K866025403 = FFTW_KONST(+0.866025403784438646763723170752936183471402627); +static const fftw_real K2_000000000 = FFTW_KONST(+2.000000000000000000000000000000000000000000000); +static const fftw_real K1_732050807 = FFTW_KONST(+1.732050807568877293527446341505872366942805254); + +/* + * Generator Id's : + * $Id: fhb_9.c,v 1.1.1.1 2006/05/12 15:14:46 veplaini Exp $ + * $Id: fhb_9.c,v 1.1.1.1 2006/05/12 15:14:46 veplaini Exp $ + * $Id: fhb_9.c,v 1.1.1.1 2006/05/12 15:14:46 veplaini Exp $ + */ + +void fftw_hc2hc_backward_9(fftw_real *A, const fftw_complex *W, int iostride, int m, int dist) +{ + int i; + fftw_real *X; + fftw_real *Y; + X = A; + Y = A + (9 * iostride); + { + fftw_real tmp153; + fftw_real tmp181; + fftw_real tmp175; + fftw_real tmp160; + fftw_real tmp163; + fftw_real tmp158; + fftw_real tmp167; + fftw_real tmp178; + fftw_real tmp170; + fftw_real tmp179; + fftw_real tmp159; + fftw_real tmp164; + ASSERT_ALIGNED_DOUBLE; + { + fftw_real tmp174; + fftw_real tmp151; + fftw_real tmp152; + fftw_real tmp172; + fftw_real tmp173; + ASSERT_ALIGNED_DOUBLE; + tmp173 = Y[-3 * iostride]; + tmp174 = K1_732050807 * tmp173; + tmp151 = X[0]; + tmp152 = X[3 * iostride]; + tmp172 = tmp152 - tmp151; + tmp153 = tmp151 + (K2_000000000 * tmp152); + tmp181 = tmp174 - tmp172; + tmp175 = tmp172 + tmp174; + } + { + fftw_real tmp154; + fftw_real tmp157; + fftw_real tmp168; + fftw_real tmp166; + fftw_real tmp165; + fftw_real tmp169; + ASSERT_ALIGNED_DOUBLE; + tmp154 = X[iostride]; + tmp160 = Y[-iostride]; + { + fftw_real tmp155; + fftw_real tmp156; + fftw_real tmp161; + fftw_real tmp162; + ASSERT_ALIGNED_DOUBLE; + tmp155 = X[4 * iostride]; + tmp156 = X[2 * iostride]; + tmp157 = tmp155 + tmp156; + tmp168 = K866025403 * (tmp155 - tmp156); + tmp161 = Y[-2 * iostride]; + tmp162 = Y[-4 * iostride]; + tmp163 = tmp161 - tmp162; + tmp166 = K866025403 * (tmp162 + tmp161); + } + tmp158 = tmp154 + tmp157; + tmp165 = tmp154 - (K500000000 * tmp157); + tmp167 = tmp165 - tmp166; + tmp178 = tmp165 + tmp166; + tmp169 = (K500000000 * tmp163) + tmp160; + tmp170 = tmp168 + tmp169; + tmp179 = tmp169 - tmp168; + } + X[0] = tmp153 + (K2_000000000 * tmp158); + tmp159 = tmp153 - tmp158; + tmp164 = K1_732050807 * (tmp160 - tmp163); + X[6 * iostride] = tmp159 + tmp164; + X[3 * iostride] = tmp159 - tmp164; + { + fftw_real tmp176; + fftw_real tmp171; + fftw_real tmp177; + fftw_real tmp183; + fftw_real tmp180; + fftw_real tmp182; + ASSERT_ALIGNED_DOUBLE; + tmp176 = (K1_113340798 * tmp167) + (K1_326827896 * tmp170); + tmp171 = (K766044443 * tmp167) - (K642787609 * tmp170); + tmp177 = tmp171 + tmp175; + X[iostride] = (K2_000000000 * tmp171) - tmp175; + X[7 * iostride] = tmp176 - tmp177; + X[4 * iostride] = -(tmp176 + tmp177); + tmp183 = (K1_705737063 * tmp178) + (K300767466 * tmp179); + tmp180 = (K173648177 * tmp178) - (K984807753 * tmp179); + tmp182 = tmp181 - tmp180; + X[2 * iostride] = (K2_000000000 * tmp180) + tmp181; + X[8 * iostride] = tmp183 + tmp182; + X[5 * iostride] = tmp182 - tmp183; + } + } + X = X + dist; + Y = Y - dist; + for (i = 2; i < m; i = i + 2, X = X + dist, Y = Y - dist, W = W + 8) { + fftw_real tmp43; + fftw_real tmp86; + fftw_real tmp134; + fftw_real tmp59; + fftw_real tmp106; + fftw_real tmp124; + fftw_real tmp48; + fftw_real tmp53; + fftw_real tmp54; + fftw_real tmp100; + fftw_real tmp108; + fftw_real tmp130; + fftw_real tmp136; + fftw_real tmp127; + fftw_real tmp135; + fftw_real tmp93; + fftw_real tmp107; + fftw_real tmp64; + fftw_real tmp69; + fftw_real tmp70; + ASSERT_ALIGNED_DOUBLE; + { + fftw_real tmp39; + fftw_real tmp55; + fftw_real tmp42; + fftw_real tmp104; + fftw_real tmp58; + fftw_real tmp85; + fftw_real tmp84; + fftw_real tmp105; + ASSERT_ALIGNED_DOUBLE; + tmp39 = X[0]; + tmp55 = Y[0]; + { + fftw_real tmp40; + fftw_real tmp41; + fftw_real tmp56; + fftw_real tmp57; + ASSERT_ALIGNED_DOUBLE; + tmp40 = X[3 * iostride]; + tmp41 = Y[-6 * iostride]; + tmp42 = tmp40 + tmp41; + tmp104 = K866025403 * (tmp40 - tmp41); + tmp56 = Y[-3 * iostride]; + tmp57 = X[6 * iostride]; + tmp58 = tmp56 - tmp57; + tmp85 = K866025403 * (tmp56 + tmp57); + } + tmp43 = tmp39 + tmp42; + tmp84 = tmp39 - (K500000000 * tmp42); + tmp86 = tmp84 - tmp85; + tmp134 = tmp84 + tmp85; + tmp59 = tmp55 + tmp58; + tmp105 = tmp55 - (K500000000 * tmp58); + tmp106 = tmp104 + tmp105; + tmp124 = tmp105 - tmp104; + } + { + fftw_real tmp44; + fftw_real tmp47; + fftw_real tmp87; + fftw_real tmp90; + fftw_real tmp60; + fftw_real tmp63; + fftw_real tmp88; + fftw_real tmp91; + fftw_real tmp49; + fftw_real tmp52; + fftw_real tmp94; + fftw_real tmp97; + fftw_real tmp65; + fftw_real tmp68; + fftw_real tmp95; + fftw_real tmp98; + ASSERT_ALIGNED_DOUBLE; + { + fftw_real tmp45; + fftw_real tmp46; + fftw_real tmp61; + fftw_real tmp62; + ASSERT_ALIGNED_DOUBLE; + tmp44 = X[iostride]; + tmp45 = X[4 * iostride]; + tmp46 = Y[-7 * iostride]; + tmp47 = tmp45 + tmp46; + tmp87 = tmp44 - (K500000000 * tmp47); + tmp90 = K866025403 * (tmp45 - tmp46); + tmp60 = Y[-iostride]; + tmp61 = Y[-4 * iostride]; + tmp62 = X[7 * iostride]; + tmp63 = tmp61 - tmp62; + tmp88 = K866025403 * (tmp61 + tmp62); + tmp91 = tmp60 - (K500000000 * tmp63); + } + { + fftw_real tmp50; + fftw_real tmp51; + fftw_real tmp66; + fftw_real tmp67; + ASSERT_ALIGNED_DOUBLE; + tmp49 = X[2 * iostride]; + tmp50 = Y[-5 * iostride]; + tmp51 = Y[-8 * iostride]; + tmp52 = tmp50 + tmp51; + tmp94 = tmp49 - (K500000000 * tmp52); + tmp97 = K866025403 * (tmp50 - tmp51); + tmp65 = Y[-2 * iostride]; + tmp66 = X[5 * iostride]; + tmp67 = X[8 * iostride]; + tmp68 = tmp66 + tmp67; + tmp95 = K866025403 * (tmp66 - tmp67); + tmp98 = tmp65 + (K500000000 * tmp68); + } + tmp48 = tmp44 + tmp47; + tmp53 = tmp49 + tmp52; + tmp54 = tmp48 + tmp53; + { + fftw_real tmp96; + fftw_real tmp99; + fftw_real tmp128; + fftw_real tmp129; + ASSERT_ALIGNED_DOUBLE; + tmp96 = tmp94 + tmp95; + tmp99 = tmp97 + tmp98; + tmp100 = (K173648177 * tmp96) - (K984807753 * tmp99); + tmp108 = (K984807753 * tmp96) + (K173648177 * tmp99); + tmp128 = tmp94 - tmp95; + tmp129 = tmp98 - tmp97; + tmp130 = (K342020143 * tmp128) - (K939692620 * tmp129); + tmp136 = (K939692620 * tmp128) + (K342020143 * tmp129); + } + { + fftw_real tmp125; + fftw_real tmp126; + fftw_real tmp89; + fftw_real tmp92; + ASSERT_ALIGNED_DOUBLE; + tmp125 = tmp91 - tmp90; + tmp126 = tmp87 + tmp88; + tmp127 = (K173648177 * tmp125) + (K984807753 * tmp126); + tmp135 = (K173648177 * tmp126) - (K984807753 * tmp125); + tmp89 = tmp87 - tmp88; + tmp92 = tmp90 + tmp91; + tmp93 = (K766044443 * tmp89) - (K642787609 * tmp92); + tmp107 = (K766044443 * tmp92) + (K642787609 * tmp89); + tmp64 = tmp60 + tmp63; + tmp69 = tmp65 - tmp68; + tmp70 = tmp64 + tmp69; + } + } + X[0] = tmp43 + tmp54; + { + fftw_real tmp74; + fftw_real tmp80; + fftw_real tmp78; + fftw_real tmp82; + ASSERT_ALIGNED_DOUBLE; + { + fftw_real tmp72; + fftw_real tmp73; + fftw_real tmp76; + fftw_real tmp77; + ASSERT_ALIGNED_DOUBLE; + tmp72 = tmp59 - (K500000000 * tmp70); + tmp73 = K866025403 * (tmp48 - tmp53); + tmp74 = tmp72 - tmp73; + tmp80 = tmp73 + tmp72; + tmp76 = tmp43 - (K500000000 * tmp54); + tmp77 = K866025403 * (tmp69 - tmp64); + tmp78 = tmp76 - tmp77; + tmp82 = tmp76 + tmp77; + } + { + fftw_real tmp71; + fftw_real tmp75; + fftw_real tmp79; + fftw_real tmp81; + ASSERT_ALIGNED_DOUBLE; + tmp71 = c_re(W[5]); + tmp75 = c_im(W[5]); + Y[-2 * iostride] = (tmp71 * tmp74) - (tmp75 * tmp78); + X[6 * iostride] = (tmp75 * tmp74) + (tmp71 * tmp78); + tmp79 = c_re(W[2]); + tmp81 = c_im(W[2]); + Y[-5 * iostride] = (tmp79 * tmp80) - (tmp81 * tmp82); + X[3 * iostride] = (tmp81 * tmp80) + (tmp79 * tmp82); + } + } + Y[-8 * iostride] = tmp59 + tmp70; + { + fftw_real tmp113; + fftw_real tmp102; + fftw_real tmp116; + fftw_real tmp117; + fftw_real tmp110; + fftw_real tmp112; + fftw_real tmp101; + fftw_real tmp109; + fftw_real tmp83; + fftw_real tmp103; + ASSERT_ALIGNED_DOUBLE; + tmp113 = K866025403 * (tmp93 - tmp100); + tmp101 = tmp93 + tmp100; + tmp102 = tmp86 + tmp101; + tmp116 = tmp86 - (K500000000 * tmp101); + tmp117 = K866025403 * (tmp108 - tmp107); + tmp109 = tmp107 + tmp108; + tmp110 = tmp106 + tmp109; + tmp112 = tmp106 - (K500000000 * tmp109); + tmp83 = c_re(W[0]); + tmp103 = c_im(W[0]); + X[iostride] = (tmp83 * tmp102) + (tmp103 * tmp110); + Y[-7 * iostride] = (tmp83 * tmp110) - (tmp103 * tmp102); + { + fftw_real tmp120; + fftw_real tmp122; + fftw_real tmp119; + fftw_real tmp121; + ASSERT_ALIGNED_DOUBLE; + tmp120 = tmp113 + tmp112; + tmp122 = tmp116 + tmp117; + tmp119 = c_re(W[3]); + tmp121 = c_im(W[3]); + Y[-4 * iostride] = (tmp119 * tmp120) - (tmp121 * tmp122); + X[4 * iostride] = (tmp121 * tmp120) + (tmp119 * tmp122); + } + { + fftw_real tmp114; + fftw_real tmp118; + fftw_real tmp111; + fftw_real tmp115; + ASSERT_ALIGNED_DOUBLE; + tmp114 = tmp112 - tmp113; + tmp118 = tmp116 - tmp117; + tmp111 = c_re(W[6]); + tmp115 = c_im(W[6]); + Y[-iostride] = (tmp111 * tmp114) - (tmp115 * tmp118); + X[7 * iostride] = (tmp115 * tmp114) + (tmp111 * tmp118); + } + } + { + fftw_real tmp141; + fftw_real tmp132; + fftw_real tmp144; + fftw_real tmp145; + fftw_real tmp138; + fftw_real tmp140; + fftw_real tmp131; + fftw_real tmp137; + fftw_real tmp123; + fftw_real tmp133; + ASSERT_ALIGNED_DOUBLE; + tmp141 = K866025403 * (tmp130 - tmp127); + tmp131 = tmp127 + tmp130; + tmp132 = tmp124 + tmp131; + tmp144 = tmp124 - (K500000000 * tmp131); + tmp145 = K866025403 * (tmp135 + tmp136); + tmp137 = tmp135 - tmp136; + tmp138 = tmp134 + tmp137; + tmp140 = tmp134 - (K500000000 * tmp137); + tmp123 = c_re(W[1]); + tmp133 = c_im(W[1]); + Y[-6 * iostride] = (tmp123 * tmp132) - (tmp133 * tmp138); + X[2 * iostride] = (tmp133 * tmp132) + (tmp123 * tmp138); + { + fftw_real tmp148; + fftw_real tmp150; + fftw_real tmp147; + fftw_real tmp149; + ASSERT_ALIGNED_DOUBLE; + tmp148 = tmp141 + tmp140; + tmp150 = tmp144 + tmp145; + tmp147 = c_re(W[4]); + tmp149 = c_im(W[4]); + X[5 * iostride] = (tmp147 * tmp148) + (tmp149 * tmp150); + Y[-3 * iostride] = (tmp147 * tmp150) - (tmp149 * tmp148); + } + { + fftw_real tmp142; + fftw_real tmp146; + fftw_real tmp139; + fftw_real tmp143; + ASSERT_ALIGNED_DOUBLE; + tmp142 = tmp140 - tmp141; + tmp146 = tmp144 - tmp145; + tmp139 = c_re(W[7]); + tmp143 = c_im(W[7]); + X[8 * iostride] = (tmp139 * tmp142) + (tmp143 * tmp146); + Y[0] = (tmp139 * tmp146) - (tmp143 * tmp142); + } + } + } + if (i == m) { + fftw_real tmp3; + fftw_real tmp31; + fftw_real tmp28; + fftw_real tmp17; + fftw_real tmp34; + fftw_real tmp7; + fftw_real tmp33; + fftw_real tmp23; + fftw_real tmp20; + fftw_real tmp35; + fftw_real tmp12; + fftw_real tmp14; + fftw_real tmp32; + fftw_real tmp8; + ASSERT_ALIGNED_DOUBLE; + { + fftw_real tmp27; + fftw_real tmp1; + fftw_real tmp2; + fftw_real tmp25; + fftw_real tmp26; + ASSERT_ALIGNED_DOUBLE; + tmp26 = Y[-iostride]; + tmp27 = K1_732050807 * tmp26; + tmp1 = X[4 * iostride]; + tmp2 = X[iostride]; + tmp25 = tmp2 - tmp1; + tmp3 = tmp1 + (K2_000000000 * tmp2); + tmp31 = tmp25 - tmp27; + tmp28 = tmp25 + tmp27; + } + { + fftw_real tmp4; + fftw_real tmp6; + fftw_real tmp5; + fftw_real tmp13; + fftw_real tmp15; + fftw_real tmp18; + fftw_real tmp22; + fftw_real tmp9; + fftw_real tmp11; + fftw_real tmp10; + fftw_real tmp21; + fftw_real tmp19; + fftw_real tmp16; + ASSERT_ALIGNED_DOUBLE; + tmp4 = X[3 * iostride]; + tmp6 = X[2 * iostride]; + tmp5 = X[0]; + tmp13 = K500000000 * (tmp5 + tmp6); + tmp15 = K866025403 * (tmp6 - tmp5); + tmp18 = K866025403 * (tmp4 - tmp5); + tmp22 = K500000000 * (tmp4 + tmp5); + tmp9 = Y[-2 * iostride]; + tmp11 = Y[0]; + tmp10 = Y[-3 * iostride]; + tmp21 = K866025403 * (tmp11 - tmp10); + tmp19 = (K500000000 * (tmp11 + tmp10)) + tmp9; + tmp16 = (K500000000 * (tmp9 - tmp11)) + tmp10; + tmp17 = tmp15 - tmp16; + tmp34 = tmp15 + tmp16; + tmp7 = tmp4 + tmp5 + tmp6; + tmp33 = tmp22 + tmp21 - tmp6; + tmp23 = (tmp6 + tmp21) - tmp22; + tmp20 = tmp18 - tmp19; + tmp35 = tmp18 + tmp19; + tmp12 = (K1_732050807 * (tmp9 - tmp10)) - (K1_732050807 * tmp11); + tmp14 = tmp4 - (K866025403 * (tmp11 + tmp9)) - tmp13; + tmp32 = tmp13 - (K866025403 * (tmp11 + tmp9)) - tmp4; + } + X[0] = tmp3 + (K2_000000000 * tmp7); + tmp8 = tmp7 - tmp3; + X[3 * iostride] = tmp8 + tmp12; + X[6 * iostride] = tmp12 - tmp8; + { + fftw_real tmp30; + fftw_real tmp24; + fftw_real tmp29; + fftw_real tmp38; + fftw_real tmp36; + fftw_real tmp37; + ASSERT_ALIGNED_DOUBLE; + tmp30 = (K852868531 * tmp14) + (K813797681 * tmp20) + (K150383733 * tmp17) - (K296198132 * tmp23); + tmp24 = (K173648177 * tmp14) - (K984807753 * tmp17) - (K342020143 * tmp20) - (K939692620 * tmp23); + tmp29 = tmp28 + (K500000000 * tmp24); + X[2 * iostride] = tmp24 - tmp28; + X[8 * iostride] = tmp30 - tmp29; + X[5 * iostride] = tmp29 + tmp30; + tmp38 = (K556670399 * tmp32) + (K663413948 * tmp34) - (K150383733 * tmp35) - (K852868531 * tmp33); + tmp36 = (K766044443 * tmp32) + (K173648177 * tmp33) - (K642787609 * tmp34) - (K984807753 * tmp35); + tmp37 = (K500000000 * tmp36) - tmp31; + X[iostride] = tmp31 + tmp36; + X[7 * iostride] = tmp38 - tmp37; + X[4 * iostride] = tmp37 + tmp38; + } + } +} + +static const int twiddle_order[] = +{1, 2, 3, 4, 5, 6, 7, 8}; +fftw_codelet_desc fftw_hc2hc_backward_9_desc = +{ + "fftw_hc2hc_backward_9", + (void (*)()) fftw_hc2hc_backward_9, + 9, + FFTW_BACKWARD, + FFTW_HC2HC, + 212, + 8, + twiddle_order, +}; -- cgit v1.2.3