1 /*
2  * Copyright (c) 1997-1999, 2003 Massachusetts Institute of Technology
3  *
4  * This program is free software; you can redistribute it and/or modify
5  * it under the terms of the GNU General Public License as published by
6  * the Free Software Foundation; either version 2 of the License, or
7  * (at your option) any later version.
8  *
9  * This program is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12  * GNU General Public License for more details.
13  *
14  * You should have received a copy of the GNU General Public License
15  * along with this program; if not, write to the Free Software
16  * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
17  *
18  */
19 
20 /* This file was automatically generated --- DO NOT EDIT */
21 /* Generated on Mon Mar 24 02:07:51 EST 2003 */
22 
23 #include "fftw-int.h"
24 #include "fftw.h"
25 
26 /* Generated by: /homee/stevenj/cvs/fftw/gensrc/genfft -magic-alignment-check -magic-twiddle-load-all -magic-variables 4 -magic-loopi -hc2hc-forward 6 */
27 
28 /*
29  * This function contains 72 FP additions, 36 FP multiplications,
30  * (or, 54 additions, 18 multiplications, 18 fused multiply/add),
31  * 23 stack variables, and 48 memory accesses
32  */
33 static const fftw_real K500000000 =
34 FFTW_KONST(+0.500000000000000000000000000000000000000000000);
35 static const fftw_real K866025403 =
36 FFTW_KONST(+0.866025403784438646763723170752936183471402627);
37 
38 /*
39  * Generator Id's :
40  * $Id: exprdag.ml,v 1.43 2003/03/16 23:43:46 stevenj Exp $
41  * $Id: fft.ml,v 1.44 2003/03/16 23:43:46 stevenj Exp $
42  * $Id: to_c.ml,v 1.26 2003/03/16 23:43:46 stevenj Exp $
43  */
44 
fftw_hc2hc_forward_6(fftw_real * A,const fftw_complex * W,int iostride,int m,int dist)45 void fftw_hc2hc_forward_6(fftw_real *A, const fftw_complex *W,
46 			  int iostride, int m, int dist)
47 {
48      int i;
49      fftw_real *X;
50      fftw_real *Y;
51      X = A;
52      Y = A + (6 * iostride);
53      {
54 	  fftw_real tmp71;
55 	  fftw_real tmp81;
56 	  fftw_real tmp77;
57 	  fftw_real tmp79;
58 	  fftw_real tmp74;
59 	  fftw_real tmp80;
60 	  fftw_real tmp69;
61 	  fftw_real tmp70;
62 	  fftw_real tmp78;
63 	  fftw_real tmp82;
64 	  ASSERT_ALIGNED_DOUBLE;
65 	  tmp69 = X[0];
66 	  tmp70 = X[3 * iostride];
67 	  tmp71 = tmp69 - tmp70;
68 	  tmp81 = tmp69 + tmp70;
69 	  {
70 	       fftw_real tmp75;
71 	       fftw_real tmp76;
72 	       fftw_real tmp72;
73 	       fftw_real tmp73;
74 	       ASSERT_ALIGNED_DOUBLE;
75 	       tmp75 = X[4 * iostride];
76 	       tmp76 = X[iostride];
77 	       tmp77 = tmp75 - tmp76;
78 	       tmp79 = tmp75 + tmp76;
79 	       tmp72 = X[2 * iostride];
80 	       tmp73 = X[5 * iostride];
81 	       tmp74 = tmp72 - tmp73;
82 	       tmp80 = tmp72 + tmp73;
83 	  }
84 	  Y[-iostride] = K866025403 * (tmp77 - tmp74);
85 	  tmp78 = tmp74 + tmp77;
86 	  X[iostride] = tmp71 - (K500000000 * tmp78);
87 	  X[3 * iostride] = tmp71 + tmp78;
88 	  Y[-2 * iostride] = -(K866025403 * (tmp79 - tmp80));
89 	  tmp82 = tmp80 + tmp79;
90 	  X[2 * iostride] = tmp81 - (K500000000 * tmp82);
91 	  X[0] = tmp81 + tmp82;
92      }
93      X = X + dist;
94      Y = Y - dist;
95      for (i = 2; i < m; i = i + 2, X = X + dist, Y = Y - dist, W = W + 5) {
96 	  fftw_real tmp19;
97 	  fftw_real tmp43;
98 	  fftw_real tmp62;
99 	  fftw_real tmp66;
100 	  fftw_real tmp41;
101 	  fftw_real tmp45;
102 	  fftw_real tmp53;
103 	  fftw_real tmp57;
104 	  fftw_real tmp30;
105 	  fftw_real tmp44;
106 	  fftw_real tmp50;
107 	  fftw_real tmp56;
108 	  ASSERT_ALIGNED_DOUBLE;
109 	  {
110 	       fftw_real tmp13;
111 	       fftw_real tmp61;
112 	       fftw_real tmp18;
113 	       fftw_real tmp60;
114 	       ASSERT_ALIGNED_DOUBLE;
115 	       tmp13 = X[0];
116 	       tmp61 = Y[-5 * iostride];
117 	       {
118 		    fftw_real tmp15;
119 		    fftw_real tmp17;
120 		    fftw_real tmp14;
121 		    fftw_real tmp16;
122 		    ASSERT_ALIGNED_DOUBLE;
123 		    tmp15 = X[3 * iostride];
124 		    tmp17 = Y[-2 * iostride];
125 		    tmp14 = c_re(W[2]);
126 		    tmp16 = c_im(W[2]);
127 		    tmp18 = (tmp14 * tmp15) - (tmp16 * tmp17);
128 		    tmp60 = (tmp16 * tmp15) + (tmp14 * tmp17);
129 	       }
130 	       tmp19 = tmp13 - tmp18;
131 	       tmp43 = tmp13 + tmp18;
132 	       tmp62 = tmp60 + tmp61;
133 	       tmp66 = tmp61 - tmp60;
134 	  }
135 	  {
136 	       fftw_real tmp35;
137 	       fftw_real tmp51;
138 	       fftw_real tmp40;
139 	       fftw_real tmp52;
140 	       ASSERT_ALIGNED_DOUBLE;
141 	       {
142 		    fftw_real tmp32;
143 		    fftw_real tmp34;
144 		    fftw_real tmp31;
145 		    fftw_real tmp33;
146 		    ASSERT_ALIGNED_DOUBLE;
147 		    tmp32 = X[4 * iostride];
148 		    tmp34 = Y[-iostride];
149 		    tmp31 = c_re(W[3]);
150 		    tmp33 = c_im(W[3]);
151 		    tmp35 = (tmp31 * tmp32) - (tmp33 * tmp34);
152 		    tmp51 = (tmp33 * tmp32) + (tmp31 * tmp34);
153 	       }
154 	       {
155 		    fftw_real tmp37;
156 		    fftw_real tmp39;
157 		    fftw_real tmp36;
158 		    fftw_real tmp38;
159 		    ASSERT_ALIGNED_DOUBLE;
160 		    tmp37 = X[iostride];
161 		    tmp39 = Y[-4 * iostride];
162 		    tmp36 = c_re(W[0]);
163 		    tmp38 = c_im(W[0]);
164 		    tmp40 = (tmp36 * tmp37) - (tmp38 * tmp39);
165 		    tmp52 = (tmp38 * tmp37) + (tmp36 * tmp39);
166 	       }
167 	       tmp41 = tmp35 - tmp40;
168 	       tmp45 = tmp35 + tmp40;
169 	       tmp53 = tmp51 + tmp52;
170 	       tmp57 = tmp51 - tmp52;
171 	  }
172 	  {
173 	       fftw_real tmp24;
174 	       fftw_real tmp48;
175 	       fftw_real tmp29;
176 	       fftw_real tmp49;
177 	       ASSERT_ALIGNED_DOUBLE;
178 	       {
179 		    fftw_real tmp21;
180 		    fftw_real tmp23;
181 		    fftw_real tmp20;
182 		    fftw_real tmp22;
183 		    ASSERT_ALIGNED_DOUBLE;
184 		    tmp21 = X[2 * iostride];
185 		    tmp23 = Y[-3 * iostride];
186 		    tmp20 = c_re(W[1]);
187 		    tmp22 = c_im(W[1]);
188 		    tmp24 = (tmp20 * tmp21) - (tmp22 * tmp23);
189 		    tmp48 = (tmp22 * tmp21) + (tmp20 * tmp23);
190 	       }
191 	       {
192 		    fftw_real tmp26;
193 		    fftw_real tmp28;
194 		    fftw_real tmp25;
195 		    fftw_real tmp27;
196 		    ASSERT_ALIGNED_DOUBLE;
197 		    tmp26 = X[5 * iostride];
198 		    tmp28 = Y[0];
199 		    tmp25 = c_re(W[4]);
200 		    tmp27 = c_im(W[4]);
201 		    tmp29 = (tmp25 * tmp26) - (tmp27 * tmp28);
202 		    tmp49 = (tmp27 * tmp26) + (tmp25 * tmp28);
203 	       }
204 	       tmp30 = tmp24 - tmp29;
205 	       tmp44 = tmp24 + tmp29;
206 	       tmp50 = tmp48 + tmp49;
207 	       tmp56 = tmp48 - tmp49;
208 	  }
209 	  {
210 	       fftw_real tmp58;
211 	       fftw_real tmp42;
212 	       fftw_real tmp55;
213 	       fftw_real tmp68;
214 	       fftw_real tmp65;
215 	       fftw_real tmp67;
216 	       ASSERT_ALIGNED_DOUBLE;
217 	       tmp58 = K866025403 * (tmp56 - tmp57);
218 	       tmp42 = tmp30 + tmp41;
219 	       tmp55 = tmp19 - (K500000000 * tmp42);
220 	       Y[-3 * iostride] = tmp19 + tmp42;
221 	       X[iostride] = tmp55 + tmp58;
222 	       Y[-5 * iostride] = tmp55 - tmp58;
223 	       tmp68 = K866025403 * (tmp41 - tmp30);
224 	       tmp65 = tmp56 + tmp57;
225 	       tmp67 = tmp66 - (K500000000 * tmp65);
226 	       X[3 * iostride] = -(tmp65 + tmp66);
227 	       Y[-iostride] = tmp68 + tmp67;
228 	       X[5 * iostride] = -(tmp67 - tmp68);
229 	  }
230 	  {
231 	       fftw_real tmp54;
232 	       fftw_real tmp46;
233 	       fftw_real tmp47;
234 	       fftw_real tmp63;
235 	       fftw_real tmp59;
236 	       fftw_real tmp64;
237 	       ASSERT_ALIGNED_DOUBLE;
238 	       tmp54 = K866025403 * (tmp50 - tmp53);
239 	       tmp46 = tmp44 + tmp45;
240 	       tmp47 = tmp43 - (K500000000 * tmp46);
241 	       X[0] = tmp43 + tmp46;
242 	       Y[-4 * iostride] = tmp47 + tmp54;
243 	       X[2 * iostride] = tmp47 - tmp54;
244 	       tmp63 = K866025403 * (tmp45 - tmp44);
245 	       tmp59 = tmp50 + tmp53;
246 	       tmp64 = tmp62 - (K500000000 * tmp59);
247 	       Y[0] = tmp59 + tmp62;
248 	       Y[-2 * iostride] = tmp64 - tmp63;
249 	       X[4 * iostride] = -(tmp63 + tmp64);
250 	  }
251      }
252      if (i == m) {
253 	  fftw_real tmp1;
254 	  fftw_real tmp11;
255 	  fftw_real tmp4;
256 	  fftw_real tmp9;
257 	  fftw_real tmp8;
258 	  fftw_real tmp10;
259 	  fftw_real tmp5;
260 	  fftw_real tmp12;
261 	  ASSERT_ALIGNED_DOUBLE;
262 	  tmp1 = X[0];
263 	  tmp11 = X[3 * iostride];
264 	  {
265 	       fftw_real tmp2;
266 	       fftw_real tmp3;
267 	       fftw_real tmp6;
268 	       fftw_real tmp7;
269 	       ASSERT_ALIGNED_DOUBLE;
270 	       tmp2 = X[2 * iostride];
271 	       tmp3 = X[4 * iostride];
272 	       tmp4 = tmp2 - tmp3;
273 	       tmp9 = K866025403 * (tmp2 + tmp3);
274 	       tmp6 = X[iostride];
275 	       tmp7 = X[5 * iostride];
276 	       tmp8 = K866025403 * (tmp6 - tmp7);
277 	       tmp10 = tmp6 + tmp7;
278 	  }
279 	  X[iostride] = tmp1 - tmp4;
280 	  tmp5 = tmp1 + (K500000000 * tmp4);
281 	  X[2 * iostride] = tmp5 - tmp8;
282 	  X[0] = tmp5 + tmp8;
283 	  Y[-iostride] = tmp11 - tmp10;
284 	  tmp12 = (K500000000 * tmp10) + tmp11;
285 	  Y[0] = -(tmp9 + tmp12);
286 	  Y[-2 * iostride] = tmp9 - tmp12;
287      }
288 }
289 
290 static const int twiddle_order[] = { 1, 2, 3, 4, 5 };
291 fftw_codelet_desc fftw_hc2hc_forward_6_desc = {
292      "fftw_hc2hc_forward_6",
293      (void (*)()) fftw_hc2hc_forward_6,
294      6,
295      FFTW_FORWARD,
296      FFTW_HC2HC,
297      135,
298      5,
299      twiddle_order,
300 };
301