/*
 * Copyright (c) 1997-1999, 2003 Massachusetts Institute of Technology
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 *
 */
19
/* This file was automatically generated --- DO NOT EDIT */
/* Generated on Mon Mar 24 02:07:41 EST 2003 */
22
23 #include "fftw-int.h"
24 #include "fftw.h"
25
/* Generated by: /homee/stevenj/cvs/fftw/gensrc/genfft -magic-alignment-check -magic-twiddle-load-all -magic-variables 4 -magic-loopi -twiddle 10 */
27
/*
 * This function contains 102 FP additions, 60 FP multiplications,
 * (or, 72 additions, 30 multiplications, 30 fused multiply/add),
 * 42 stack variables, and 40 memory accesses
 */
33 static const fftw_real K587785252 =
34 FFTW_KONST(+0.587785252292473129168705954639072768597652438);
35 static const fftw_real K951056516 =
36 FFTW_KONST(+0.951056516295153572116439333379382143405698634);
37 static const fftw_real K250000000 =
38 FFTW_KONST(+0.250000000000000000000000000000000000000000000);
39 static const fftw_real K559016994 =
40 FFTW_KONST(+0.559016994374947424102293417182819058860154590);
41
/*
 * Generator Id's :
 * $Id: exprdag.ml,v 1.43 2003/03/16 23:43:46 stevenj Exp $
 * $Id: fft.ml,v 1.44 2003/03/16 23:43:46 stevenj Exp $
 * $Id: to_c.ml,v 1.26 2003/03/16 23:43:46 stevenj Exp $
 */
48
/*
 * fftw_twiddle_10 -- in-place size-10 twiddle codelet (machine generated).
 *
 * For each of the m iterations the routine:
 *   1. loads the ten complex values inout[k * iostride], k = 0..9;
 *   2. multiplies value k (k = 1..9) by the twiddle factor W[k - 1] as a
 *      complex product (value 0 is used unscaled);
 *   3. pairs value k with value k + 5 into a sum and a difference, then
 *      combines those terms using K559016994, K250000000, K951056516
 *      and K587785252; and
 *   4. stores the ten results back to the same ten locations.
 * After every iteration inout advances by dist elements and W by 9.
 *
 * Parameters:
 *   A        - first element of the data; transformed in place.
 *   W        - twiddle factors; 9 are read per iteration, none written.
 *   iostride - element distance between the ten values of one iteration.
 *   m        - iteration count; the loop body never runs when m <= 0.
 *   dist     - element distance between consecutive iterations.
 *
 * The tmpN names, the expression shapes and the statement order are kept
 * exactly as the generator emitted them so that the floating-point
 * evaluation is unchanged.
 */
void fftw_twiddle_10(fftw_complex *A, const fftw_complex *W, int iostride,
                     int m, int dist)
{
    int i;
    fftw_complex *inout;
    inout = A;
    for (i = m; i > 0; i = i - 1, inout = inout + dist, W = W + 9) {
        fftw_real tmp7;
        fftw_real tmp55;
        fftw_real tmp100;
        fftw_real tmp112;
        fftw_real tmp41;
        fftw_real tmp52;
        fftw_real tmp53;
        fftw_real tmp59;
        fftw_real tmp60;
        fftw_real tmp61;
        fftw_real tmp75;
        fftw_real tmp78;
        fftw_real tmp110;
        fftw_real tmp86;
        fftw_real tmp87;
        fftw_real tmp96;
        fftw_real tmp18;
        fftw_real tmp29;
        fftw_real tmp30;
        fftw_real tmp56;
        fftw_real tmp57;
        fftw_real tmp58;
        fftw_real tmp68;
        fftw_real tmp71;
        fftw_real tmp109;
        fftw_real tmp89;
        fftw_real tmp90;
        fftw_real tmp95;
        ASSERT_ALIGNED_DOUBLE;
        /*
         * Value 0 and twiddled value 5: difference in (tmp7, tmp112),
         * sum in (tmp55, tmp100), as (real, imaginary).
         */
        {
            fftw_real tmp1;
            fftw_real tmp99;
            fftw_real tmp6;
            fftw_real tmp98;
            ASSERT_ALIGNED_DOUBLE;
            tmp1 = c_re(inout[0]);
            tmp99 = c_im(inout[0]);
            {
                fftw_real tmp3;
                fftw_real tmp5;
                fftw_real tmp2;
                fftw_real tmp4;
                ASSERT_ALIGNED_DOUBLE;
                tmp3 = c_re(inout[5 * iostride]);
                tmp5 = c_im(inout[5 * iostride]);
                tmp2 = c_re(W[4]);
                tmp4 = c_im(W[4]);
                tmp6 = (tmp2 * tmp3) - (tmp4 * tmp5);
                tmp98 = (tmp4 * tmp3) + (tmp2 * tmp5);
            }
            tmp7 = tmp1 - tmp6;
            tmp55 = tmp1 + tmp6;
            tmp100 = tmp98 + tmp99;
            tmp112 = tmp99 - tmp98;
        }
        /*
         * Twiddled values 4, 1, 9 and 6, paired as (4, 9) and (6, 1):
         * differences, sums, and the totals of each.
         */
        {
            fftw_real tmp35;
            fftw_real tmp73;
            fftw_real tmp51;
            fftw_real tmp77;
            fftw_real tmp40;
            fftw_real tmp74;
            fftw_real tmp46;
            fftw_real tmp76;
            ASSERT_ALIGNED_DOUBLE;
            {
                fftw_real tmp32;
                fftw_real tmp34;
                fftw_real tmp31;
                fftw_real tmp33;
                ASSERT_ALIGNED_DOUBLE;
                tmp32 = c_re(inout[4 * iostride]);
                tmp34 = c_im(inout[4 * iostride]);
                tmp31 = c_re(W[3]);
                tmp33 = c_im(W[3]);
                tmp35 = (tmp31 * tmp32) - (tmp33 * tmp34);
                tmp73 = (tmp33 * tmp32) + (tmp31 * tmp34);
            }
            {
                fftw_real tmp48;
                fftw_real tmp50;
                fftw_real tmp47;
                fftw_real tmp49;
                ASSERT_ALIGNED_DOUBLE;
                tmp48 = c_re(inout[iostride]);
                tmp50 = c_im(inout[iostride]);
                tmp47 = c_re(W[0]);
                tmp49 = c_im(W[0]);
                tmp51 = (tmp47 * tmp48) - (tmp49 * tmp50);
                tmp77 = (tmp49 * tmp48) + (tmp47 * tmp50);
            }
            {
                fftw_real tmp37;
                fftw_real tmp39;
                fftw_real tmp36;
                fftw_real tmp38;
                ASSERT_ALIGNED_DOUBLE;
                tmp37 = c_re(inout[9 * iostride]);
                tmp39 = c_im(inout[9 * iostride]);
                tmp36 = c_re(W[8]);
                tmp38 = c_im(W[8]);
                tmp40 = (tmp36 * tmp37) - (tmp38 * tmp39);
                tmp74 = (tmp38 * tmp37) + (tmp36 * tmp39);
            }
            {
                fftw_real tmp43;
                fftw_real tmp45;
                fftw_real tmp42;
                fftw_real tmp44;
                ASSERT_ALIGNED_DOUBLE;
                tmp43 = c_re(inout[6 * iostride]);
                tmp45 = c_im(inout[6 * iostride]);
                tmp42 = c_re(W[5]);
                tmp44 = c_im(W[5]);
                tmp46 = (tmp42 * tmp43) - (tmp44 * tmp45);
                tmp76 = (tmp44 * tmp43) + (tmp42 * tmp45);
            }
            tmp41 = tmp35 - tmp40;
            tmp52 = tmp46 - tmp51;
            tmp53 = tmp41 + tmp52;
            tmp59 = tmp35 + tmp40;
            tmp60 = tmp46 + tmp51;
            tmp61 = tmp59 + tmp60;
            tmp75 = tmp73 - tmp74;
            tmp78 = tmp76 - tmp77;
            tmp110 = tmp75 + tmp78;
            tmp86 = tmp73 + tmp74;
            tmp87 = tmp76 + tmp77;
            tmp96 = tmp86 + tmp87;
        }
        /*
         * Twiddled values 2, 3, 7 and 8, paired as (2, 7) and (8, 3):
         * differences, sums, and the totals of each.
         */
        {
            fftw_real tmp12;
            fftw_real tmp66;
            fftw_real tmp28;
            fftw_real tmp70;
            fftw_real tmp17;
            fftw_real tmp67;
            fftw_real tmp23;
            fftw_real tmp69;
            ASSERT_ALIGNED_DOUBLE;
            {
                fftw_real tmp9;
                fftw_real tmp11;
                fftw_real tmp8;
                fftw_real tmp10;
                ASSERT_ALIGNED_DOUBLE;
                tmp9 = c_re(inout[2 * iostride]);
                tmp11 = c_im(inout[2 * iostride]);
                tmp8 = c_re(W[1]);
                tmp10 = c_im(W[1]);
                tmp12 = (tmp8 * tmp9) - (tmp10 * tmp11);
                tmp66 = (tmp10 * tmp9) + (tmp8 * tmp11);
            }
            {
                fftw_real tmp25;
                fftw_real tmp27;
                fftw_real tmp24;
                fftw_real tmp26;
                ASSERT_ALIGNED_DOUBLE;
                tmp25 = c_re(inout[3 * iostride]);
                tmp27 = c_im(inout[3 * iostride]);
                tmp24 = c_re(W[2]);
                tmp26 = c_im(W[2]);
                tmp28 = (tmp24 * tmp25) - (tmp26 * tmp27);
                tmp70 = (tmp26 * tmp25) + (tmp24 * tmp27);
            }
            {
                fftw_real tmp14;
                fftw_real tmp16;
                fftw_real tmp13;
                fftw_real tmp15;
                ASSERT_ALIGNED_DOUBLE;
                tmp14 = c_re(inout[7 * iostride]);
                tmp16 = c_im(inout[7 * iostride]);
                tmp13 = c_re(W[6]);
                tmp15 = c_im(W[6]);
                tmp17 = (tmp13 * tmp14) - (tmp15 * tmp16);
                tmp67 = (tmp15 * tmp14) + (tmp13 * tmp16);
            }
            {
                fftw_real tmp20;
                fftw_real tmp22;
                fftw_real tmp19;
                fftw_real tmp21;
                ASSERT_ALIGNED_DOUBLE;
                tmp20 = c_re(inout[8 * iostride]);
                tmp22 = c_im(inout[8 * iostride]);
                tmp19 = c_re(W[7]);
                tmp21 = c_im(W[7]);
                tmp23 = (tmp19 * tmp20) - (tmp21 * tmp22);
                tmp69 = (tmp21 * tmp20) + (tmp19 * tmp22);
            }
            tmp18 = tmp12 - tmp17;
            tmp29 = tmp23 - tmp28;
            tmp30 = tmp18 + tmp29;
            tmp56 = tmp12 + tmp17;
            tmp57 = tmp23 + tmp28;
            tmp58 = tmp56 + tmp57;
            tmp68 = tmp66 - tmp67;
            tmp71 = tmp69 - tmp70;
            tmp109 = tmp68 + tmp71;
            tmp89 = tmp66 + tmp67;
            tmp90 = tmp69 + tmp70;
            tmp95 = tmp89 + tmp90;
        }
        /* Real parts of outputs 5, 7, 3, 9 and 1 (from the difference terms). */
        {
            fftw_real tmp63;
            fftw_real tmp54;
            fftw_real tmp64;
            fftw_real tmp80;
            fftw_real tmp82;
            fftw_real tmp72;
            fftw_real tmp79;
            fftw_real tmp81;
            fftw_real tmp65;
            ASSERT_ALIGNED_DOUBLE;
            tmp63 = K559016994 * (tmp30 - tmp53);
            tmp54 = tmp30 + tmp53;
            tmp64 = tmp7 - (K250000000 * tmp54);
            tmp72 = tmp68 - tmp71;
            tmp79 = tmp75 - tmp78;
            tmp80 = (K951056516 * tmp72) + (K587785252 * tmp79);
            tmp82 = (K951056516 * tmp79) - (K587785252 * tmp72);
            c_re(inout[5 * iostride]) = tmp7 + tmp54;
            tmp81 = tmp64 - tmp63;
            c_re(inout[7 * iostride]) = tmp81 - tmp82;
            c_re(inout[3 * iostride]) = tmp81 + tmp82;
            tmp65 = tmp63 + tmp64;
            c_re(inout[9 * iostride]) = tmp65 - tmp80;
            c_re(inout[iostride]) = tmp65 + tmp80;
        }
        /* Imaginary parts of outputs 5, 3, 7, 1 and 9 (from the difference terms). */
        {
            fftw_real tmp111;
            fftw_real tmp113;
            fftw_real tmp114;
            fftw_real tmp118;
            fftw_real tmp120;
            fftw_real tmp116;
            fftw_real tmp117;
            fftw_real tmp119;
            fftw_real tmp115;
            ASSERT_ALIGNED_DOUBLE;
            tmp111 = K559016994 * (tmp109 - tmp110);
            tmp113 = tmp109 + tmp110;
            tmp114 = tmp112 - (K250000000 * tmp113);
            tmp116 = tmp18 - tmp29;
            tmp117 = tmp41 - tmp52;
            tmp118 = (K951056516 * tmp116) + (K587785252 * tmp117);
            tmp120 = (K951056516 * tmp117) - (K587785252 * tmp116);
            c_im(inout[5 * iostride]) = tmp113 + tmp112;
            tmp119 = tmp114 - tmp111;
            c_im(inout[3 * iostride]) = tmp119 - tmp120;
            c_im(inout[7 * iostride]) = tmp120 + tmp119;
            tmp115 = tmp111 + tmp114;
            c_im(inout[iostride]) = tmp115 - tmp118;
            c_im(inout[9 * iostride]) = tmp118 + tmp115;
        }
        /* Real parts of outputs 0, 4, 6, 2 and 8 (from the sum terms). */
        {
            fftw_real tmp84;
            fftw_real tmp62;
            fftw_real tmp83;
            fftw_real tmp92;
            fftw_real tmp94;
            fftw_real tmp88;
            fftw_real tmp91;
            fftw_real tmp93;
            fftw_real tmp85;
            ASSERT_ALIGNED_DOUBLE;
            tmp84 = K559016994 * (tmp58 - tmp61);
            tmp62 = tmp58 + tmp61;
            tmp83 = tmp55 - (K250000000 * tmp62);
            tmp88 = tmp86 - tmp87;
            tmp91 = tmp89 - tmp90;
            tmp92 = (K951056516 * tmp88) - (K587785252 * tmp91);
            tmp94 = (K951056516 * tmp91) + (K587785252 * tmp88);
            c_re(inout[0]) = tmp55 + tmp62;
            tmp93 = tmp84 + tmp83;
            c_re(inout[4 * iostride]) = tmp93 - tmp94;
            c_re(inout[6 * iostride]) = tmp93 + tmp94;
            tmp85 = tmp83 - tmp84;
            c_re(inout[2 * iostride]) = tmp85 - tmp92;
            c_re(inout[8 * iostride]) = tmp85 + tmp92;
        }
        /* Imaginary parts of outputs 0, 4, 6, 2 and 8 (from the sum terms). */
        {
            fftw_real tmp105;
            fftw_real tmp97;
            fftw_real tmp104;
            fftw_real tmp103;
            fftw_real tmp107;
            fftw_real tmp101;
            fftw_real tmp102;
            fftw_real tmp108;
            fftw_real tmp106;
            ASSERT_ALIGNED_DOUBLE;
            tmp105 = K559016994 * (tmp95 - tmp96);
            tmp97 = tmp95 + tmp96;
            tmp104 = tmp100 - (K250000000 * tmp97);
            tmp101 = tmp59 - tmp60;
            tmp102 = tmp56 - tmp57;
            tmp103 = (K951056516 * tmp101) - (K587785252 * tmp102);
            tmp107 = (K951056516 * tmp102) + (K587785252 * tmp101);
            c_im(inout[0]) = tmp97 + tmp100;
            tmp108 = tmp105 + tmp104;
            c_im(inout[4 * iostride]) = tmp107 + tmp108;
            c_im(inout[6 * iostride]) = tmp108 - tmp107;
            tmp106 = tmp104 - tmp105;
            c_im(inout[2 * iostride]) = tmp103 + tmp106;
            c_im(inout[8 * iostride]) = tmp106 - tmp103;
        }
    }
}
367
368 static const int twiddle_order[] = { 1, 2, 3, 4, 5, 6, 7, 8, 9 };
369 fftw_codelet_desc fftw_twiddle_10_desc = {
370 "fftw_twiddle_10",
371 (void (*)()) fftw_twiddle_10,
372 10,
373 FFTW_FORWARD,
374 FFTW_TWIDDLE,
375 220,
376 9,
377 twiddle_order,
378 };
379