1 /*
2 * Copyright (c) 1997-1999, 2003 Massachusetts Institute of Technology
3 *
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License as published by
6 * the Free Software Foundation; either version 2 of the License, or
7 * (at your option) any later version.
8 *
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
13 *
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write to the Free Software
16 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
17 *
18 */
19
20 /* This file was automatically generated --- DO NOT EDIT */
21 /* Generated on Mon Mar 24 02:08:59 EST 2003 */
22
23 #include "fftw-int.h"
24 #include "fftw.h"
25
26 /* Generated by: /homee/stevenj/cvs/fftw/gensrc/genfft -magic-alignment-check -magic-twiddle-load-all -magic-variables 4 -magic-loopi -hc2hc-backward 10 */
27
28 /*
29 * This function contains 168 FP additions, 90 FP multiplications,
30 * (or, 124 additions, 46 multiplications, 44 fused multiply/add),
31 * 37 stack variables, and 80 memory accesses
32 */
33 static const fftw_real K250000000 =
34 FFTW_KONST(+0.250000000000000000000000000000000000000000000);
35 static const fftw_real K951056516 =
36 FFTW_KONST(+0.951056516295153572116439333379382143405698634);
37 static const fftw_real K587785252 =
38 FFTW_KONST(+0.587785252292473129168705954639072768597652438);
39 static const fftw_real K559016994 =
40 FFTW_KONST(+0.559016994374947424102293417182819058860154590);
41 static const fftw_real K500000000 =
42 FFTW_KONST(+0.500000000000000000000000000000000000000000000);
43 static const fftw_real K1_902113032 =
44 FFTW_KONST(+1.902113032590307144232878666758764286811397268);
45 static const fftw_real K1_175570504 =
46 FFTW_KONST(+1.175570504584946258337411909278145537195304875);
47 static const fftw_real K2_000000000 =
48 FFTW_KONST(+2.000000000000000000000000000000000000000000000);
49 static const fftw_real K1_118033988 =
50 FFTW_KONST(+1.118033988749894848204586834365638117720309180);
51
52 /*
53 * Generator Id's :
54 * $Id: exprdag.ml,v 1.43 2003/03/16 23:43:46 stevenj Exp $
55 * $Id: fft.ml,v 1.44 2003/03/16 23:43:46 stevenj Exp $
56 * $Id: to_c.ml,v 1.26 2003/03/16 23:43:46 stevenj Exp $
57 */
58
fftw_hc2hc_backward_10(fftw_real * A,const fftw_complex * W,int iostride,int m,int dist)59 void fftw_hc2hc_backward_10(fftw_real *A, const fftw_complex *W,
60 int iostride, int m, int dist)
61 {
62 int i;
63 fftw_real *X;
64 fftw_real *Y;
65 X = A;
66 Y = A + (10 * iostride);
67 {
68 fftw_real tmp155;
69 fftw_real tmp163;
70 fftw_real tmp175;
71 fftw_real tmp183;
72 fftw_real tmp172;
73 fftw_real tmp182;
74 fftw_real tmp162;
75 fftw_real tmp180;
76 fftw_real tmp166;
77 fftw_real tmp167;
78 fftw_real tmp170;
79 fftw_real tmp171;
80 ASSERT_ALIGNED_DOUBLE;
81 {
82 fftw_real tmp153;
83 fftw_real tmp154;
84 fftw_real tmp173;
85 fftw_real tmp174;
86 ASSERT_ALIGNED_DOUBLE;
87 tmp153 = X[0];
88 tmp154 = X[5 * iostride];
89 tmp155 = tmp153 - tmp154;
90 tmp163 = tmp153 + tmp154;
91 tmp173 = Y[-4 * iostride];
92 tmp174 = Y[-iostride];
93 tmp175 = tmp173 - tmp174;
94 tmp183 = tmp173 + tmp174;
95 }
96 tmp170 = Y[-2 * iostride];
97 tmp171 = Y[-3 * iostride];
98 tmp172 = tmp170 - tmp171;
99 tmp182 = tmp170 + tmp171;
100 {
101 fftw_real tmp158;
102 fftw_real tmp164;
103 fftw_real tmp161;
104 fftw_real tmp165;
105 ASSERT_ALIGNED_DOUBLE;
106 {
107 fftw_real tmp156;
108 fftw_real tmp157;
109 fftw_real tmp159;
110 fftw_real tmp160;
111 ASSERT_ALIGNED_DOUBLE;
112 tmp156 = X[2 * iostride];
113 tmp157 = X[3 * iostride];
114 tmp158 = tmp156 - tmp157;
115 tmp164 = tmp156 + tmp157;
116 tmp159 = X[4 * iostride];
117 tmp160 = X[iostride];
118 tmp161 = tmp159 - tmp160;
119 tmp165 = tmp159 + tmp160;
120 }
121 tmp162 = tmp158 + tmp161;
122 tmp180 = K1_118033988 * (tmp158 - tmp161);
123 tmp166 = tmp164 + tmp165;
124 tmp167 = K1_118033988 * (tmp164 - tmp165);
125 }
126 X[5 * iostride] = tmp155 + (K2_000000000 * tmp162);
127 {
128 fftw_real tmp184;
129 fftw_real tmp186;
130 fftw_real tmp181;
131 fftw_real tmp185;
132 fftw_real tmp179;
133 ASSERT_ALIGNED_DOUBLE;
134 tmp184 = (K1_175570504 * tmp182) - (K1_902113032 * tmp183);
135 tmp186 = (K1_902113032 * tmp182) + (K1_175570504 * tmp183);
136 tmp179 = tmp155 - (K500000000 * tmp162);
137 tmp181 = tmp179 - tmp180;
138 tmp185 = tmp179 + tmp180;
139 X[7 * iostride] = tmp181 - tmp184;
140 X[3 * iostride] = tmp181 + tmp184;
141 X[iostride] = tmp185 - tmp186;
142 X[9 * iostride] = tmp185 + tmp186;
143 }
144 X[0] = tmp163 + (K2_000000000 * tmp166);
145 {
146 fftw_real tmp176;
147 fftw_real tmp178;
148 fftw_real tmp169;
149 fftw_real tmp177;
150 fftw_real tmp168;
151 ASSERT_ALIGNED_DOUBLE;
152 tmp176 = (K1_902113032 * tmp172) + (K1_175570504 * tmp175);
153 tmp178 = (K1_902113032 * tmp175) - (K1_175570504 * tmp172);
154 tmp168 = tmp163 - (K500000000 * tmp166);
155 tmp169 = tmp167 + tmp168;
156 tmp177 = tmp168 - tmp167;
157 X[4 * iostride] = tmp169 + tmp176;
158 X[6 * iostride] = tmp169 - tmp176;
159 X[8 * iostride] = tmp177 - tmp178;
160 X[2 * iostride] = tmp177 + tmp178;
161 }
162 }
163 X = X + dist;
164 Y = Y - dist;
165 for (i = 2; i < m; i = i + 2, X = X + dist, Y = Y - dist, W = W + 9) {
166 fftw_real tmp35;
167 fftw_real tmp102;
168 fftw_real tmp77;
169 fftw_real tmp119;
170 fftw_real tmp72;
171 fftw_real tmp73;
172 fftw_real tmp50;
173 fftw_real tmp53;
174 fftw_real tmp123;
175 fftw_real tmp122;
176 fftw_real tmp109;
177 fftw_real tmp131;
178 fftw_real tmp61;
179 fftw_real tmp68;
180 fftw_real tmp80;
181 fftw_real tmp82;
182 fftw_real tmp134;
183 fftw_real tmp133;
184 fftw_real tmp118;
185 fftw_real tmp126;
186 ASSERT_ALIGNED_DOUBLE;
187 {
188 fftw_real tmp33;
189 fftw_real tmp34;
190 fftw_real tmp75;
191 fftw_real tmp76;
192 ASSERT_ALIGNED_DOUBLE;
193 tmp33 = X[0];
194 tmp34 = Y[-5 * iostride];
195 tmp35 = tmp33 + tmp34;
196 tmp102 = tmp33 - tmp34;
197 tmp75 = Y[0];
198 tmp76 = X[5 * iostride];
199 tmp77 = tmp75 - tmp76;
200 tmp119 = tmp75 + tmp76;
201 }
202 {
203 fftw_real tmp38;
204 fftw_real tmp103;
205 fftw_real tmp48;
206 fftw_real tmp107;
207 fftw_real tmp41;
208 fftw_real tmp104;
209 fftw_real tmp45;
210 fftw_real tmp106;
211 ASSERT_ALIGNED_DOUBLE;
212 {
213 fftw_real tmp36;
214 fftw_real tmp37;
215 fftw_real tmp46;
216 fftw_real tmp47;
217 ASSERT_ALIGNED_DOUBLE;
218 tmp36 = X[2 * iostride];
219 tmp37 = Y[-7 * iostride];
220 tmp38 = tmp36 + tmp37;
221 tmp103 = tmp36 - tmp37;
222 tmp46 = Y[-6 * iostride];
223 tmp47 = X[iostride];
224 tmp48 = tmp46 + tmp47;
225 tmp107 = tmp46 - tmp47;
226 }
227 {
228 fftw_real tmp39;
229 fftw_real tmp40;
230 fftw_real tmp43;
231 fftw_real tmp44;
232 ASSERT_ALIGNED_DOUBLE;
233 tmp39 = Y[-8 * iostride];
234 tmp40 = X[3 * iostride];
235 tmp41 = tmp39 + tmp40;
236 tmp104 = tmp39 - tmp40;
237 tmp43 = X[4 * iostride];
238 tmp44 = Y[-9 * iostride];
239 tmp45 = tmp43 + tmp44;
240 tmp106 = tmp43 - tmp44;
241 }
242 {
243 fftw_real tmp42;
244 fftw_real tmp49;
245 fftw_real tmp105;
246 fftw_real tmp108;
247 ASSERT_ALIGNED_DOUBLE;
248 tmp72 = tmp38 - tmp41;
249 tmp73 = tmp45 - tmp48;
250 tmp42 = tmp38 + tmp41;
251 tmp49 = tmp45 + tmp48;
252 tmp50 = tmp42 + tmp49;
253 tmp53 = K559016994 * (tmp42 - tmp49);
254 tmp123 = tmp106 - tmp107;
255 tmp122 = tmp103 - tmp104;
256 tmp105 = tmp103 + tmp104;
257 tmp108 = tmp106 + tmp107;
258 tmp109 = tmp105 + tmp108;
259 tmp131 = K559016994 * (tmp105 - tmp108);
260 }
261 }
262 {
263 fftw_real tmp57;
264 fftw_real tmp112;
265 fftw_real tmp67;
266 fftw_real tmp116;
267 fftw_real tmp60;
268 fftw_real tmp113;
269 fftw_real tmp64;
270 fftw_real tmp115;
271 ASSERT_ALIGNED_DOUBLE;
272 {
273 fftw_real tmp55;
274 fftw_real tmp56;
275 fftw_real tmp65;
276 fftw_real tmp66;
277 ASSERT_ALIGNED_DOUBLE;
278 tmp55 = Y[-2 * iostride];
279 tmp56 = X[7 * iostride];
280 tmp57 = tmp55 - tmp56;
281 tmp112 = tmp55 + tmp56;
282 tmp65 = Y[-iostride];
283 tmp66 = X[6 * iostride];
284 tmp67 = tmp65 - tmp66;
285 tmp116 = tmp65 + tmp66;
286 }
287 {
288 fftw_real tmp58;
289 fftw_real tmp59;
290 fftw_real tmp62;
291 fftw_real tmp63;
292 ASSERT_ALIGNED_DOUBLE;
293 tmp58 = Y[-3 * iostride];
294 tmp59 = X[8 * iostride];
295 tmp60 = tmp58 - tmp59;
296 tmp113 = tmp58 + tmp59;
297 tmp62 = Y[-4 * iostride];
298 tmp63 = X[9 * iostride];
299 tmp64 = tmp62 - tmp63;
300 tmp115 = tmp62 + tmp63;
301 }
302 {
303 fftw_real tmp78;
304 fftw_real tmp79;
305 fftw_real tmp114;
306 fftw_real tmp117;
307 ASSERT_ALIGNED_DOUBLE;
308 tmp61 = tmp57 - tmp60;
309 tmp68 = tmp64 - tmp67;
310 tmp78 = tmp57 + tmp60;
311 tmp79 = tmp64 + tmp67;
312 tmp80 = tmp78 + tmp79;
313 tmp82 = K559016994 * (tmp78 - tmp79);
314 tmp134 = tmp115 + tmp116;
315 tmp133 = tmp112 + tmp113;
316 tmp114 = tmp112 - tmp113;
317 tmp117 = tmp115 - tmp116;
318 tmp118 = tmp114 + tmp117;
319 tmp126 = K559016994 * (tmp114 - tmp117);
320 }
321 }
322 X[0] = tmp35 + tmp50;
323 {
324 fftw_real tmp69;
325 fftw_real tmp91;
326 fftw_real tmp54;
327 fftw_real tmp90;
328 fftw_real tmp95;
329 fftw_real tmp74;
330 fftw_real tmp83;
331 fftw_real tmp94;
332 fftw_real tmp52;
333 fftw_real tmp81;
334 ASSERT_ALIGNED_DOUBLE;
335 tmp69 = (K587785252 * tmp61) - (K951056516 * tmp68);
336 tmp91 = (K951056516 * tmp61) + (K587785252 * tmp68);
337 tmp52 = tmp35 - (K250000000 * tmp50);
338 tmp54 = tmp52 - tmp53;
339 tmp90 = tmp53 + tmp52;
340 tmp95 = (K951056516 * tmp72) + (K587785252 * tmp73);
341 tmp74 = (K587785252 * tmp72) - (K951056516 * tmp73);
342 tmp81 = tmp77 - (K250000000 * tmp80);
343 tmp83 = tmp81 - tmp82;
344 tmp94 = tmp82 + tmp81;
345 {
346 fftw_real tmp70;
347 fftw_real tmp84;
348 fftw_real tmp51;
349 fftw_real tmp71;
350 ASSERT_ALIGNED_DOUBLE;
351 tmp70 = tmp54 - tmp69;
352 tmp84 = tmp74 + tmp83;
353 tmp51 = c_re(W[1]);
354 tmp71 = c_im(W[1]);
355 X[2 * iostride] = (tmp51 * tmp70) + (tmp71 * tmp84);
356 Y[-7 * iostride] = (tmp51 * tmp84) - (tmp71 * tmp70);
357 }
358 {
359 fftw_real tmp86;
360 fftw_real tmp88;
361 fftw_real tmp85;
362 fftw_real tmp87;
363 ASSERT_ALIGNED_DOUBLE;
364 tmp86 = tmp54 + tmp69;
365 tmp88 = tmp83 - tmp74;
366 tmp85 = c_re(W[7]);
367 tmp87 = c_im(W[7]);
368 X[8 * iostride] = (tmp85 * tmp86) + (tmp87 * tmp88);
369 Y[-iostride] = (tmp85 * tmp88) - (tmp87 * tmp86);
370 }
371 {
372 fftw_real tmp92;
373 fftw_real tmp96;
374 fftw_real tmp89;
375 fftw_real tmp93;
376 ASSERT_ALIGNED_DOUBLE;
377 tmp92 = tmp90 + tmp91;
378 tmp96 = tmp94 - tmp95;
379 tmp89 = c_re(W[3]);
380 tmp93 = c_im(W[3]);
381 X[4 * iostride] = (tmp89 * tmp92) + (tmp93 * tmp96);
382 Y[-5 * iostride] = (tmp89 * tmp96) - (tmp93 * tmp92);
383 }
384 {
385 fftw_real tmp98;
386 fftw_real tmp100;
387 fftw_real tmp97;
388 fftw_real tmp99;
389 ASSERT_ALIGNED_DOUBLE;
390 tmp98 = tmp90 - tmp91;
391 tmp100 = tmp95 + tmp94;
392 tmp97 = c_re(W[5]);
393 tmp99 = c_im(W[5]);
394 X[6 * iostride] = (tmp97 * tmp98) + (tmp99 * tmp100);
395 Y[-3 * iostride] = (tmp97 * tmp100) - (tmp99 * tmp98);
396 }
397 }
398 Y[-9 * iostride] = tmp80 + tmp77;
399 {
400 fftw_real tmp110;
401 fftw_real tmp120;
402 fftw_real tmp101;
403 fftw_real tmp111;
404 ASSERT_ALIGNED_DOUBLE;
405 tmp110 = tmp102 + tmp109;
406 tmp120 = tmp118 + tmp119;
407 tmp101 = c_re(W[4]);
408 tmp111 = c_im(W[4]);
409 X[5 * iostride] = (tmp101 * tmp110) + (tmp111 * tmp120);
410 Y[-4 * iostride] = (tmp101 * tmp120) - (tmp111 * tmp110);
411 }
412 {
413 fftw_real tmp124;
414 fftw_real tmp142;
415 fftw_real tmp127;
416 fftw_real tmp143;
417 fftw_real tmp147;
418 fftw_real tmp135;
419 fftw_real tmp132;
420 fftw_real tmp146;
421 fftw_real tmp125;
422 fftw_real tmp130;
423 ASSERT_ALIGNED_DOUBLE;
424 tmp124 = (K587785252 * tmp122) - (K951056516 * tmp123);
425 tmp142 = (K951056516 * tmp122) + (K587785252 * tmp123);
426 tmp125 = tmp119 - (K250000000 * tmp118);
427 tmp127 = tmp125 - tmp126;
428 tmp143 = tmp126 + tmp125;
429 tmp147 = (K951056516 * tmp133) + (K587785252 * tmp134);
430 tmp135 = (K587785252 * tmp133) - (K951056516 * tmp134);
431 tmp130 = tmp102 - (K250000000 * tmp109);
432 tmp132 = tmp130 - tmp131;
433 tmp146 = tmp131 + tmp130;
434 {
435 fftw_real tmp128;
436 fftw_real tmp136;
437 fftw_real tmp121;
438 fftw_real tmp129;
439 ASSERT_ALIGNED_DOUBLE;
440 tmp128 = tmp124 + tmp127;
441 tmp136 = tmp132 - tmp135;
442 tmp121 = c_re(W[6]);
443 tmp129 = c_im(W[6]);
444 Y[-2 * iostride] =
445 (tmp121 * tmp128) - (tmp129 * tmp136);
446 X[7 * iostride] =
447 (tmp121 * tmp136) + (tmp129 * tmp128);
448 }
449 {
450 fftw_real tmp138;
451 fftw_real tmp140;
452 fftw_real tmp137;
453 fftw_real tmp139;
454 ASSERT_ALIGNED_DOUBLE;
455 tmp138 = tmp127 - tmp124;
456 tmp140 = tmp132 + tmp135;
457 tmp137 = c_re(W[2]);
458 tmp139 = c_im(W[2]);
459 Y[-6 * iostride] =
460 (tmp137 * tmp138) - (tmp139 * tmp140);
461 X[3 * iostride] =
462 (tmp137 * tmp140) + (tmp139 * tmp138);
463 }
464 {
465 fftw_real tmp144;
466 fftw_real tmp148;
467 fftw_real tmp141;
468 fftw_real tmp145;
469 ASSERT_ALIGNED_DOUBLE;
470 tmp144 = tmp142 + tmp143;
471 tmp148 = tmp146 - tmp147;
472 tmp141 = c_re(W[0]);
473 tmp145 = c_im(W[0]);
474 Y[-8 * iostride] =
475 (tmp141 * tmp144) - (tmp145 * tmp148);
476 X[iostride] = (tmp141 * tmp148) + (tmp145 * tmp144);
477 }
478 {
479 fftw_real tmp150;
480 fftw_real tmp152;
481 fftw_real tmp149;
482 fftw_real tmp151;
483 ASSERT_ALIGNED_DOUBLE;
484 tmp150 = tmp143 - tmp142;
485 tmp152 = tmp146 + tmp147;
486 tmp149 = c_re(W[8]);
487 tmp151 = c_im(W[8]);
488 Y[0] = (tmp149 * tmp150) - (tmp151 * tmp152);
489 X[9 * iostride] =
490 (tmp149 * tmp152) + (tmp151 * tmp150);
491 }
492 }
493 }
494 if (i == m) {
495 fftw_real tmp1;
496 fftw_real tmp24;
497 fftw_real tmp8;
498 fftw_real tmp10;
499 fftw_real tmp25;
500 fftw_real tmp26;
501 fftw_real tmp14;
502 fftw_real tmp28;
503 fftw_real tmp23;
504 fftw_real tmp17;
505 ASSERT_ALIGNED_DOUBLE;
506 tmp1 = X[2 * iostride];
507 tmp24 = Y[-2 * iostride];
508 {
509 fftw_real tmp2;
510 fftw_real tmp3;
511 fftw_real tmp4;
512 fftw_real tmp5;
513 fftw_real tmp6;
514 fftw_real tmp7;
515 ASSERT_ALIGNED_DOUBLE;
516 tmp2 = X[4 * iostride];
517 tmp3 = X[0];
518 tmp4 = tmp2 + tmp3;
519 tmp5 = X[3 * iostride];
520 tmp6 = X[iostride];
521 tmp7 = tmp5 + tmp6;
522 tmp8 = tmp4 + tmp7;
523 tmp10 = K1_118033988 * (tmp7 - tmp4);
524 tmp25 = tmp2 - tmp3;
525 tmp26 = tmp5 - tmp6;
526 }
527 {
528 fftw_real tmp12;
529 fftw_real tmp13;
530 fftw_real tmp22;
531 fftw_real tmp15;
532 fftw_real tmp16;
533 fftw_real tmp21;
534 ASSERT_ALIGNED_DOUBLE;
535 tmp12 = Y[-4 * iostride];
536 tmp13 = Y[0];
537 tmp22 = tmp12 + tmp13;
538 tmp15 = Y[-iostride];
539 tmp16 = Y[-3 * iostride];
540 tmp21 = tmp15 + tmp16;
541 tmp14 = tmp12 - tmp13;
542 tmp28 = K1_118033988 * (tmp22 + tmp21);
543 tmp23 = tmp21 - tmp22;
544 tmp17 = tmp15 - tmp16;
545 }
546 X[0] = K2_000000000 * (tmp1 + tmp8);
547 {
548 fftw_real tmp18;
549 fftw_real tmp19;
550 fftw_real tmp11;
551 fftw_real tmp20;
552 fftw_real tmp9;
553 ASSERT_ALIGNED_DOUBLE;
554 tmp18 = (K1_175570504 * tmp14) - (K1_902113032 * tmp17);
555 tmp19 = (K1_902113032 * tmp14) + (K1_175570504 * tmp17);
556 tmp9 = (K500000000 * tmp8) - (K2_000000000 * tmp1);
557 tmp11 = tmp9 - tmp10;
558 tmp20 = tmp9 + tmp10;
559 X[2 * iostride] = tmp11 + tmp18;
560 X[8 * iostride] = tmp18 - tmp11;
561 X[4 * iostride] = tmp19 - tmp20;
562 X[6 * iostride] = tmp20 + tmp19;
563 }
564 X[5 * iostride] = K2_000000000 * (tmp23 - tmp24);
565 {
566 fftw_real tmp27;
567 fftw_real tmp31;
568 fftw_real tmp30;
569 fftw_real tmp32;
570 fftw_real tmp29;
571 ASSERT_ALIGNED_DOUBLE;
572 tmp27 = (K1_902113032 * tmp25) + (K1_175570504 * tmp26);
573 tmp31 = (K1_902113032 * tmp26) - (K1_175570504 * tmp25);
574 tmp29 = (K500000000 * tmp23) + (K2_000000000 * tmp24);
575 tmp30 = tmp28 + tmp29;
576 tmp32 = tmp29 - tmp28;
577 X[iostride] = -(tmp27 + tmp30);
578 X[9 * iostride] = tmp27 - tmp30;
579 X[3 * iostride] = tmp31 + tmp32;
580 X[7 * iostride] = tmp32 - tmp31;
581 }
582 }
583 }
584
585 static const int twiddle_order[] = { 1, 2, 3, 4, 5, 6, 7, 8, 9 };
586 fftw_codelet_desc fftw_hc2hc_backward_10_desc = {
587 "fftw_hc2hc_backward_10",
588 (void (*)()) fftw_hc2hc_backward_10,
589 10,
590 FFTW_BACKWARD,
591 FFTW_HC2HC,
592 234,
593 9,
594 twiddle_order,
595 };
596