1 /*
2  * Copyright (c) 1997-1999, 2003 Massachusetts Institute of Technology
3  *
4  * This program is free software; you can redistribute it and/or modify
5  * it under the terms of the GNU General Public License as published by
6  * the Free Software Foundation; either version 2 of the License, or
7  * (at your option) any later version.
8  *
9  * This program is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12  * GNU General Public License for more details.
13  *
14  * You should have received a copy of the GNU General Public License
15  * along with this program; if not, write to the Free Software
16  * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
17  *
18  */
19 
20 /* This file was automatically generated --- DO NOT EDIT */
21 /* Generated on Mon Mar 24 02:09:07 EST 2003 */
22 
23 #include "fftw-int.h"
24 #include "fftw.h"
25 
26 /* Generated by: /homee/stevenj/cvs/fftw/gensrc/genfft -magic-alignment-check -magic-twiddle-load-all -magic-variables 4 -magic-loopi -hc2hc-backward 32 */
27 
28 /*
29  * This function contains 764 FP additions and 346 FP multiplications
30  * (or, counting fused operations separately: 618 additions, 200
31  * multiplications, and 146 fused multiply/adds), 93 stack variables, and 256 memory accesses
32  */
/*
 * Floating-point constants used by the arithmetic in this file.
 *
 * Naming: each identifier spells out the leading digits of its own value,
 * K<integer part>_<first nine fractional digits>; the integer part (and the
 * underscore) is omitted when it is zero, e.g. K707106781 is 0.707106781...
 *
 * The closed form noted beside each declaration agrees with the literal to
 * the digits shown; it is given as a reading aid only.  The literals
 * themselves are generator output and must not be edited by hand.
 *
 * NOTE(review): FFTW_KONST and fftw_real are defined outside this file
 * (presumably in fftw.h / fftw-int.h) -- confirm how the literal is
 * converted to fftw_real there.
 */
33 static const fftw_real K1_662939224 = /* 2*cos(3*pi/16) */
34 FFTW_KONST(+1.662939224605090474157576755235811513477121624);
35 static const fftw_real K1_111140466 = /* 2*sin(3*pi/16) */
36 FFTW_KONST(+1.111140466039204449485661627897065748749874382);
37 static const fftw_real K390180644 = /* 2*sin(pi/16) */
38 FFTW_KONST(+0.390180644032256535696569736954044481855383236);
39 static const fftw_real K1_961570560 = /* 2*cos(pi/16) */
40 FFTW_KONST(+1.961570560806460898252364472268478073947867462);
41 static const fftw_real K1_913880671 = /* 2*cos(3*pi/32) */
42 FFTW_KONST(+1.913880671464417729871595773960539938965698411);
43 static const fftw_real K580569354 = /* 2*sin(3*pi/32) */
44 FFTW_KONST(+0.580569354508924735272384751634790549382952557);
45 static const fftw_real K942793473 = /* 2*sin(5*pi/32) */
46 FFTW_KONST(+0.942793473651995297112775251810508755314920638);
47 static const fftw_real K1_763842528 = /* 2*cos(5*pi/32) */
48 FFTW_KONST(+1.763842528696710059425513727320776699016885241);
49 static const fftw_real K1_546020906 = /* 2*cos(7*pi/32) */
50 FFTW_KONST(+1.546020906725473921621813219516939601942082586);
51 static const fftw_real K1_268786568 = /* 2*sin(7*pi/32) */
52 FFTW_KONST(+1.268786568327290996430343226450986741351374190);
53 static const fftw_real K196034280 = /* 2*sin(pi/32) */
54 FFTW_KONST(+0.196034280659121203988391127777283691722273346);
55 static const fftw_real K1_990369453 = /* 2*cos(pi/32) */
56 FFTW_KONST(+1.990369453344393772489673906218959843150949737);
57 static const fftw_real K382683432 = /* sin(pi/8) */
58 FFTW_KONST(+0.382683432365089771728459984030398866761344562);
59 static const fftw_real K923879532 = /* cos(pi/8) */
60 FFTW_KONST(+0.923879532511286756128183189396788286822416626);
61 static const fftw_real K707106781 = /* sqrt(2)/2 */
62 FFTW_KONST(+0.707106781186547524400844362104849039284835938);
63 static const fftw_real K765366864 = /* 2*sin(pi/8) */
64 FFTW_KONST(+0.765366864730179543456919968060797733522689125);
65 static const fftw_real K1_847759065 = /* 2*cos(pi/8) */
66 FFTW_KONST(+1.847759065022573512256366378793576573644833252);
67 static const fftw_real K555570233 = /* sin(3*pi/16) */
68 FFTW_KONST(+0.555570233019602224742830813948532874374937191);
69 static const fftw_real K831469612 = /* cos(3*pi/16) */
70 FFTW_KONST(+0.831469612302545237078788377617905756738560812);
71 static const fftw_real K195090322 = /* sin(pi/16) */
72 FFTW_KONST(+0.195090322016128267848284868477022240927691618);
73 static const fftw_real K980785280 = /* cos(pi/16) */
74 FFTW_KONST(+0.980785280403230449126182236134239036973933731);
75 static const fftw_real K1_414213562 = /* sqrt(2) */
76 FFTW_KONST(+1.414213562373095048801688724209698078569671875);
77 static const fftw_real K2_000000000 = /* exactly 2 */
78 FFTW_KONST(+2.000000000000000000000000000000000000000000000);
79 
80 /*
81  * Generator Id's :
82  * $Id: exprdag.ml,v 1.43 2003/03/16 23:43:46 stevenj Exp $
83  * $Id: fft.ml,v 1.44 2003/03/16 23:43:46 stevenj Exp $
84  * $Id: to_c.ml,v 1.26 2003/03/16 23:43:46 stevenj Exp $
85  */
86 
fftw_hc2hc_backward_32(fftw_real * A,const fftw_complex * W,int iostride,int m,int dist)87 void fftw_hc2hc_backward_32(fftw_real *A, const fftw_complex *W,
88 			    int iostride, int m, int dist)
89 {
90      int i;
91      fftw_real *X;
92      fftw_real *Y;
93      X = A;
94      Y = A + (32 * iostride);
95      {
96 	  fftw_real tmp679;
97 	  fftw_real tmp804;
98 	  fftw_real tmp769;
99 	  fftw_real tmp707;
100 	  fftw_real tmp702;
101 	  fftw_real tmp728;
102 	  fftw_real tmp726;
103 	  fftw_real tmp750;
104 	  fftw_real tmp815;
105 	  fftw_real tmp819;
106 	  fftw_real tmp782;
107 	  fftw_real tmp793;
108 	  fftw_real tmp676;
109 	  fftw_real tmp704;
110 	  fftw_real tmp773;
111 	  fftw_real tmp803;
112 	  fftw_real tmp687;
113 	  fftw_real tmp709;
114 	  fftw_real tmp716;
115 	  fftw_real tmp753;
116 	  fftw_real tmp762;
117 	  fftw_real tmp806;
118 	  fftw_real tmp765;
119 	  fftw_real tmp807;
120 	  fftw_real tmp695;
121 	  fftw_real tmp719;
122 	  fftw_real tmp735;
123 	  fftw_real tmp749;
124 	  fftw_real tmp812;
125 	  fftw_real tmp818;
126 	  fftw_real tmp789;
127 	  fftw_real tmp792;
128 	  ASSERT_ALIGNED_DOUBLE;
129 	  {
130 	       fftw_real tmp677;
131 	       fftw_real tmp678;
132 	       fftw_real tmp767;
133 	       fftw_real tmp705;
134 	       fftw_real tmp706;
135 	       fftw_real tmp768;
136 	       ASSERT_ALIGNED_DOUBLE;
137 	       tmp677 = X[4 * iostride];
138 	       tmp678 = X[12 * iostride];
139 	       tmp767 = tmp677 - tmp678;
140 	       tmp705 = Y[-4 * iostride];
141 	       tmp706 = Y[-12 * iostride];
142 	       tmp768 = tmp705 + tmp706;
143 	       tmp679 = K2_000000000 * (tmp677 + tmp678);
144 	       tmp804 = K1_414213562 * (tmp767 + tmp768);
145 	       tmp769 = K1_414213562 * (tmp767 - tmp768);
146 	       tmp707 = K2_000000000 * (tmp705 - tmp706);
147 	  }
148 	  {
149 	       fftw_real tmp698;
150 	       fftw_real tmp776;
151 	       fftw_real tmp725;
152 	       fftw_real tmp780;
153 	       fftw_real tmp701;
154 	       fftw_real tmp779;
155 	       fftw_real tmp722;
156 	       fftw_real tmp777;
157 	       ASSERT_ALIGNED_DOUBLE;
158 	       {
159 		    fftw_real tmp696;
160 		    fftw_real tmp697;
161 		    fftw_real tmp723;
162 		    fftw_real tmp724;
163 		    ASSERT_ALIGNED_DOUBLE;
164 		    tmp696 = X[3 * iostride];
165 		    tmp697 = X[13 * iostride];
166 		    tmp698 = tmp696 + tmp697;
167 		    tmp776 = tmp696 - tmp697;
168 		    tmp723 = Y[-3 * iostride];
169 		    tmp724 = Y[-13 * iostride];
170 		    tmp725 = tmp723 - tmp724;
171 		    tmp780 = tmp723 + tmp724;
172 	       }
173 	       {
174 		    fftw_real tmp699;
175 		    fftw_real tmp700;
176 		    fftw_real tmp720;
177 		    fftw_real tmp721;
178 		    ASSERT_ALIGNED_DOUBLE;
179 		    tmp699 = X[5 * iostride];
180 		    tmp700 = X[11 * iostride];
181 		    tmp701 = tmp699 + tmp700;
182 		    tmp779 = tmp700 - tmp699;
183 		    tmp720 = Y[-5 * iostride];
184 		    tmp721 = Y[-11 * iostride];
185 		    tmp722 = tmp720 - tmp721;
186 		    tmp777 = tmp720 + tmp721;
187 	       }
188 	       tmp702 = tmp698 + tmp701;
189 	       tmp728 = tmp701 - tmp698;
190 	       tmp726 = tmp722 + tmp725;
191 	       tmp750 = tmp725 - tmp722;
192 	       {
193 		    fftw_real tmp813;
194 		    fftw_real tmp814;
195 		    fftw_real tmp778;
196 		    fftw_real tmp781;
197 		    ASSERT_ALIGNED_DOUBLE;
198 		    tmp813 = tmp776 + tmp777;
199 		    tmp814 = tmp780 - tmp779;
200 		    tmp815 = (K980785280 * tmp813) - (K195090322 * tmp814);
201 		    tmp819 = (K195090322 * tmp813) + (K980785280 * tmp814);
202 		    tmp778 = tmp776 - tmp777;
203 		    tmp781 = tmp779 + tmp780;
204 		    tmp782 = (K831469612 * tmp778) - (K555570233 * tmp781);
205 		    tmp793 = (K555570233 * tmp778) + (K831469612 * tmp781);
206 	       }
207 	  }
208 	  {
209 	       fftw_real tmp675;
210 	       fftw_real tmp772;
211 	       fftw_real tmp673;
212 	       fftw_real tmp770;
213 	       ASSERT_ALIGNED_DOUBLE;
214 	       {
215 		    fftw_real tmp674;
216 		    fftw_real tmp771;
217 		    fftw_real tmp671;
218 		    fftw_real tmp672;
219 		    ASSERT_ALIGNED_DOUBLE;
220 		    tmp674 = X[8 * iostride];
221 		    tmp675 = K2_000000000 * tmp674;
222 		    tmp771 = Y[-8 * iostride];
223 		    tmp772 = K2_000000000 * tmp771;
224 		    tmp671 = X[0];
225 		    tmp672 = X[16 * iostride];
226 		    tmp673 = tmp671 + tmp672;
227 		    tmp770 = tmp671 - tmp672;
228 	       }
229 	       tmp676 = tmp673 + tmp675;
230 	       tmp704 = tmp673 - tmp675;
231 	       tmp773 = tmp770 - tmp772;
232 	       tmp803 = tmp770 + tmp772;
233 	  }
234 	  {
235 	       fftw_real tmp683;
236 	       fftw_real tmp760;
237 	       fftw_real tmp715;
238 	       fftw_real tmp764;
239 	       fftw_real tmp686;
240 	       fftw_real tmp763;
241 	       fftw_real tmp712;
242 	       fftw_real tmp761;
243 	       ASSERT_ALIGNED_DOUBLE;
244 	       {
245 		    fftw_real tmp681;
246 		    fftw_real tmp682;
247 		    fftw_real tmp713;
248 		    fftw_real tmp714;
249 		    ASSERT_ALIGNED_DOUBLE;
250 		    tmp681 = X[2 * iostride];
251 		    tmp682 = X[14 * iostride];
252 		    tmp683 = tmp681 + tmp682;
253 		    tmp760 = tmp681 - tmp682;
254 		    tmp713 = Y[-2 * iostride];
255 		    tmp714 = Y[-14 * iostride];
256 		    tmp715 = tmp713 - tmp714;
257 		    tmp764 = tmp713 + tmp714;
258 	       }
259 	       {
260 		    fftw_real tmp684;
261 		    fftw_real tmp685;
262 		    fftw_real tmp710;
263 		    fftw_real tmp711;
264 		    ASSERT_ALIGNED_DOUBLE;
265 		    tmp684 = X[6 * iostride];
266 		    tmp685 = X[10 * iostride];
267 		    tmp686 = tmp684 + tmp685;
268 		    tmp763 = tmp685 - tmp684;
269 		    tmp710 = Y[-6 * iostride];
270 		    tmp711 = Y[-10 * iostride];
271 		    tmp712 = tmp710 - tmp711;
272 		    tmp761 = tmp710 + tmp711;
273 	       }
274 	       tmp687 = K2_000000000 * (tmp683 + tmp686);
275 	       tmp709 = tmp683 - tmp686;
276 	       tmp716 = tmp712 + tmp715;
277 	       tmp753 = K2_000000000 * (tmp715 - tmp712);
278 	       tmp762 = tmp760 - tmp761;
279 	       tmp806 = tmp760 + tmp761;
280 	       tmp765 = tmp763 + tmp764;
281 	       tmp807 = tmp764 - tmp763;
282 	  }
283 	  {
284 	       fftw_real tmp691;
285 	       fftw_real tmp783;
286 	       fftw_real tmp734;
287 	       fftw_real tmp787;
288 	       fftw_real tmp694;
289 	       fftw_real tmp786;
290 	       fftw_real tmp731;
291 	       fftw_real tmp784;
292 	       ASSERT_ALIGNED_DOUBLE;
293 	       {
294 		    fftw_real tmp689;
295 		    fftw_real tmp690;
296 		    fftw_real tmp732;
297 		    fftw_real tmp733;
298 		    ASSERT_ALIGNED_DOUBLE;
299 		    tmp689 = X[iostride];
300 		    tmp690 = X[15 * iostride];
301 		    tmp691 = tmp689 + tmp690;
302 		    tmp783 = tmp689 - tmp690;
303 		    tmp732 = Y[-iostride];
304 		    tmp733 = Y[-15 * iostride];
305 		    tmp734 = tmp732 - tmp733;
306 		    tmp787 = tmp732 + tmp733;
307 	       }
308 	       {
309 		    fftw_real tmp692;
310 		    fftw_real tmp693;
311 		    fftw_real tmp729;
312 		    fftw_real tmp730;
313 		    ASSERT_ALIGNED_DOUBLE;
314 		    tmp692 = X[7 * iostride];
315 		    tmp693 = X[9 * iostride];
316 		    tmp694 = tmp692 + tmp693;
317 		    tmp786 = tmp693 - tmp692;
318 		    tmp729 = Y[-7 * iostride];
319 		    tmp730 = Y[-9 * iostride];
320 		    tmp731 = tmp729 - tmp730;
321 		    tmp784 = tmp729 + tmp730;
322 	       }
323 	       tmp695 = tmp691 + tmp694;
324 	       tmp719 = tmp691 - tmp694;
325 	       tmp735 = tmp731 + tmp734;
326 	       tmp749 = tmp734 - tmp731;
327 	       {
328 		    fftw_real tmp810;
329 		    fftw_real tmp811;
330 		    fftw_real tmp785;
331 		    fftw_real tmp788;
332 		    ASSERT_ALIGNED_DOUBLE;
333 		    tmp810 = tmp783 + tmp784;
334 		    tmp811 = tmp787 - tmp786;
335 		    tmp812 = (K555570233 * tmp810) + (K831469612 * tmp811);
336 		    tmp818 = (K831469612 * tmp810) - (K555570233 * tmp811);
337 		    tmp785 = tmp783 - tmp784;
338 		    tmp788 = tmp786 + tmp787;
339 		    tmp789 = (K980785280 * tmp785) - (K195090322 * tmp788);
340 		    tmp792 = (K195090322 * tmp785) + (K980785280 * tmp788);
341 	       }
342 	  }
343 	  {
344 	       fftw_real tmp703;
345 	       fftw_real tmp751;
346 	       fftw_real tmp688;
347 	       fftw_real tmp748;
348 	       fftw_real tmp680;
349 	       ASSERT_ALIGNED_DOUBLE;
350 	       tmp703 = K2_000000000 * (tmp695 + tmp702);
351 	       tmp751 = K2_000000000 * (tmp749 - tmp750);
352 	       tmp680 = tmp676 + tmp679;
353 	       tmp688 = tmp680 + tmp687;
354 	       tmp748 = tmp680 - tmp687;
355 	       X[16 * iostride] = tmp688 - tmp703;
356 	       X[0] = tmp688 + tmp703;
357 	       X[24 * iostride] = tmp748 + tmp751;
358 	       X[8 * iostride] = tmp748 - tmp751;
359 	  }
360 	  {
361 	       fftw_real tmp754;
362 	       fftw_real tmp758;
363 	       fftw_real tmp757;
364 	       fftw_real tmp759;
365 	       fftw_real tmp752;
366 	       fftw_real tmp755;
367 	       fftw_real tmp756;
368 	       ASSERT_ALIGNED_DOUBLE;
369 	       tmp752 = tmp676 - tmp679;
370 	       tmp754 = tmp752 - tmp753;
371 	       tmp758 = tmp752 + tmp753;
372 	       tmp755 = tmp695 - tmp702;
373 	       tmp756 = tmp750 + tmp749;
374 	       tmp757 = K1_414213562 * (tmp755 - tmp756);
375 	       tmp759 = K1_414213562 * (tmp755 + tmp756);
376 	       X[20 * iostride] = tmp754 - tmp757;
377 	       X[4 * iostride] = tmp754 + tmp757;
378 	       X[12 * iostride] = tmp758 - tmp759;
379 	       X[28 * iostride] = tmp758 + tmp759;
380 	  }
381 	  {
382 	       fftw_real tmp718;
383 	       fftw_real tmp738;
384 	       fftw_real tmp737;
385 	       fftw_real tmp739;
386 	       ASSERT_ALIGNED_DOUBLE;
387 	       {
388 		    fftw_real tmp708;
389 		    fftw_real tmp717;
390 		    fftw_real tmp727;
391 		    fftw_real tmp736;
392 		    ASSERT_ALIGNED_DOUBLE;
393 		    tmp708 = tmp704 - tmp707;
394 		    tmp717 = K1_414213562 * (tmp709 - tmp716);
395 		    tmp718 = tmp708 + tmp717;
396 		    tmp738 = tmp708 - tmp717;
397 		    tmp727 = tmp719 - tmp726;
398 		    tmp736 = tmp728 + tmp735;
399 		    tmp737 =
400 			(K1_847759065 * tmp727) - (K765366864 * tmp736);
401 		    tmp739 =
402 			(K765366864 * tmp727) + (K1_847759065 * tmp736);
403 	       }
404 	       X[18 * iostride] = tmp718 - tmp737;
405 	       X[2 * iostride] = tmp718 + tmp737;
406 	       X[10 * iostride] = tmp738 - tmp739;
407 	       X[26 * iostride] = tmp738 + tmp739;
408 	  }
409 	  {
410 	       fftw_real tmp742;
411 	       fftw_real tmp746;
412 	       fftw_real tmp745;
413 	       fftw_real tmp747;
414 	       ASSERT_ALIGNED_DOUBLE;
415 	       {
416 		    fftw_real tmp740;
417 		    fftw_real tmp741;
418 		    fftw_real tmp743;
419 		    fftw_real tmp744;
420 		    ASSERT_ALIGNED_DOUBLE;
421 		    tmp740 = tmp704 + tmp707;
422 		    tmp741 = K1_414213562 * (tmp709 + tmp716);
423 		    tmp742 = tmp740 - tmp741;
424 		    tmp746 = tmp740 + tmp741;
425 		    tmp743 = tmp719 + tmp726;
426 		    tmp744 = tmp735 - tmp728;
427 		    tmp745 =
428 			(K765366864 * tmp743) - (K1_847759065 * tmp744);
429 		    tmp747 =
430 			(K1_847759065 * tmp743) + (K765366864 * tmp744);
431 	       }
432 	       X[22 * iostride] = tmp742 - tmp745;
433 	       X[6 * iostride] = tmp742 + tmp745;
434 	       X[14 * iostride] = tmp746 - tmp747;
435 	       X[30 * iostride] = tmp746 + tmp747;
436 	  }
437 	  {
438 	       fftw_real tmp790;
439 	       fftw_real tmp794;
440 	       fftw_real tmp775;
441 	       fftw_real tmp791;
442 	       fftw_real tmp766;
443 	       fftw_real tmp774;
444 	       ASSERT_ALIGNED_DOUBLE;
445 	       tmp790 = K2_000000000 * (tmp782 + tmp789);
446 	       tmp794 = K2_000000000 * (tmp792 - tmp793);
447 	       tmp766 = (K1_847759065 * tmp762) - (K765366864 * tmp765);
448 	       tmp774 = tmp769 + tmp773;
449 	       tmp775 = tmp766 + tmp774;
450 	       tmp791 = tmp774 - tmp766;
451 	       X[17 * iostride] = tmp775 - tmp790;
452 	       X[iostride] = tmp790 + tmp775;
453 	       X[9 * iostride] = tmp791 - tmp794;
454 	       X[25 * iostride] = tmp794 + tmp791;
455 	  }
456 	  {
457 	       fftw_real tmp797;
458 	       fftw_real tmp801;
459 	       fftw_real tmp800;
460 	       fftw_real tmp802;
461 	       ASSERT_ALIGNED_DOUBLE;
462 	       {
463 		    fftw_real tmp795;
464 		    fftw_real tmp796;
465 		    fftw_real tmp798;
466 		    fftw_real tmp799;
467 		    ASSERT_ALIGNED_DOUBLE;
468 		    tmp795 = tmp773 - tmp769;
469 		    tmp796 =
470 			(K765366864 * tmp762) + (K1_847759065 * tmp765);
471 		    tmp797 = tmp795 - tmp796;
472 		    tmp801 = tmp796 + tmp795;
473 		    tmp798 = tmp789 - tmp782;
474 		    tmp799 = tmp793 + tmp792;
475 		    tmp800 = K1_414213562 * (tmp798 - tmp799);
476 		    tmp802 = K1_414213562 * (tmp798 + tmp799);
477 	       }
478 	       X[21 * iostride] = tmp797 - tmp800;
479 	       X[5 * iostride] = tmp800 + tmp797;
480 	       X[13 * iostride] = tmp801 - tmp802;
481 	       X[29 * iostride] = tmp802 + tmp801;
482 	  }
483 	  {
484 	       fftw_real tmp816;
485 	       fftw_real tmp820;
486 	       fftw_real tmp809;
487 	       fftw_real tmp817;
488 	       fftw_real tmp805;
489 	       fftw_real tmp808;
490 	       ASSERT_ALIGNED_DOUBLE;
491 	       tmp816 = K2_000000000 * (tmp812 - tmp815);
492 	       tmp820 = K2_000000000 * (tmp818 - tmp819);
493 	       tmp805 = tmp803 - tmp804;
494 	       tmp808 = (K765366864 * tmp806) - (K1_847759065 * tmp807);
495 	       tmp809 = tmp805 - tmp808;
496 	       tmp817 = tmp808 + tmp805;
497 	       X[11 * iostride] = tmp809 - tmp816;
498 	       X[27 * iostride] = tmp816 + tmp809;
499 	       X[19 * iostride] = tmp817 - tmp820;
500 	       X[3 * iostride] = tmp820 + tmp817;
501 	  }
502 	  {
503 	       fftw_real tmp823;
504 	       fftw_real tmp827;
505 	       fftw_real tmp826;
506 	       fftw_real tmp828;
507 	       ASSERT_ALIGNED_DOUBLE;
508 	       {
509 		    fftw_real tmp821;
510 		    fftw_real tmp822;
511 		    fftw_real tmp824;
512 		    fftw_real tmp825;
513 		    ASSERT_ALIGNED_DOUBLE;
514 		    tmp821 = tmp804 + tmp803;
515 		    tmp822 =
516 			(K1_847759065 * tmp806) + (K765366864 * tmp807);
517 		    tmp823 = tmp821 - tmp822;
518 		    tmp827 = tmp822 + tmp821;
519 		    tmp824 = tmp819 + tmp818;
520 		    tmp825 = tmp815 + tmp812;
521 		    tmp826 = K1_414213562 * (tmp824 - tmp825);
522 		    tmp828 = K1_414213562 * (tmp824 + tmp825);
523 	       }
524 	       X[23 * iostride] = tmp823 - tmp826;
525 	       X[7 * iostride] = tmp826 + tmp823;
526 	       X[15 * iostride] = tmp827 - tmp828;
527 	       X[31 * iostride] = tmp828 + tmp827;
528 	  }
529      }
530      X = X + dist;
531      Y = Y - dist;
532      for (i = 2; i < m; i = i + 2, X = X + dist, Y = Y - dist, W = W + 31) {
533 	  fftw_real tmp446;
534 	  fftw_real tmp580;
535 	  fftw_real tmp189;
536 	  fftw_real tmp238;
537 	  fftw_real tmp382;
538 	  fftw_real tmp420;
539 	  fftw_real tmp307;
540 	  fftw_real tmp332;
541 	  fftw_real tmp514;
542 	  fftw_real tmp608;
543 	  fftw_real tmp354;
544 	  fftw_real tmp408;
545 	  fftw_real tmp453;
546 	  fftw_real tmp609;
547 	  fftw_real tmp517;
548 	  fftw_real tmp581;
549 	  fftw_real tmp235;
550 	  fftw_real tmp272;
551 	  fftw_real tmp365;
552 	  fftw_real tmp411;
553 	  fftw_real tmp287;
554 	  fftw_real tmp336;
555 	  fftw_real tmp368;
556 	  fftw_real tmp412;
557 	  fftw_real tmp500;
558 	  fftw_real tmp550;
559 	  fftw_real tmp593;
560 	  fftw_real tmp643;
561 	  fftw_real tmp507;
562 	  fftw_real tmp551;
563 	  fftw_real tmp596;
564 	  fftw_real tmp642;
565 	  fftw_real tmp204;
566 	  fftw_real tmp292;
567 	  fftw_real tmp357;
568 	  fftw_real tmp384;
569 	  fftw_real tmp253;
570 	  fftw_real tmp333;
571 	  fftw_real tmp360;
572 	  fftw_real tmp383;
573 	  fftw_real tmp461;
574 	  fftw_real tmp520;
575 	  fftw_real tmp588;
576 	  fftw_real tmp612;
577 	  fftw_real tmp468;
578 	  fftw_real tmp519;
579 	  fftw_real tmp585;
580 	  fftw_real tmp611;
581 	  fftw_real tmp220;
582 	  fftw_real tmp255;
583 	  fftw_real tmp372;
584 	  fftw_real tmp414;
585 	  fftw_real tmp270;
586 	  fftw_real tmp335;
587 	  fftw_real tmp375;
588 	  fftw_real tmp415;
589 	  fftw_real tmp481;
590 	  fftw_real tmp547;
591 	  fftw_real tmp600;
592 	  fftw_real tmp640;
593 	  fftw_real tmp488;
594 	  fftw_real tmp548;
595 	  fftw_real tmp603;
596 	  fftw_real tmp639;
597 	  ASSERT_ALIGNED_DOUBLE;
598 	  {
599 	       fftw_real tmp177;
600 	       fftw_real tmp444;
601 	       fftw_real tmp295;
602 	       fftw_real tmp513;
603 	       fftw_real tmp180;
604 	       fftw_real tmp512;
605 	       fftw_real tmp298;
606 	       fftw_real tmp445;
607 	       fftw_real tmp184;
608 	       fftw_real tmp447;
609 	       fftw_real tmp302;
610 	       fftw_real tmp448;
611 	       fftw_real tmp187;
612 	       fftw_real tmp450;
613 	       fftw_real tmp305;
614 	       fftw_real tmp451;
615 	       ASSERT_ALIGNED_DOUBLE;
616 	       {
617 		    fftw_real tmp175;
618 		    fftw_real tmp176;
619 		    fftw_real tmp293;
620 		    fftw_real tmp294;
621 		    ASSERT_ALIGNED_DOUBLE;
622 		    tmp175 = X[0];
623 		    tmp176 = Y[-16 * iostride];
624 		    tmp177 = tmp175 + tmp176;
625 		    tmp444 = tmp175 - tmp176;
626 		    tmp293 = Y[0];
627 		    tmp294 = X[16 * iostride];
628 		    tmp295 = tmp293 - tmp294;
629 		    tmp513 = tmp293 + tmp294;
630 	       }
631 	       {
632 		    fftw_real tmp178;
633 		    fftw_real tmp179;
634 		    fftw_real tmp296;
635 		    fftw_real tmp297;
636 		    ASSERT_ALIGNED_DOUBLE;
637 		    tmp178 = X[8 * iostride];
638 		    tmp179 = Y[-24 * iostride];
639 		    tmp180 = tmp178 + tmp179;
640 		    tmp512 = tmp178 - tmp179;
641 		    tmp296 = Y[-8 * iostride];
642 		    tmp297 = X[24 * iostride];
643 		    tmp298 = tmp296 - tmp297;
644 		    tmp445 = tmp296 + tmp297;
645 	       }
646 	       {
647 		    fftw_real tmp182;
648 		    fftw_real tmp183;
649 		    fftw_real tmp300;
650 		    fftw_real tmp301;
651 		    ASSERT_ALIGNED_DOUBLE;
652 		    tmp182 = X[4 * iostride];
653 		    tmp183 = Y[-20 * iostride];
654 		    tmp184 = tmp182 + tmp183;
655 		    tmp447 = tmp182 - tmp183;
656 		    tmp300 = Y[-4 * iostride];
657 		    tmp301 = X[20 * iostride];
658 		    tmp302 = tmp300 - tmp301;
659 		    tmp448 = tmp300 + tmp301;
660 	       }
661 	       {
662 		    fftw_real tmp185;
663 		    fftw_real tmp186;
664 		    fftw_real tmp303;
665 		    fftw_real tmp304;
666 		    ASSERT_ALIGNED_DOUBLE;
667 		    tmp185 = Y[-28 * iostride];
668 		    tmp186 = X[12 * iostride];
669 		    tmp187 = tmp185 + tmp186;
670 		    tmp450 = tmp185 - tmp186;
671 		    tmp303 = Y[-12 * iostride];
672 		    tmp304 = X[28 * iostride];
673 		    tmp305 = tmp303 - tmp304;
674 		    tmp451 = tmp303 + tmp304;
675 	       }
676 	       {
677 		    fftw_real tmp181;
678 		    fftw_real tmp188;
679 		    fftw_real tmp352;
680 		    fftw_real tmp353;
681 		    ASSERT_ALIGNED_DOUBLE;
682 		    tmp446 = tmp444 - tmp445;
683 		    tmp580 = tmp444 + tmp445;
684 		    tmp181 = tmp177 + tmp180;
685 		    tmp188 = tmp184 + tmp187;
686 		    tmp189 = tmp181 + tmp188;
687 		    tmp238 = tmp181 - tmp188;
688 		    {
689 			 fftw_real tmp380;
690 			 fftw_real tmp381;
691 			 fftw_real tmp299;
692 			 fftw_real tmp306;
693 			 ASSERT_ALIGNED_DOUBLE;
694 			 tmp380 = tmp295 - tmp298;
695 			 tmp381 = tmp184 - tmp187;
696 			 tmp382 = tmp380 - tmp381;
697 			 tmp420 = tmp381 + tmp380;
698 			 tmp299 = tmp295 + tmp298;
699 			 tmp306 = tmp302 + tmp305;
700 			 tmp307 = tmp299 - tmp306;
701 			 tmp332 = tmp299 + tmp306;
702 		    }
703 		    tmp514 = tmp512 + tmp513;
704 		    tmp608 = tmp513 - tmp512;
705 		    tmp352 = tmp177 - tmp180;
706 		    tmp353 = tmp305 - tmp302;
707 		    tmp354 = tmp352 - tmp353;
708 		    tmp408 = tmp352 + tmp353;
709 		    {
710 			 fftw_real tmp449;
711 			 fftw_real tmp452;
712 			 fftw_real tmp515;
713 			 fftw_real tmp516;
714 			 ASSERT_ALIGNED_DOUBLE;
715 			 tmp449 = tmp447 - tmp448;
716 			 tmp452 = tmp450 - tmp451;
717 			 tmp453 = K707106781 * (tmp449 + tmp452);
718 			 tmp609 = K707106781 * (tmp449 - tmp452);
719 			 tmp515 = tmp447 + tmp448;
720 			 tmp516 = tmp450 + tmp451;
721 			 tmp517 = K707106781 * (tmp515 - tmp516);
722 			 tmp581 = K707106781 * (tmp515 + tmp516);
723 		    }
724 	       }
725 	  }
726 	  {
727 	       fftw_real tmp223;
728 	       fftw_real tmp490;
729 	       fftw_real tmp275;
730 	       fftw_real tmp502;
731 	       fftw_real tmp226;
732 	       fftw_real tmp501;
733 	       fftw_real tmp278;
734 	       fftw_real tmp491;
735 	       fftw_real tmp233;
736 	       fftw_real tmp505;
737 	       fftw_real tmp498;
738 	       fftw_real tmp285;
739 	       fftw_real tmp230;
740 	       fftw_real tmp504;
741 	       fftw_real tmp495;
742 	       fftw_real tmp282;
743 	       ASSERT_ALIGNED_DOUBLE;
744 	       {
745 		    fftw_real tmp221;
746 		    fftw_real tmp222;
747 		    fftw_real tmp276;
748 		    fftw_real tmp277;
749 		    ASSERT_ALIGNED_DOUBLE;
750 		    tmp221 = Y[-31 * iostride];
751 		    tmp222 = X[15 * iostride];
752 		    tmp223 = tmp221 + tmp222;
753 		    tmp490 = tmp221 - tmp222;
754 		    {
755 			 fftw_real tmp273;
756 			 fftw_real tmp274;
757 			 fftw_real tmp224;
758 			 fftw_real tmp225;
759 			 ASSERT_ALIGNED_DOUBLE;
760 			 tmp273 = Y[-15 * iostride];
761 			 tmp274 = X[31 * iostride];
762 			 tmp275 = tmp273 - tmp274;
763 			 tmp502 = tmp273 + tmp274;
764 			 tmp224 = X[7 * iostride];
765 			 tmp225 = Y[-23 * iostride];
766 			 tmp226 = tmp224 + tmp225;
767 			 tmp501 = tmp224 - tmp225;
768 		    }
769 		    tmp276 = Y[-7 * iostride];
770 		    tmp277 = X[23 * iostride];
771 		    tmp278 = tmp276 - tmp277;
772 		    tmp491 = tmp276 + tmp277;
773 		    {
774 			 fftw_real tmp231;
775 			 fftw_real tmp232;
776 			 fftw_real tmp496;
777 			 fftw_real tmp283;
778 			 fftw_real tmp284;
779 			 fftw_real tmp497;
780 			 ASSERT_ALIGNED_DOUBLE;
781 			 tmp231 = Y[-27 * iostride];
782 			 tmp232 = X[11 * iostride];
783 			 tmp496 = tmp231 - tmp232;
784 			 tmp283 = Y[-11 * iostride];
785 			 tmp284 = X[27 * iostride];
786 			 tmp497 = tmp283 + tmp284;
787 			 tmp233 = tmp231 + tmp232;
788 			 tmp505 = tmp496 + tmp497;
789 			 tmp498 = tmp496 - tmp497;
790 			 tmp285 = tmp283 - tmp284;
791 		    }
792 		    {
793 			 fftw_real tmp228;
794 			 fftw_real tmp229;
795 			 fftw_real tmp493;
796 			 fftw_real tmp280;
797 			 fftw_real tmp281;
798 			 fftw_real tmp494;
799 			 ASSERT_ALIGNED_DOUBLE;
800 			 tmp228 = X[3 * iostride];
801 			 tmp229 = Y[-19 * iostride];
802 			 tmp493 = tmp228 - tmp229;
803 			 tmp280 = Y[-3 * iostride];
804 			 tmp281 = X[19 * iostride];
805 			 tmp494 = tmp280 + tmp281;
806 			 tmp230 = tmp228 + tmp229;
807 			 tmp504 = tmp493 + tmp494;
808 			 tmp495 = tmp493 - tmp494;
809 			 tmp282 = tmp280 - tmp281;
810 		    }
811 	       }
812 	       {
813 		    fftw_real tmp227;
814 		    fftw_real tmp234;
815 		    fftw_real tmp363;
816 		    fftw_real tmp364;
817 		    ASSERT_ALIGNED_DOUBLE;
818 		    tmp227 = tmp223 + tmp226;
819 		    tmp234 = tmp230 + tmp233;
820 		    tmp235 = tmp227 + tmp234;
821 		    tmp272 = tmp227 - tmp234;
822 		    tmp363 = tmp275 - tmp278;
823 		    tmp364 = tmp230 - tmp233;
824 		    tmp365 = tmp363 - tmp364;
825 		    tmp411 = tmp364 + tmp363;
826 	       }
827 	       {
828 		    fftw_real tmp279;
829 		    fftw_real tmp286;
830 		    fftw_real tmp366;
831 		    fftw_real tmp367;
832 		    ASSERT_ALIGNED_DOUBLE;
833 		    tmp279 = tmp275 + tmp278;
834 		    tmp286 = tmp282 + tmp285;
835 		    tmp287 = tmp279 - tmp286;
836 		    tmp336 = tmp279 + tmp286;
837 		    tmp366 = tmp223 - tmp226;
838 		    tmp367 = tmp285 - tmp282;
839 		    tmp368 = tmp366 - tmp367;
840 		    tmp412 = tmp366 + tmp367;
841 	       }
842 	       {
843 		    fftw_real tmp492;
844 		    fftw_real tmp499;
845 		    fftw_real tmp591;
846 		    fftw_real tmp592;
847 		    ASSERT_ALIGNED_DOUBLE;
848 		    tmp492 = tmp490 - tmp491;
849 		    tmp499 = K707106781 * (tmp495 + tmp498);
850 		    tmp500 = tmp492 - tmp499;
851 		    tmp550 = tmp492 + tmp499;
852 		    tmp591 = K707106781 * (tmp495 - tmp498);
853 		    tmp592 = tmp501 + tmp502;
854 		    tmp593 = tmp591 - tmp592;
855 		    tmp643 = tmp592 + tmp591;
856 	       }
857 	       {
858 		    fftw_real tmp503;
859 		    fftw_real tmp506;
860 		    fftw_real tmp594;
861 		    fftw_real tmp595;
862 		    ASSERT_ALIGNED_DOUBLE;
863 		    tmp503 = tmp501 - tmp502;
864 		    tmp506 = K707106781 * (tmp504 - tmp505);
865 		    tmp507 = tmp503 - tmp506;
866 		    tmp551 = tmp503 + tmp506;
867 		    tmp594 = tmp490 + tmp491;
868 		    tmp595 = K707106781 * (tmp504 + tmp505);
869 		    tmp596 = tmp594 - tmp595;
870 		    tmp642 = tmp594 + tmp595;
871 	       }
872 	  }
873 	  {
874 	       fftw_real tmp192;
875 	       fftw_real tmp465;
876 	       fftw_real tmp248;
877 	       fftw_real tmp463;
878 	       fftw_real tmp195;
879 	       fftw_real tmp462;
880 	       fftw_real tmp251;
881 	       fftw_real tmp466;
882 	       fftw_real tmp199;
883 	       fftw_real tmp458;
884 	       fftw_real tmp241;
885 	       fftw_real tmp456;
886 	       fftw_real tmp202;
887 	       fftw_real tmp455;
888 	       fftw_real tmp244;
889 	       fftw_real tmp459;
890 	       ASSERT_ALIGNED_DOUBLE;
891 	       {
892 		    fftw_real tmp190;
893 		    fftw_real tmp191;
894 		    fftw_real tmp246;
895 		    fftw_real tmp247;
896 		    ASSERT_ALIGNED_DOUBLE;
897 		    tmp190 = X[2 * iostride];
898 		    tmp191 = Y[-18 * iostride];
899 		    tmp192 = tmp190 + tmp191;
900 		    tmp465 = tmp190 - tmp191;
901 		    tmp246 = Y[-2 * iostride];
902 		    tmp247 = X[18 * iostride];
903 		    tmp248 = tmp246 - tmp247;
904 		    tmp463 = tmp246 + tmp247;
905 	       }
906 	       {
907 		    fftw_real tmp193;
908 		    fftw_real tmp194;
909 		    fftw_real tmp249;
910 		    fftw_real tmp250;
911 		    ASSERT_ALIGNED_DOUBLE;
912 		    tmp193 = X[10 * iostride];
913 		    tmp194 = Y[-26 * iostride];
914 		    tmp195 = tmp193 + tmp194;
915 		    tmp462 = tmp193 - tmp194;
916 		    tmp249 = Y[-10 * iostride];
917 		    tmp250 = X[26 * iostride];
918 		    tmp251 = tmp249 - tmp250;
919 		    tmp466 = tmp249 + tmp250;
920 	       }
921 	       {
922 		    fftw_real tmp197;
923 		    fftw_real tmp198;
924 		    fftw_real tmp239;
925 		    fftw_real tmp240;
926 		    ASSERT_ALIGNED_DOUBLE;
927 		    tmp197 = Y[-30 * iostride];
928 		    tmp198 = X[14 * iostride];
929 		    tmp199 = tmp197 + tmp198;
930 		    tmp458 = tmp197 - tmp198;
931 		    tmp239 = Y[-14 * iostride];
932 		    tmp240 = X[30 * iostride];
933 		    tmp241 = tmp239 - tmp240;
934 		    tmp456 = tmp239 + tmp240;
935 	       }
936 	       {
937 		    fftw_real tmp200;
938 		    fftw_real tmp201;
939 		    fftw_real tmp242;
940 		    fftw_real tmp243;
941 		    ASSERT_ALIGNED_DOUBLE;
942 		    tmp200 = X[6 * iostride];
943 		    tmp201 = Y[-22 * iostride];
944 		    tmp202 = tmp200 + tmp201;
945 		    tmp455 = tmp200 - tmp201;
946 		    tmp242 = Y[-6 * iostride];
947 		    tmp243 = X[22 * iostride];
948 		    tmp244 = tmp242 - tmp243;
949 		    tmp459 = tmp242 + tmp243;
950 	       }
951 	       {
952 		    fftw_real tmp196;
953 		    fftw_real tmp203;
954 		    fftw_real tmp355;
955 		    fftw_real tmp356;
956 		    ASSERT_ALIGNED_DOUBLE;
957 		    tmp196 = tmp192 + tmp195;
958 		    tmp203 = tmp199 + tmp202;
959 		    tmp204 = tmp196 + tmp203;
960 		    tmp292 = tmp196 - tmp203;
961 		    tmp355 = tmp241 - tmp244;
962 		    tmp356 = tmp199 - tmp202;
963 		    tmp357 = tmp355 - tmp356;
964 		    tmp384 = tmp356 + tmp355;
965 	       }
966 	       {
967 		    fftw_real tmp245;
968 		    fftw_real tmp252;
969 		    fftw_real tmp358;
970 		    fftw_real tmp359;
971 		    ASSERT_ALIGNED_DOUBLE;
972 		    tmp245 = tmp241 + tmp244;
973 		    tmp252 = tmp248 + tmp251;
974 		    tmp253 = tmp245 - tmp252;
975 		    tmp333 = tmp252 + tmp245;
976 		    tmp358 = tmp192 - tmp195;
977 		    tmp359 = tmp248 - tmp251;
978 		    tmp360 = tmp358 + tmp359;
979 		    tmp383 = tmp358 - tmp359;
980 	       }
981 	       {
982 		    fftw_real tmp457;
983 		    fftw_real tmp460;
984 		    fftw_real tmp586;
985 		    fftw_real tmp587;
986 		    ASSERT_ALIGNED_DOUBLE;
987 		    tmp457 = tmp455 - tmp456;
988 		    tmp460 = tmp458 - tmp459;
989 		    tmp461 = (K923879532 * tmp457) - (K382683432 * tmp460);
990 		    tmp520 = (K382683432 * tmp457) + (K923879532 * tmp460);
991 		    tmp586 = tmp458 + tmp459;
992 		    tmp587 = tmp455 + tmp456;
993 		    tmp588 = (K382683432 * tmp586) - (K923879532 * tmp587);
994 		    tmp612 = (K382683432 * tmp587) + (K923879532 * tmp586);
995 	       }
996 	       {
997 		    fftw_real tmp464;
998 		    fftw_real tmp467;
999 		    fftw_real tmp583;
1000 		    fftw_real tmp584;
1001 		    ASSERT_ALIGNED_DOUBLE;
1002 		    tmp464 = tmp462 + tmp463;
1003 		    tmp467 = tmp465 - tmp466;
1004 		    tmp468 = (K923879532 * tmp464) + (K382683432 * tmp467);
1005 		    tmp519 = (K923879532 * tmp467) - (K382683432 * tmp464);
1006 		    tmp583 = tmp465 + tmp466;
1007 		    tmp584 = tmp463 - tmp462;
1008 		    tmp585 = (K382683432 * tmp583) - (K923879532 * tmp584);
1009 		    tmp611 = (K382683432 * tmp584) + (K923879532 * tmp583);
1010 	       }
1011 	  }
1012 	  {
1013 	       fftw_real tmp208;
1014 	       fftw_real tmp471;
1015 	       fftw_real tmp258;
1016 	       fftw_real tmp483;
1017 	       fftw_real tmp211;
1018 	       fftw_real tmp482;
1019 	       fftw_real tmp261;
1020 	       fftw_real tmp472;
1021 	       fftw_real tmp218;
1022 	       fftw_real tmp486;
1023 	       fftw_real tmp479;
1024 	       fftw_real tmp268;
1025 	       fftw_real tmp215;
1026 	       fftw_real tmp485;
1027 	       fftw_real tmp476;
1028 	       fftw_real tmp265;
1029 	       ASSERT_ALIGNED_DOUBLE;
1030 	       {
1031 		    fftw_real tmp206;
1032 		    fftw_real tmp207;
1033 		    fftw_real tmp259;
1034 		    fftw_real tmp260;
1035 		    ASSERT_ALIGNED_DOUBLE;
1036 		    tmp206 = X[iostride];
1037 		    tmp207 = Y[-17 * iostride];
1038 		    tmp208 = tmp206 + tmp207;
1039 		    tmp471 = tmp206 - tmp207;
1040 		    {
1041 			 fftw_real tmp256;
1042 			 fftw_real tmp257;
1043 			 fftw_real tmp209;
1044 			 fftw_real tmp210;
1045 			 ASSERT_ALIGNED_DOUBLE;
1046 			 tmp256 = Y[-iostride];
1047 			 tmp257 = X[17 * iostride];
1048 			 tmp258 = tmp256 - tmp257;
1049 			 tmp483 = tmp256 + tmp257;
1050 			 tmp209 = X[9 * iostride];
1051 			 tmp210 = Y[-25 * iostride];
1052 			 tmp211 = tmp209 + tmp210;
1053 			 tmp482 = tmp209 - tmp210;
1054 		    }
1055 		    tmp259 = Y[-9 * iostride];
1056 		    tmp260 = X[25 * iostride];
1057 		    tmp261 = tmp259 - tmp260;
1058 		    tmp472 = tmp259 + tmp260;
1059 		    {
1060 			 fftw_real tmp216;
1061 			 fftw_real tmp217;
1062 			 fftw_real tmp477;
1063 			 fftw_real tmp266;
1064 			 fftw_real tmp267;
1065 			 fftw_real tmp478;
1066 			 ASSERT_ALIGNED_DOUBLE;
1067 			 tmp216 = Y[-29 * iostride];
1068 			 tmp217 = X[13 * iostride];
1069 			 tmp477 = tmp216 - tmp217;
1070 			 tmp266 = Y[-13 * iostride];
1071 			 tmp267 = X[29 * iostride];
1072 			 tmp478 = tmp266 + tmp267;
1073 			 tmp218 = tmp216 + tmp217;
1074 			 tmp486 = tmp477 + tmp478;
1075 			 tmp479 = tmp477 - tmp478;
1076 			 tmp268 = tmp266 - tmp267;
1077 		    }
1078 		    {
1079 			 fftw_real tmp213;
1080 			 fftw_real tmp214;
1081 			 fftw_real tmp474;
1082 			 fftw_real tmp263;
1083 			 fftw_real tmp264;
1084 			 fftw_real tmp475;
1085 			 ASSERT_ALIGNED_DOUBLE;
1086 			 tmp213 = X[5 * iostride];
1087 			 tmp214 = Y[-21 * iostride];
1088 			 tmp474 = tmp213 - tmp214;
1089 			 tmp263 = Y[-5 * iostride];
1090 			 tmp264 = X[21 * iostride];
1091 			 tmp475 = tmp263 + tmp264;
1092 			 tmp215 = tmp213 + tmp214;
1093 			 tmp485 = tmp474 + tmp475;
1094 			 tmp476 = tmp474 - tmp475;
1095 			 tmp265 = tmp263 - tmp264;
1096 		    }
1097 	       }
1098 	       {
1099 		    fftw_real tmp212;
1100 		    fftw_real tmp219;
1101 		    fftw_real tmp370;
1102 		    fftw_real tmp371;
1103 		    ASSERT_ALIGNED_DOUBLE;
1104 		    tmp212 = tmp208 + tmp211;
1105 		    tmp219 = tmp215 + tmp218;
1106 		    tmp220 = tmp212 + tmp219;
1107 		    tmp255 = tmp212 - tmp219;
1108 		    tmp370 = tmp258 - tmp261;
1109 		    tmp371 = tmp215 - tmp218;
1110 		    tmp372 = tmp370 - tmp371;
1111 		    tmp414 = tmp371 + tmp370;
1112 	       }
1113 	       {
1114 		    fftw_real tmp262;
1115 		    fftw_real tmp269;
1116 		    fftw_real tmp373;
1117 		    fftw_real tmp374;
1118 		    ASSERT_ALIGNED_DOUBLE;
1119 		    tmp262 = tmp258 + tmp261;
1120 		    tmp269 = tmp265 + tmp268;
1121 		    tmp270 = tmp262 - tmp269;
1122 		    tmp335 = tmp262 + tmp269;
1123 		    tmp373 = tmp208 - tmp211;
1124 		    tmp374 = tmp268 - tmp265;
1125 		    tmp375 = tmp373 - tmp374;
1126 		    tmp415 = tmp373 + tmp374;
1127 	       }
1128 	       {
1129 		    fftw_real tmp473;
1130 		    fftw_real tmp480;
1131 		    fftw_real tmp598;
1132 		    fftw_real tmp599;
1133 		    ASSERT_ALIGNED_DOUBLE;
1134 		    tmp473 = tmp471 - tmp472;
1135 		    tmp480 = K707106781 * (tmp476 + tmp479);
1136 		    tmp481 = tmp473 - tmp480;
1137 		    tmp547 = tmp473 + tmp480;
1138 		    tmp598 = tmp483 - tmp482;
1139 		    tmp599 = K707106781 * (tmp476 - tmp479);
1140 		    tmp600 = tmp598 + tmp599;
1141 		    tmp640 = tmp598 - tmp599;
1142 	       }
1143 	       {
1144 		    fftw_real tmp484;
1145 		    fftw_real tmp487;
1146 		    fftw_real tmp601;
1147 		    fftw_real tmp602;
1148 		    ASSERT_ALIGNED_DOUBLE;
1149 		    tmp484 = tmp482 + tmp483;
1150 		    tmp487 = K707106781 * (tmp485 - tmp486);
1151 		    tmp488 = tmp484 - tmp487;
1152 		    tmp548 = tmp484 + tmp487;
1153 		    tmp601 = tmp471 + tmp472;
1154 		    tmp602 = K707106781 * (tmp485 + tmp486);
1155 		    tmp603 = tmp601 - tmp602;
1156 		    tmp639 = tmp601 + tmp602;
1157 	       }
1158 	  }
1159 	  {
1160 	       fftw_real tmp205;
1161 	       fftw_real tmp236;
1162 	       fftw_real tmp330;
1163 	       fftw_real tmp334;
1164 	       fftw_real tmp337;
1165 	       fftw_real tmp338;
1166 	       fftw_real tmp329;
1167 	       fftw_real tmp331;
1168 	       ASSERT_ALIGNED_DOUBLE;
1169 	       tmp205 = tmp189 + tmp204;
1170 	       tmp236 = tmp220 + tmp235;
1171 	       tmp330 = tmp205 - tmp236;
1172 	       tmp334 = tmp332 + tmp333;
1173 	       tmp337 = tmp335 + tmp336;
1174 	       tmp338 = tmp334 - tmp337;
1175 	       X[0] = tmp205 + tmp236;
1176 	       Y[-31 * iostride] = tmp334 + tmp337;
1177 	       tmp329 = c_re(W[15]);
1178 	       tmp331 = c_im(W[15]);
1179 	       X[16 * iostride] = (tmp329 * tmp330) + (tmp331 * tmp338);
1180 	       Y[-15 * iostride] = (tmp329 * tmp338) - (tmp331 * tmp330);
1181 	  }
1182 	  {
1183 	       fftw_real tmp342;
1184 	       fftw_real tmp348;
1185 	       fftw_real tmp346;
1186 	       fftw_real tmp350;
1187 	       ASSERT_ALIGNED_DOUBLE;
1188 	       {
1189 		    fftw_real tmp340;
1190 		    fftw_real tmp341;
1191 		    fftw_real tmp344;
1192 		    fftw_real tmp345;
1193 		    ASSERT_ALIGNED_DOUBLE;
1194 		    tmp340 = tmp332 - tmp333;
1195 		    tmp341 = tmp220 - tmp235;
1196 		    tmp342 = tmp340 - tmp341;
1197 		    tmp348 = tmp341 + tmp340;
1198 		    tmp344 = tmp189 - tmp204;
1199 		    tmp345 = tmp336 - tmp335;
1200 		    tmp346 = tmp344 - tmp345;
1201 		    tmp350 = tmp344 + tmp345;
1202 	       }
1203 	       {
1204 		    fftw_real tmp339;
1205 		    fftw_real tmp343;
1206 		    fftw_real tmp347;
1207 		    fftw_real tmp349;
1208 		    ASSERT_ALIGNED_DOUBLE;
1209 		    tmp339 = c_re(W[23]);
1210 		    tmp343 = c_im(W[23]);
1211 		    Y[-7 * iostride] =
1212 			(tmp339 * tmp342) - (tmp343 * tmp346);
1213 		    X[24 * iostride] =
1214 			(tmp343 * tmp342) + (tmp339 * tmp346);
1215 		    tmp347 = c_re(W[7]);
1216 		    tmp349 = c_im(W[7]);
1217 		    Y[-23 * iostride] =
1218 			(tmp347 * tmp348) - (tmp349 * tmp350);
1219 		    X[8 * iostride] =
1220 			(tmp349 * tmp348) + (tmp347 * tmp350);
1221 	       }
1222 	  }
1223 	  {
1224 	       fftw_real tmp254;
1225 	       fftw_real tmp322;
1226 	       fftw_real tmp289;
1227 	       fftw_real tmp319;
1228 	       fftw_real tmp308;
1229 	       fftw_real tmp318;
1230 	       fftw_real tmp311;
1231 	       fftw_real tmp323;
1232 	       ASSERT_ALIGNED_DOUBLE;
1233 	       {
1234 		    fftw_real tmp271;
1235 		    fftw_real tmp288;
1236 		    fftw_real tmp309;
1237 		    fftw_real tmp310;
1238 		    ASSERT_ALIGNED_DOUBLE;
1239 		    tmp254 = tmp238 + tmp253;
1240 		    tmp322 = tmp238 - tmp253;
1241 		    tmp271 = tmp255 - tmp270;
1242 		    tmp288 = tmp272 + tmp287;
1243 		    tmp289 = K707106781 * (tmp271 + tmp288);
1244 		    tmp319 = K707106781 * (tmp271 - tmp288);
1245 		    tmp308 = tmp292 + tmp307;
1246 		    tmp318 = tmp307 - tmp292;
1247 		    tmp309 = tmp255 + tmp270;
1248 		    tmp310 = tmp287 - tmp272;
1249 		    tmp311 = K707106781 * (tmp309 + tmp310);
1250 		    tmp323 = K707106781 * (tmp310 - tmp309);
1251 	       }
1252 	       {
1253 		    fftw_real tmp290;
1254 		    fftw_real tmp312;
1255 		    fftw_real tmp237;
1256 		    fftw_real tmp291;
1257 		    ASSERT_ALIGNED_DOUBLE;
1258 		    tmp290 = tmp254 - tmp289;
1259 		    tmp312 = tmp308 - tmp311;
1260 		    tmp237 = c_re(W[19]);
1261 		    tmp291 = c_im(W[19]);
1262 		    X[20 * iostride] =
1263 			(tmp237 * tmp290) + (tmp291 * tmp312);
1264 		    Y[-11 * iostride] =
1265 			(tmp237 * tmp312) - (tmp291 * tmp290);
1266 	       }
1267 	       {
1268 		    fftw_real tmp314;
1269 		    fftw_real tmp316;
1270 		    fftw_real tmp313;
1271 		    fftw_real tmp315;
1272 		    ASSERT_ALIGNED_DOUBLE;
1273 		    tmp314 = tmp254 + tmp289;
1274 		    tmp316 = tmp308 + tmp311;
1275 		    tmp313 = c_re(W[3]);
1276 		    tmp315 = c_im(W[3]);
1277 		    X[4 * iostride] =
1278 			(tmp313 * tmp314) + (tmp315 * tmp316);
1279 		    Y[-27 * iostride] =
1280 			(tmp313 * tmp316) - (tmp315 * tmp314);
1281 	       }
1282 	       {
1283 		    fftw_real tmp320;
1284 		    fftw_real tmp324;
1285 		    fftw_real tmp317;
1286 		    fftw_real tmp321;
1287 		    ASSERT_ALIGNED_DOUBLE;
1288 		    tmp320 = tmp318 - tmp319;
1289 		    tmp324 = tmp322 - tmp323;
1290 		    tmp317 = c_re(W[27]);
1291 		    tmp321 = c_im(W[27]);
1292 		    Y[-3 * iostride] =
1293 			(tmp317 * tmp320) - (tmp321 * tmp324);
1294 		    X[28 * iostride] =
1295 			(tmp321 * tmp320) + (tmp317 * tmp324);
1296 	       }
1297 	       {
1298 		    fftw_real tmp326;
1299 		    fftw_real tmp328;
1300 		    fftw_real tmp325;
1301 		    fftw_real tmp327;
1302 		    ASSERT_ALIGNED_DOUBLE;
1303 		    tmp326 = tmp318 + tmp319;
1304 		    tmp328 = tmp322 + tmp323;
1305 		    tmp325 = c_re(W[11]);
1306 		    tmp327 = c_im(W[11]);
1307 		    Y[-19 * iostride] =
1308 			(tmp325 * tmp326) - (tmp327 * tmp328);
1309 		    X[12 * iostride] =
1310 			(tmp327 * tmp326) + (tmp325 * tmp328);
1311 	       }
1312 	  }
1313 	  {
1314 	       fftw_real tmp638;
1315 	       fftw_real tmp664;
1316 	       fftw_real tmp653;
1317 	       fftw_real tmp665;
1318 	       fftw_real tmp645;
1319 	       fftw_real tmp661;
1320 	       fftw_real tmp650;
1321 	       fftw_real tmp660;
1322 	       ASSERT_ALIGNED_DOUBLE;
1323 	       {
1324 		    fftw_real tmp636;
1325 		    fftw_real tmp637;
1326 		    fftw_real tmp651;
1327 		    fftw_real tmp652;
1328 		    ASSERT_ALIGNED_DOUBLE;
1329 		    tmp636 = tmp580 + tmp581;
1330 		    tmp637 = tmp611 + tmp612;
1331 		    tmp638 = tmp636 - tmp637;
1332 		    tmp664 = tmp636 + tmp637;
1333 		    tmp651 = (K195090322 * tmp640) + (K980785280 * tmp639);
1334 		    tmp652 = (K195090322 * tmp643) + (K980785280 * tmp642);
1335 		    tmp653 = tmp651 - tmp652;
1336 		    tmp665 = tmp651 + tmp652;
1337 	       }
1338 	       {
1339 		    fftw_real tmp641;
1340 		    fftw_real tmp644;
1341 		    fftw_real tmp648;
1342 		    fftw_real tmp649;
1343 		    ASSERT_ALIGNED_DOUBLE;
1344 		    tmp641 = (K195090322 * tmp639) - (K980785280 * tmp640);
1345 		    tmp644 = (K195090322 * tmp642) - (K980785280 * tmp643);
1346 		    tmp645 = tmp641 + tmp644;
1347 		    tmp661 = tmp641 - tmp644;
1348 		    tmp648 = tmp608 - tmp609;
1349 		    tmp649 = tmp585 - tmp588;
1350 		    tmp650 = tmp648 + tmp649;
1351 		    tmp660 = tmp648 - tmp649;
1352 	       }
1353 	       {
1354 		    fftw_real tmp646;
1355 		    fftw_real tmp654;
1356 		    fftw_real tmp635;
1357 		    fftw_real tmp647;
1358 		    ASSERT_ALIGNED_DOUBLE;
1359 		    tmp646 = tmp638 - tmp645;
1360 		    tmp654 = tmp650 - tmp653;
1361 		    tmp635 = c_re(W[22]);
1362 		    tmp647 = c_im(W[22]);
1363 		    X[23 * iostride] =
1364 			(tmp635 * tmp646) + (tmp647 * tmp654);
1365 		    Y[-8 * iostride] =
1366 			(tmp635 * tmp654) - (tmp647 * tmp646);
1367 	       }
1368 	       {
1369 		    fftw_real tmp656;
1370 		    fftw_real tmp658;
1371 		    fftw_real tmp655;
1372 		    fftw_real tmp657;
1373 		    ASSERT_ALIGNED_DOUBLE;
1374 		    tmp656 = tmp638 + tmp645;
1375 		    tmp658 = tmp650 + tmp653;
1376 		    tmp655 = c_re(W[6]);
1377 		    tmp657 = c_im(W[6]);
1378 		    X[7 * iostride] =
1379 			(tmp655 * tmp656) + (tmp657 * tmp658);
1380 		    Y[-24 * iostride] =
1381 			(tmp655 * tmp658) - (tmp657 * tmp656);
1382 	       }
1383 	       {
1384 		    fftw_real tmp662;
1385 		    fftw_real tmp666;
1386 		    fftw_real tmp659;
1387 		    fftw_real tmp663;
1388 		    ASSERT_ALIGNED_DOUBLE;
1389 		    tmp662 = tmp660 + tmp661;
1390 		    tmp666 = tmp664 - tmp665;
1391 		    tmp659 = c_re(W[14]);
1392 		    tmp663 = c_im(W[14]);
1393 		    Y[-16 * iostride] =
1394 			(tmp659 * tmp662) - (tmp663 * tmp666);
1395 		    X[15 * iostride] =
1396 			(tmp663 * tmp662) + (tmp659 * tmp666);
1397 	       }
1398 	       {
1399 		    fftw_real tmp668;
1400 		    fftw_real tmp670;
1401 		    fftw_real tmp667;
1402 		    fftw_real tmp669;
1403 		    ASSERT_ALIGNED_DOUBLE;
1404 		    tmp668 = tmp660 - tmp661;
1405 		    tmp670 = tmp664 + tmp665;
1406 		    tmp667 = c_re(W[30]);
1407 		    tmp669 = c_im(W[30]);
1408 		    Y[0] = (tmp667 * tmp668) - (tmp669 * tmp670);
1409 		    X[31 * iostride] =
1410 			(tmp669 * tmp668) + (tmp667 * tmp670);
1411 	       }
1412 	  }
1413 	  {
1414 	       fftw_real tmp410;
1415 	       fftw_real tmp436;
1416 	       fftw_real tmp425;
1417 	       fftw_real tmp437;
1418 	       fftw_real tmp422;
1419 	       fftw_real tmp432;
1420 	       fftw_real tmp417;
1421 	       fftw_real tmp433;
1422 	       ASSERT_ALIGNED_DOUBLE;
1423 	       {
1424 		    fftw_real tmp409;
1425 		    fftw_real tmp423;
1426 		    fftw_real tmp424;
1427 		    fftw_real tmp421;
1428 		    fftw_real tmp413;
1429 		    fftw_real tmp416;
1430 		    ASSERT_ALIGNED_DOUBLE;
1431 		    tmp409 = K707106781 * (tmp383 + tmp384);
1432 		    tmp410 = tmp408 - tmp409;
1433 		    tmp436 = tmp408 + tmp409;
1434 		    tmp423 = (K923879532 * tmp415) - (K382683432 * tmp414);
1435 		    tmp424 = (K382683432 * tmp411) + (K923879532 * tmp412);
1436 		    tmp425 = tmp423 - tmp424;
1437 		    tmp437 = tmp423 + tmp424;
1438 		    tmp421 = K707106781 * (tmp360 + tmp357);
1439 		    tmp422 = tmp420 - tmp421;
1440 		    tmp432 = tmp420 + tmp421;
1441 		    tmp413 = (K923879532 * tmp411) - (K382683432 * tmp412);
1442 		    tmp416 = (K923879532 * tmp414) + (K382683432 * tmp415);
1443 		    tmp417 = tmp413 - tmp416;
1444 		    tmp433 = tmp416 + tmp413;
1445 	       }
1446 	       {
1447 		    fftw_real tmp418;
1448 		    fftw_real tmp426;
1449 		    fftw_real tmp407;
1450 		    fftw_real tmp419;
1451 		    ASSERT_ALIGNED_DOUBLE;
1452 		    tmp418 = tmp410 - tmp417;
1453 		    tmp426 = tmp422 - tmp425;
1454 		    tmp407 = c_re(W[25]);
1455 		    tmp419 = c_im(W[25]);
1456 		    X[26 * iostride] =
1457 			(tmp407 * tmp418) + (tmp419 * tmp426);
1458 		    Y[-5 * iostride] =
1459 			(tmp407 * tmp426) - (tmp419 * tmp418);
1460 	       }
1461 	       {
1462 		    fftw_real tmp428;
1463 		    fftw_real tmp430;
1464 		    fftw_real tmp427;
1465 		    fftw_real tmp429;
1466 		    ASSERT_ALIGNED_DOUBLE;
1467 		    tmp428 = tmp410 + tmp417;
1468 		    tmp430 = tmp422 + tmp425;
1469 		    tmp427 = c_re(W[9]);
1470 		    tmp429 = c_im(W[9]);
1471 		    X[10 * iostride] =
1472 			(tmp427 * tmp428) + (tmp429 * tmp430);
1473 		    Y[-21 * iostride] =
1474 			(tmp427 * tmp430) - (tmp429 * tmp428);
1475 	       }
1476 	       {
1477 		    fftw_real tmp434;
1478 		    fftw_real tmp438;
1479 		    fftw_real tmp431;
1480 		    fftw_real tmp435;
1481 		    ASSERT_ALIGNED_DOUBLE;
1482 		    tmp434 = tmp432 - tmp433;
1483 		    tmp438 = tmp436 - tmp437;
1484 		    tmp431 = c_re(W[17]);
1485 		    tmp435 = c_im(W[17]);
1486 		    Y[-13 * iostride] =
1487 			(tmp431 * tmp434) - (tmp435 * tmp438);
1488 		    X[18 * iostride] =
1489 			(tmp435 * tmp434) + (tmp431 * tmp438);
1490 	       }
1491 	       {
1492 		    fftw_real tmp440;
1493 		    fftw_real tmp442;
1494 		    fftw_real tmp439;
1495 		    fftw_real tmp441;
1496 		    ASSERT_ALIGNED_DOUBLE;
1497 		    tmp440 = tmp432 + tmp433;
1498 		    tmp442 = tmp436 + tmp437;
1499 		    tmp439 = c_re(W[1]);
1500 		    tmp441 = c_im(W[1]);
1501 		    Y[-29 * iostride] =
1502 			(tmp439 * tmp440) - (tmp441 * tmp442);
1503 		    X[2 * iostride] =
1504 			(tmp441 * tmp440) + (tmp439 * tmp442);
1505 	       }
1506 	  }
1507 	  {
1508 	       fftw_real tmp362;
1509 	       fftw_real tmp400;
1510 	       fftw_real tmp389;
1511 	       fftw_real tmp401;
1512 	       fftw_real tmp386;
1513 	       fftw_real tmp396;
1514 	       fftw_real tmp377;
1515 	       fftw_real tmp397;
1516 	       ASSERT_ALIGNED_DOUBLE;
1517 	       {
1518 		    fftw_real tmp361;
1519 		    fftw_real tmp387;
1520 		    fftw_real tmp388;
1521 		    fftw_real tmp385;
1522 		    fftw_real tmp369;
1523 		    fftw_real tmp376;
1524 		    ASSERT_ALIGNED_DOUBLE;
1525 		    tmp361 = K707106781 * (tmp357 - tmp360);
1526 		    tmp362 = tmp354 - tmp361;
1527 		    tmp400 = tmp354 + tmp361;
1528 		    tmp387 = (K382683432 * tmp375) - (K923879532 * tmp372);
1529 		    tmp388 = (K923879532 * tmp365) + (K382683432 * tmp368);
1530 		    tmp389 = tmp387 - tmp388;
1531 		    tmp401 = tmp387 + tmp388;
1532 		    tmp385 = K707106781 * (tmp383 - tmp384);
1533 		    tmp386 = tmp382 - tmp385;
1534 		    tmp396 = tmp382 + tmp385;
1535 		    tmp369 = (K382683432 * tmp365) - (K923879532 * tmp368);
1536 		    tmp376 = (K382683432 * tmp372) + (K923879532 * tmp375);
1537 		    tmp377 = tmp369 - tmp376;
1538 		    tmp397 = tmp376 + tmp369;
1539 	       }
1540 	       {
1541 		    fftw_real tmp378;
1542 		    fftw_real tmp390;
1543 		    fftw_real tmp351;
1544 		    fftw_real tmp379;
1545 		    ASSERT_ALIGNED_DOUBLE;
1546 		    tmp378 = tmp362 - tmp377;
1547 		    tmp390 = tmp386 - tmp389;
1548 		    tmp351 = c_re(W[29]);
1549 		    tmp379 = c_im(W[29]);
1550 		    X[30 * iostride] =
1551 			(tmp351 * tmp378) + (tmp379 * tmp390);
1552 		    Y[-iostride] = (tmp351 * tmp390) - (tmp379 * tmp378);
1553 	       }
1554 	       {
1555 		    fftw_real tmp392;
1556 		    fftw_real tmp394;
1557 		    fftw_real tmp391;
1558 		    fftw_real tmp393;
1559 		    ASSERT_ALIGNED_DOUBLE;
1560 		    tmp392 = tmp362 + tmp377;
1561 		    tmp394 = tmp386 + tmp389;
1562 		    tmp391 = c_re(W[13]);
1563 		    tmp393 = c_im(W[13]);
1564 		    X[14 * iostride] =
1565 			(tmp391 * tmp392) + (tmp393 * tmp394);
1566 		    Y[-17 * iostride] =
1567 			(tmp391 * tmp394) - (tmp393 * tmp392);
1568 	       }
1569 	       {
1570 		    fftw_real tmp398;
1571 		    fftw_real tmp402;
1572 		    fftw_real tmp395;
1573 		    fftw_real tmp399;
1574 		    ASSERT_ALIGNED_DOUBLE;
1575 		    tmp398 = tmp396 - tmp397;
1576 		    tmp402 = tmp400 - tmp401;
1577 		    tmp395 = c_re(W[21]);
1578 		    tmp399 = c_im(W[21]);
1579 		    Y[-9 * iostride] =
1580 			(tmp395 * tmp398) - (tmp399 * tmp402);
1581 		    X[22 * iostride] =
1582 			(tmp399 * tmp398) + (tmp395 * tmp402);
1583 	       }
1584 	       {
1585 		    fftw_real tmp404;
1586 		    fftw_real tmp406;
1587 		    fftw_real tmp403;
1588 		    fftw_real tmp405;
1589 		    ASSERT_ALIGNED_DOUBLE;
1590 		    tmp404 = tmp396 + tmp397;
1591 		    tmp406 = tmp400 + tmp401;
1592 		    tmp403 = c_re(W[5]);
1593 		    tmp405 = c_im(W[5]);
1594 		    Y[-25 * iostride] =
1595 			(tmp403 * tmp404) - (tmp405 * tmp406);
1596 		    X[6 * iostride] =
1597 			(tmp405 * tmp404) + (tmp403 * tmp406);
1598 	       }
1599 	  }
1600 	  {
1601 	       fftw_real tmp590;
1602 	       fftw_real tmp628;
1603 	       fftw_real tmp617;
1604 	       fftw_real tmp629;
1605 	       fftw_real tmp605;
1606 	       fftw_real tmp625;
1607 	       fftw_real tmp614;
1608 	       fftw_real tmp624;
1609 	       ASSERT_ALIGNED_DOUBLE;
1610 	       {
1611 		    fftw_real tmp582;
1612 		    fftw_real tmp589;
1613 		    fftw_real tmp615;
1614 		    fftw_real tmp616;
1615 		    ASSERT_ALIGNED_DOUBLE;
1616 		    tmp582 = tmp580 - tmp581;
1617 		    tmp589 = tmp585 + tmp588;
1618 		    tmp590 = tmp582 - tmp589;
1619 		    tmp628 = tmp582 + tmp589;
1620 		    tmp615 = (K831469612 * tmp603) - (K555570233 * tmp600);
1621 		    tmp616 = (K555570233 * tmp593) + (K831469612 * tmp596);
1622 		    tmp617 = tmp615 - tmp616;
1623 		    tmp629 = tmp615 + tmp616;
1624 	       }
1625 	       {
1626 		    fftw_real tmp597;
1627 		    fftw_real tmp604;
1628 		    fftw_real tmp610;
1629 		    fftw_real tmp613;
1630 		    ASSERT_ALIGNED_DOUBLE;
1631 		    tmp597 = (K831469612 * tmp593) - (K555570233 * tmp596);
1632 		    tmp604 = (K831469612 * tmp600) + (K555570233 * tmp603);
1633 		    tmp605 = tmp597 - tmp604;
1634 		    tmp625 = tmp604 + tmp597;
1635 		    tmp610 = tmp608 + tmp609;
1636 		    tmp613 = tmp611 - tmp612;
1637 		    tmp614 = tmp610 - tmp613;
1638 		    tmp624 = tmp610 + tmp613;
1639 	       }
1640 	       {
1641 		    fftw_real tmp606;
1642 		    fftw_real tmp618;
1643 		    fftw_real tmp579;
1644 		    fftw_real tmp607;
1645 		    ASSERT_ALIGNED_DOUBLE;
1646 		    tmp606 = tmp590 - tmp605;
1647 		    tmp618 = tmp614 - tmp617;
1648 		    tmp579 = c_re(W[26]);
1649 		    tmp607 = c_im(W[26]);
1650 		    X[27 * iostride] =
1651 			(tmp579 * tmp606) + (tmp607 * tmp618);
1652 		    Y[-4 * iostride] =
1653 			(tmp579 * tmp618) - (tmp607 * tmp606);
1654 	       }
1655 	       {
1656 		    fftw_real tmp620;
1657 		    fftw_real tmp622;
1658 		    fftw_real tmp619;
1659 		    fftw_real tmp621;
1660 		    ASSERT_ALIGNED_DOUBLE;
1661 		    tmp620 = tmp590 + tmp605;
1662 		    tmp622 = tmp614 + tmp617;
1663 		    tmp619 = c_re(W[10]);
1664 		    tmp621 = c_im(W[10]);
1665 		    X[11 * iostride] =
1666 			(tmp619 * tmp620) + (tmp621 * tmp622);
1667 		    Y[-20 * iostride] =
1668 			(tmp619 * tmp622) - (tmp621 * tmp620);
1669 	       }
1670 	       {
1671 		    fftw_real tmp626;
1672 		    fftw_real tmp630;
1673 		    fftw_real tmp623;
1674 		    fftw_real tmp627;
1675 		    ASSERT_ALIGNED_DOUBLE;
1676 		    tmp626 = tmp624 - tmp625;
1677 		    tmp630 = tmp628 - tmp629;
1678 		    tmp623 = c_re(W[18]);
1679 		    tmp627 = c_im(W[18]);
1680 		    Y[-12 * iostride] =
1681 			(tmp623 * tmp626) - (tmp627 * tmp630);
1682 		    X[19 * iostride] =
1683 			(tmp627 * tmp626) + (tmp623 * tmp630);
1684 	       }
1685 	       {
1686 		    fftw_real tmp632;
1687 		    fftw_real tmp634;
1688 		    fftw_real tmp631;
1689 		    fftw_real tmp633;
1690 		    ASSERT_ALIGNED_DOUBLE;
1691 		    tmp632 = tmp624 + tmp625;
1692 		    tmp634 = tmp628 + tmp629;
1693 		    tmp631 = c_re(W[2]);
1694 		    tmp633 = c_im(W[2]);
1695 		    Y[-28 * iostride] =
1696 			(tmp631 * tmp632) - (tmp633 * tmp634);
1697 		    X[3 * iostride] =
1698 			(tmp633 * tmp632) + (tmp631 * tmp634);
1699 	       }
1700 	  }
1701 	  {
1702 	       fftw_real tmp546;
1703 	       fftw_real tmp572;
1704 	       fftw_real tmp561;
1705 	       fftw_real tmp573;
1706 	       fftw_real tmp553;
1707 	       fftw_real tmp569;
1708 	       fftw_real tmp558;
1709 	       fftw_real tmp568;
1710 	       ASSERT_ALIGNED_DOUBLE;
1711 	       {
1712 		    fftw_real tmp544;
1713 		    fftw_real tmp545;
1714 		    fftw_real tmp559;
1715 		    fftw_real tmp560;
1716 		    ASSERT_ALIGNED_DOUBLE;
1717 		    tmp544 = tmp446 + tmp453;
1718 		    tmp545 = tmp519 + tmp520;
1719 		    tmp546 = tmp544 + tmp545;
1720 		    tmp572 = tmp544 - tmp545;
1721 		    tmp559 = (K195090322 * tmp547) + (K980785280 * tmp548);
1722 		    tmp560 = (K980785280 * tmp551) - (K195090322 * tmp550);
1723 		    tmp561 = tmp559 + tmp560;
1724 		    tmp573 = tmp560 - tmp559;
1725 	       }
1726 	       {
1727 		    fftw_real tmp549;
1728 		    fftw_real tmp552;
1729 		    fftw_real tmp556;
1730 		    fftw_real tmp557;
1731 		    ASSERT_ALIGNED_DOUBLE;
1732 		    tmp549 = (K980785280 * tmp547) - (K195090322 * tmp548);
1733 		    tmp552 = (K980785280 * tmp550) + (K195090322 * tmp551);
1734 		    tmp553 = tmp549 + tmp552;
1735 		    tmp569 = tmp549 - tmp552;
1736 		    tmp556 = tmp514 + tmp517;
1737 		    tmp557 = tmp468 + tmp461;
1738 		    tmp558 = tmp556 + tmp557;
1739 		    tmp568 = tmp556 - tmp557;
1740 	       }
1741 	       {
1742 		    fftw_real tmp554;
1743 		    fftw_real tmp562;
1744 		    fftw_real tmp543;
1745 		    fftw_real tmp555;
1746 		    ASSERT_ALIGNED_DOUBLE;
1747 		    tmp554 = tmp546 - tmp553;
1748 		    tmp562 = tmp558 - tmp561;
1749 		    tmp543 = c_re(W[16]);
1750 		    tmp555 = c_im(W[16]);
1751 		    X[17 * iostride] =
1752 			(tmp543 * tmp554) + (tmp555 * tmp562);
1753 		    Y[-14 * iostride] =
1754 			(tmp543 * tmp562) - (tmp555 * tmp554);
1755 	       }
1756 	       {
1757 		    fftw_real tmp564;
1758 		    fftw_real tmp566;
1759 		    fftw_real tmp563;
1760 		    fftw_real tmp565;
1761 		    ASSERT_ALIGNED_DOUBLE;
1762 		    tmp564 = tmp546 + tmp553;
1763 		    tmp566 = tmp558 + tmp561;
1764 		    tmp563 = c_re(W[0]);
1765 		    tmp565 = c_im(W[0]);
1766 		    X[iostride] = (tmp563 * tmp564) + (tmp565 * tmp566);
1767 		    Y[-30 * iostride] =
1768 			(tmp563 * tmp566) - (tmp565 * tmp564);
1769 	       }
1770 	       {
1771 		    fftw_real tmp570;
1772 		    fftw_real tmp574;
1773 		    fftw_real tmp567;
1774 		    fftw_real tmp571;
1775 		    ASSERT_ALIGNED_DOUBLE;
1776 		    tmp570 = tmp568 - tmp569;
1777 		    tmp574 = tmp572 - tmp573;
1778 		    tmp567 = c_re(W[24]);
1779 		    tmp571 = c_im(W[24]);
1780 		    Y[-6 * iostride] =
1781 			(tmp567 * tmp570) - (tmp571 * tmp574);
1782 		    X[25 * iostride] =
1783 			(tmp571 * tmp570) + (tmp567 * tmp574);
1784 	       }
1785 	       {
1786 		    fftw_real tmp576;
1787 		    fftw_real tmp578;
1788 		    fftw_real tmp575;
1789 		    fftw_real tmp577;
1790 		    ASSERT_ALIGNED_DOUBLE;
1791 		    tmp576 = tmp568 + tmp569;
1792 		    tmp578 = tmp572 + tmp573;
1793 		    tmp575 = c_re(W[8]);
1794 		    tmp577 = c_im(W[8]);
1795 		    Y[-22 * iostride] =
1796 			(tmp575 * tmp576) - (tmp577 * tmp578);
1797 		    X[9 * iostride] =
1798 			(tmp577 * tmp576) + (tmp575 * tmp578);
1799 	       }
1800 	  }
1801 	  {
1802 	       fftw_real tmp470;
1803 	       fftw_real tmp536;
1804 	       fftw_real tmp525;
1805 	       fftw_real tmp537;
1806 	       fftw_real tmp509;
1807 	       fftw_real tmp533;
1808 	       fftw_real tmp522;
1809 	       fftw_real tmp532;
1810 	       ASSERT_ALIGNED_DOUBLE;
1811 	       {
1812 		    fftw_real tmp454;
1813 		    fftw_real tmp469;
1814 		    fftw_real tmp523;
1815 		    fftw_real tmp524;
1816 		    ASSERT_ALIGNED_DOUBLE;
1817 		    tmp454 = tmp446 - tmp453;
1818 		    tmp469 = tmp461 - tmp468;
1819 		    tmp470 = tmp454 + tmp469;
1820 		    tmp536 = tmp454 - tmp469;
1821 		    tmp523 = (K831469612 * tmp481) + (K555570233 * tmp488);
1822 		    tmp524 = (K555570233 * tmp507) - (K831469612 * tmp500);
1823 		    tmp525 = tmp523 + tmp524;
1824 		    tmp537 = tmp524 - tmp523;
1825 	       }
1826 	       {
1827 		    fftw_real tmp489;
1828 		    fftw_real tmp508;
1829 		    fftw_real tmp518;
1830 		    fftw_real tmp521;
1831 		    ASSERT_ALIGNED_DOUBLE;
1832 		    tmp489 = (K555570233 * tmp481) - (K831469612 * tmp488);
1833 		    tmp508 = (K555570233 * tmp500) + (K831469612 * tmp507);
1834 		    tmp509 = tmp489 + tmp508;
1835 		    tmp533 = tmp489 - tmp508;
1836 		    tmp518 = tmp514 - tmp517;
1837 		    tmp521 = tmp519 - tmp520;
1838 		    tmp522 = tmp518 + tmp521;
1839 		    tmp532 = tmp518 - tmp521;
1840 	       }
1841 	       {
1842 		    fftw_real tmp510;
1843 		    fftw_real tmp526;
1844 		    fftw_real tmp443;
1845 		    fftw_real tmp511;
1846 		    ASSERT_ALIGNED_DOUBLE;
1847 		    tmp510 = tmp470 - tmp509;
1848 		    tmp526 = tmp522 - tmp525;
1849 		    tmp443 = c_re(W[20]);
1850 		    tmp511 = c_im(W[20]);
1851 		    X[21 * iostride] =
1852 			(tmp443 * tmp510) + (tmp511 * tmp526);
1853 		    Y[-10 * iostride] =
1854 			(tmp443 * tmp526) - (tmp511 * tmp510);
1855 	       }
1856 	       {
1857 		    fftw_real tmp528;
1858 		    fftw_real tmp530;
1859 		    fftw_real tmp527;
1860 		    fftw_real tmp529;
1861 		    ASSERT_ALIGNED_DOUBLE;
1862 		    tmp528 = tmp470 + tmp509;
1863 		    tmp530 = tmp522 + tmp525;
1864 		    tmp527 = c_re(W[4]);
1865 		    tmp529 = c_im(W[4]);
1866 		    X[5 * iostride] =
1867 			(tmp527 * tmp528) + (tmp529 * tmp530);
1868 		    Y[-26 * iostride] =
1869 			(tmp527 * tmp530) - (tmp529 * tmp528);
1870 	       }
1871 	       {
1872 		    fftw_real tmp534;
1873 		    fftw_real tmp538;
1874 		    fftw_real tmp531;
1875 		    fftw_real tmp535;
1876 		    ASSERT_ALIGNED_DOUBLE;
1877 		    tmp534 = tmp532 - tmp533;
1878 		    tmp538 = tmp536 - tmp537;
1879 		    tmp531 = c_re(W[28]);
1880 		    tmp535 = c_im(W[28]);
1881 		    Y[-2 * iostride] =
1882 			(tmp531 * tmp534) - (tmp535 * tmp538);
1883 		    X[29 * iostride] =
1884 			(tmp535 * tmp534) + (tmp531 * tmp538);
1885 	       }
1886 	       {
1887 		    fftw_real tmp540;
1888 		    fftw_real tmp542;
1889 		    fftw_real tmp539;
1890 		    fftw_real tmp541;
1891 		    ASSERT_ALIGNED_DOUBLE;
1892 		    tmp540 = tmp532 + tmp533;
1893 		    tmp542 = tmp536 + tmp537;
1894 		    tmp539 = c_re(W[12]);
1895 		    tmp541 = c_im(W[12]);
1896 		    Y[-18 * iostride] =
1897 			(tmp539 * tmp540) - (tmp541 * tmp542);
1898 		    X[13 * iostride] =
1899 			(tmp541 * tmp540) + (tmp539 * tmp542);
1900 	       }
1901 	  }
1902      }
1903      if (i == m) {
1904 	  fftw_real tmp7;
1905 	  fftw_real tmp123;
1906 	  fftw_real tmp35;
1907 	  fftw_real tmp95;
1908 	  fftw_real tmp82;
1909 	  fftw_real tmp110;
1910 	  fftw_real tmp146;
1911 	  fftw_real tmp165;
1912 	  fftw_real tmp29;
1913 	  fftw_real tmp137;
1914 	  fftw_real tmp141;
1915 	  fftw_real tmp160;
1916 	  fftw_real tmp69;
1917 	  fftw_real tmp73;
1918 	  fftw_real tmp103;
1919 	  fftw_real tmp107;
1920 	  fftw_real tmp14;
1921 	  fftw_real tmp143;
1922 	  fftw_real tmp46;
1923 	  fftw_real tmp109;
1924 	  fftw_real tmp126;
1925 	  fftw_real tmp166;
1926 	  fftw_real tmp77;
1927 	  fftw_real tmp96;
1928 	  fftw_real tmp22;
1929 	  fftw_real tmp132;
1930 	  fftw_real tmp140;
1931 	  fftw_real tmp161;
1932 	  fftw_real tmp58;
1933 	  fftw_real tmp72;
1934 	  fftw_real tmp100;
1935 	  fftw_real tmp106;
1936 	  ASSERT_ALIGNED_DOUBLE;
1937 	  {
1938 	       fftw_real tmp3;
1939 	       fftw_real tmp31;
1940 	       fftw_real tmp81;
1941 	       fftw_real tmp144;
1942 	       fftw_real tmp6;
1943 	       fftw_real tmp78;
1944 	       fftw_real tmp34;
1945 	       fftw_real tmp145;
1946 	       ASSERT_ALIGNED_DOUBLE;
1947 	       {
1948 		    fftw_real tmp1;
1949 		    fftw_real tmp2;
1950 		    fftw_real tmp79;
1951 		    fftw_real tmp80;
1952 		    ASSERT_ALIGNED_DOUBLE;
1953 		    tmp1 = X[0];
1954 		    tmp2 = X[15 * iostride];
1955 		    tmp3 = tmp1 + tmp2;
1956 		    tmp31 = tmp1 - tmp2;
1957 		    tmp79 = Y[0];
1958 		    tmp80 = Y[-15 * iostride];
1959 		    tmp81 = tmp79 + tmp80;
1960 		    tmp144 = tmp79 - tmp80;
1961 	       }
1962 	       {
1963 		    fftw_real tmp4;
1964 		    fftw_real tmp5;
1965 		    fftw_real tmp32;
1966 		    fftw_real tmp33;
1967 		    ASSERT_ALIGNED_DOUBLE;
1968 		    tmp4 = X[8 * iostride];
1969 		    tmp5 = X[7 * iostride];
1970 		    tmp6 = tmp4 + tmp5;
1971 		    tmp78 = tmp4 - tmp5;
1972 		    tmp32 = Y[-8 * iostride];
1973 		    tmp33 = Y[-7 * iostride];
1974 		    tmp34 = tmp32 + tmp33;
1975 		    tmp145 = tmp32 - tmp33;
1976 	       }
1977 	       tmp7 = tmp3 + tmp6;
1978 	       tmp123 = tmp3 - tmp6;
1979 	       tmp35 = tmp31 - tmp34;
1980 	       tmp95 = tmp31 + tmp34;
1981 	       tmp82 = tmp78 + tmp81;
1982 	       tmp110 = tmp81 - tmp78;
1983 	       tmp146 = tmp144 - tmp145;
1984 	       tmp165 = tmp145 + tmp144;
1985 	  }
1986 	  {
1987 	       fftw_real tmp25;
1988 	       fftw_real tmp59;
1989 	       fftw_real tmp67;
1990 	       fftw_real tmp134;
1991 	       fftw_real tmp28;
1992 	       fftw_real tmp64;
1993 	       fftw_real tmp62;
1994 	       fftw_real tmp135;
1995 	       fftw_real tmp133;
1996 	       fftw_real tmp136;
1997 	       ASSERT_ALIGNED_DOUBLE;
1998 	       {
1999 		    fftw_real tmp23;
2000 		    fftw_real tmp24;
2001 		    fftw_real tmp65;
2002 		    fftw_real tmp66;
2003 		    ASSERT_ALIGNED_DOUBLE;
2004 		    tmp23 = X[iostride];
2005 		    tmp24 = X[14 * iostride];
2006 		    tmp25 = tmp23 + tmp24;
2007 		    tmp59 = tmp23 - tmp24;
2008 		    tmp65 = Y[-iostride];
2009 		    tmp66 = Y[-14 * iostride];
2010 		    tmp67 = tmp65 + tmp66;
2011 		    tmp134 = tmp66 - tmp65;
2012 	       }
2013 	       {
2014 		    fftw_real tmp26;
2015 		    fftw_real tmp27;
2016 		    fftw_real tmp60;
2017 		    fftw_real tmp61;
2018 		    ASSERT_ALIGNED_DOUBLE;
2019 		    tmp26 = X[6 * iostride];
2020 		    tmp27 = X[9 * iostride];
2021 		    tmp28 = tmp26 + tmp27;
2022 		    tmp64 = tmp26 - tmp27;
2023 		    tmp60 = Y[-6 * iostride];
2024 		    tmp61 = Y[-9 * iostride];
2025 		    tmp62 = tmp60 + tmp61;
2026 		    tmp135 = tmp60 - tmp61;
2027 	       }
2028 	       tmp29 = tmp25 + tmp28;
2029 	       tmp133 = tmp25 - tmp28;
2030 	       tmp136 = tmp134 - tmp135;
2031 	       tmp137 = tmp133 + tmp136;
2032 	       tmp141 = tmp136 - tmp133;
2033 	       tmp160 = tmp135 + tmp134;
2034 	       {
2035 		    fftw_real tmp63;
2036 		    fftw_real tmp68;
2037 		    fftw_real tmp101;
2038 		    fftw_real tmp102;
2039 		    ASSERT_ALIGNED_DOUBLE;
2040 		    tmp63 = tmp59 - tmp62;
2041 		    tmp68 = tmp64 - tmp67;
2042 		    tmp69 = (K923879532 * tmp63) + (K382683432 * tmp68);
2043 		    tmp73 = (K923879532 * tmp68) - (K382683432 * tmp63);
2044 		    tmp101 = tmp59 + tmp62;
2045 		    tmp102 = tmp64 + tmp67;
2046 		    tmp103 = (K382683432 * tmp101) - (K923879532 * tmp102);
2047 		    tmp107 = (K923879532 * tmp101) + (K382683432 * tmp102);
2048 	       }
2049 	  }
2050 	  {
2051 	       fftw_real tmp10;
2052 	       fftw_real tmp36;
2053 	       fftw_real tmp39;
2054 	       fftw_real tmp125;
2055 	       fftw_real tmp13;
2056 	       fftw_real tmp41;
2057 	       fftw_real tmp44;
2058 	       fftw_real tmp124;
2059 	       ASSERT_ALIGNED_DOUBLE;
2060 	       {
2061 		    fftw_real tmp8;
2062 		    fftw_real tmp9;
2063 		    fftw_real tmp37;
2064 		    fftw_real tmp38;
2065 		    ASSERT_ALIGNED_DOUBLE;
2066 		    tmp8 = X[4 * iostride];
2067 		    tmp9 = X[11 * iostride];
2068 		    tmp10 = tmp8 + tmp9;
2069 		    tmp36 = tmp8 - tmp9;
2070 		    tmp37 = Y[-4 * iostride];
2071 		    tmp38 = Y[-11 * iostride];
2072 		    tmp39 = tmp37 + tmp38;
2073 		    tmp125 = tmp37 - tmp38;
2074 	       }
2075 	       {
2076 		    fftw_real tmp11;
2077 		    fftw_real tmp12;
2078 		    fftw_real tmp42;
2079 		    fftw_real tmp43;
2080 		    ASSERT_ALIGNED_DOUBLE;
2081 		    tmp11 = X[3 * iostride];
2082 		    tmp12 = X[12 * iostride];
2083 		    tmp13 = tmp11 + tmp12;
2084 		    tmp41 = tmp11 - tmp12;
2085 		    tmp42 = Y[-3 * iostride];
2086 		    tmp43 = Y[-12 * iostride];
2087 		    tmp44 = tmp42 + tmp43;
2088 		    tmp124 = tmp43 - tmp42;
2089 	       }
2090 	       {
2091 		    fftw_real tmp40;
2092 		    fftw_real tmp45;
2093 		    fftw_real tmp75;
2094 		    fftw_real tmp76;
2095 		    ASSERT_ALIGNED_DOUBLE;
2096 		    tmp14 = tmp10 + tmp13;
2097 		    tmp143 = tmp10 - tmp13;
2098 		    tmp40 = tmp36 - tmp39;
2099 		    tmp45 = tmp41 - tmp44;
2100 		    tmp46 = K707106781 * (tmp40 + tmp45);
2101 		    tmp109 = K707106781 * (tmp40 - tmp45);
2102 		    tmp126 = tmp124 - tmp125;
2103 		    tmp166 = tmp125 + tmp124;
2104 		    tmp75 = tmp36 + tmp39;
2105 		    tmp76 = tmp41 + tmp44;
2106 		    tmp77 = K707106781 * (tmp75 - tmp76);
2107 		    tmp96 = K707106781 * (tmp75 + tmp76);
2108 	       }
2109 	  }
2110 	  {
2111 	       fftw_real tmp18;
2112 	       fftw_real tmp48;
2113 	       fftw_real tmp56;
2114 	       fftw_real tmp129;
2115 	       fftw_real tmp21;
2116 	       fftw_real tmp53;
2117 	       fftw_real tmp51;
2118 	       fftw_real tmp130;
2119 	       fftw_real tmp128;
2120 	       fftw_real tmp131;
2121 	       ASSERT_ALIGNED_DOUBLE;
2122 	       {
2123 		    fftw_real tmp16;
2124 		    fftw_real tmp17;
2125 		    fftw_real tmp54;
2126 		    fftw_real tmp55;
2127 		    ASSERT_ALIGNED_DOUBLE;
2128 		    tmp16 = X[2 * iostride];
2129 		    tmp17 = X[13 * iostride];
2130 		    tmp18 = tmp16 + tmp17;
2131 		    tmp48 = tmp16 - tmp17;
2132 		    tmp54 = Y[-2 * iostride];
2133 		    tmp55 = Y[-13 * iostride];
2134 		    tmp56 = tmp54 + tmp55;
2135 		    tmp129 = tmp54 - tmp55;
2136 	       }
2137 	       {
2138 		    fftw_real tmp19;
2139 		    fftw_real tmp20;
2140 		    fftw_real tmp49;
2141 		    fftw_real tmp50;
2142 		    ASSERT_ALIGNED_DOUBLE;
2143 		    tmp19 = X[10 * iostride];
2144 		    tmp20 = X[5 * iostride];
2145 		    tmp21 = tmp19 + tmp20;
2146 		    tmp53 = tmp19 - tmp20;
2147 		    tmp49 = Y[-10 * iostride];
2148 		    tmp50 = Y[-5 * iostride];
2149 		    tmp51 = tmp49 + tmp50;
2150 		    tmp130 = tmp49 - tmp50;
2151 	       }
2152 	       tmp22 = tmp18 + tmp21;
2153 	       tmp128 = tmp18 - tmp21;
2154 	       tmp131 = tmp129 - tmp130;
2155 	       tmp132 = tmp128 - tmp131;
2156 	       tmp140 = tmp128 + tmp131;
2157 	       tmp161 = tmp130 + tmp129;
2158 	       {
2159 		    fftw_real tmp52;
2160 		    fftw_real tmp57;
2161 		    fftw_real tmp98;
2162 		    fftw_real tmp99;
2163 		    ASSERT_ALIGNED_DOUBLE;
2164 		    tmp52 = tmp48 - tmp51;
2165 		    tmp57 = tmp53 + tmp56;
2166 		    tmp58 = (K923879532 * tmp52) - (K382683432 * tmp57);
2167 		    tmp72 = (K382683432 * tmp52) + (K923879532 * tmp57);
2168 		    tmp98 = tmp48 + tmp51;
2169 		    tmp99 = tmp56 - tmp53;
2170 		    tmp100 = (K382683432 * tmp98) - (K923879532 * tmp99);
2171 		    tmp106 = (K923879532 * tmp98) + (K382683432 * tmp99);
2172 	       }
2173 	  }
2174 	  {
2175 	       fftw_real tmp15;
2176 	       fftw_real tmp30;
2177 	       fftw_real tmp171;
2178 	       fftw_real tmp172;
2179 	       fftw_real tmp173;
2180 	       fftw_real tmp174;
2181 	       ASSERT_ALIGNED_DOUBLE;
2182 	       tmp15 = tmp7 + tmp14;
2183 	       tmp30 = tmp22 + tmp29;
2184 	       tmp171 = tmp15 - tmp30;
2185 	       tmp172 = tmp166 + tmp165;
2186 	       tmp173 = tmp161 + tmp160;
2187 	       tmp174 = tmp172 - tmp173;
2188 	       X[0] = K2_000000000 * (tmp15 + tmp30);
2189 	       X[16 * iostride] = -(K2_000000000 * (tmp173 + tmp172));
2190 	       X[8 * iostride] = K1_414213562 * (tmp171 - tmp174);
2191 	       X[24 * iostride] = -(K1_414213562 * (tmp171 + tmp174));
2192 	  }
2193 	  {
2194 	       fftw_real tmp163;
2195 	       fftw_real tmp169;
2196 	       fftw_real tmp168;
2197 	       fftw_real tmp170;
2198 	       ASSERT_ALIGNED_DOUBLE;
2199 	       {
2200 		    fftw_real tmp159;
2201 		    fftw_real tmp162;
2202 		    fftw_real tmp164;
2203 		    fftw_real tmp167;
2204 		    ASSERT_ALIGNED_DOUBLE;
2205 		    tmp159 = tmp7 - tmp14;
2206 		    tmp162 = tmp160 - tmp161;
2207 		    tmp163 = tmp159 + tmp162;
2208 		    tmp169 = tmp159 - tmp162;
2209 		    tmp164 = tmp22 - tmp29;
2210 		    tmp167 = tmp165 - tmp166;
2211 		    tmp168 = tmp164 + tmp167;
2212 		    tmp170 = tmp167 - tmp164;
2213 	       }
2214 	       X[4 * iostride] =
2215 		   (K1_847759065 * tmp163) - (K765366864 * tmp168);
2216 	       X[20 * iostride] =
2217 		   -((K765366864 * tmp163) + (K1_847759065 * tmp168));
2218 	       X[12 * iostride] =
2219 		   (K765366864 * tmp169) - (K1_847759065 * tmp170);
2220 	       X[28 * iostride] =
2221 		   -((K1_847759065 * tmp169) + (K765366864 * tmp170));
2222 	  }
2223 	  {
2224 	       fftw_real tmp71;
2225 	       fftw_real tmp85;
2226 	       fftw_real tmp84;
2227 	       fftw_real tmp86;
2228 	       ASSERT_ALIGNED_DOUBLE;
2229 	       {
2230 		    fftw_real tmp47;
2231 		    fftw_real tmp70;
2232 		    fftw_real tmp74;
2233 		    fftw_real tmp83;
2234 		    ASSERT_ALIGNED_DOUBLE;
2235 		    tmp47 = tmp35 + tmp46;
2236 		    tmp70 = tmp58 + tmp69;
2237 		    tmp71 = tmp47 + tmp70;
2238 		    tmp85 = tmp47 - tmp70;
2239 		    tmp74 = tmp72 + tmp73;
2240 		    tmp83 = tmp77 + tmp82;
2241 		    tmp84 = tmp74 + tmp83;
2242 		    tmp86 = tmp83 - tmp74;
2243 	       }
2244 	       X[iostride] = (K1_990369453 * tmp71) - (K196034280 * tmp84);
2245 	       X[17 * iostride] =
2246 		   -((K196034280 * tmp71) + (K1_990369453 * tmp84));
2247 	       X[9 * iostride] =
2248 		   (K1_268786568 * tmp85) - (K1_546020906 * tmp86);
2249 	       X[25 * iostride] =
2250 		   -((K1_546020906 * tmp85) + (K1_268786568 * tmp86));
2251 	  }
2252 	  {
2253 	       fftw_real tmp89;
2254 	       fftw_real tmp93;
2255 	       fftw_real tmp92;
2256 	       fftw_real tmp94;
2257 	       ASSERT_ALIGNED_DOUBLE;
2258 	       {
2259 		    fftw_real tmp87;
2260 		    fftw_real tmp88;
2261 		    fftw_real tmp90;
2262 		    fftw_real tmp91;
2263 		    ASSERT_ALIGNED_DOUBLE;
2264 		    tmp87 = tmp35 - tmp46;
2265 		    tmp88 = tmp73 - tmp72;
2266 		    tmp89 = tmp87 + tmp88;
2267 		    tmp93 = tmp87 - tmp88;
2268 		    tmp90 = tmp58 - tmp69;
2269 		    tmp91 = tmp82 - tmp77;
2270 		    tmp92 = tmp90 + tmp91;
2271 		    tmp94 = tmp91 - tmp90;
2272 	       }
2273 	       X[5 * iostride] =
2274 		   (K1_763842528 * tmp89) - (K942793473 * tmp92);
2275 	       X[21 * iostride] =
2276 		   -((K942793473 * tmp89) + (K1_763842528 * tmp92));
2277 	       X[13 * iostride] =
2278 		   (K580569354 * tmp93) - (K1_913880671 * tmp94);
2279 	       X[29 * iostride] =
2280 		   -((K1_913880671 * tmp93) + (K580569354 * tmp94));
2281 	  }
2282 	  {
2283 	       fftw_real tmp105;
2284 	       fftw_real tmp113;
2285 	       fftw_real tmp112;
2286 	       fftw_real tmp114;
2287 	       ASSERT_ALIGNED_DOUBLE;
2288 	       {
2289 		    fftw_real tmp97;
2290 		    fftw_real tmp104;
2291 		    fftw_real tmp108;
2292 		    fftw_real tmp111;
2293 		    ASSERT_ALIGNED_DOUBLE;
2294 		    tmp97 = tmp95 - tmp96;
2295 		    tmp104 = tmp100 + tmp103;
2296 		    tmp105 = tmp97 + tmp104;
2297 		    tmp113 = tmp97 - tmp104;
2298 		    tmp108 = tmp106 - tmp107;
2299 		    tmp111 = tmp109 + tmp110;
2300 		    tmp112 = tmp108 + tmp111;
2301 		    tmp114 = tmp111 - tmp108;
2302 	       }
2303 	       X[3 * iostride] =
2304 		   (K1_913880671 * tmp105) - (K580569354 * tmp112);
2305 	       X[19 * iostride] =
2306 		   -((K580569354 * tmp105) + (K1_913880671 * tmp112));
2307 	       X[11 * iostride] =
2308 		   (K942793473 * tmp113) - (K1_763842528 * tmp114);
2309 	       X[27 * iostride] =
2310 		   -((K1_763842528 * tmp113) + (K942793473 * tmp114));
2311 	  }
2312 	  {
2313 	       fftw_real tmp117;
2314 	       fftw_real tmp121;
2315 	       fftw_real tmp120;
2316 	       fftw_real tmp122;
2317 	       ASSERT_ALIGNED_DOUBLE;
2318 	       {
2319 		    fftw_real tmp115;
2320 		    fftw_real tmp116;
2321 		    fftw_real tmp118;
2322 		    fftw_real tmp119;
2323 		    ASSERT_ALIGNED_DOUBLE;
2324 		    tmp115 = tmp95 + tmp96;
2325 		    tmp116 = tmp106 + tmp107;
2326 		    tmp117 = tmp115 - tmp116;
2327 		    tmp121 = tmp115 + tmp116;
2328 		    tmp118 = tmp100 - tmp103;
2329 		    tmp119 = tmp110 - tmp109;
2330 		    tmp120 = tmp118 + tmp119;
2331 		    tmp122 = tmp119 - tmp118;
2332 	       }
2333 	       X[7 * iostride] =
2334 		   (K1_546020906 * tmp117) - (K1_268786568 * tmp120);
2335 	       X[23 * iostride] =
2336 		   -((K1_268786568 * tmp117) + (K1_546020906 * tmp120));
2337 	       X[15 * iostride] =
2338 		   (K196034280 * tmp121) - (K1_990369453 * tmp122);
2339 	       X[31 * iostride] =
2340 		   -((K1_990369453 * tmp121) + (K196034280 * tmp122));
2341 	  }
2342 	  {
2343 	       fftw_real tmp139;
2344 	       fftw_real tmp149;
2345 	       fftw_real tmp148;
2346 	       fftw_real tmp150;
2347 	       ASSERT_ALIGNED_DOUBLE;
2348 	       {
2349 		    fftw_real tmp127;
2350 		    fftw_real tmp138;
2351 		    fftw_real tmp142;
2352 		    fftw_real tmp147;
2353 		    ASSERT_ALIGNED_DOUBLE;
2354 		    tmp127 = tmp123 + tmp126;
2355 		    tmp138 = K707106781 * (tmp132 + tmp137);
2356 		    tmp139 = tmp127 + tmp138;
2357 		    tmp149 = tmp127 - tmp138;
2358 		    tmp142 = K707106781 * (tmp140 + tmp141);
2359 		    tmp147 = tmp143 + tmp146;
2360 		    tmp148 = tmp142 + tmp147;
2361 		    tmp150 = tmp147 - tmp142;
2362 	       }
2363 	       X[2 * iostride] =
2364 		   (K1_961570560 * tmp139) - (K390180644 * tmp148);
2365 	       X[18 * iostride] =
2366 		   -((K390180644 * tmp139) + (K1_961570560 * tmp148));
2367 	       X[10 * iostride] =
2368 		   (K1_111140466 * tmp149) - (K1_662939224 * tmp150);
2369 	       X[26 * iostride] =
2370 		   -((K1_662939224 * tmp149) + (K1_111140466 * tmp150));
2371 	  }
2372 	  {
2373 	       fftw_real tmp153;
2374 	       fftw_real tmp157;
2375 	       fftw_real tmp156;
2376 	       fftw_real tmp158;
2377 	       ASSERT_ALIGNED_DOUBLE;
2378 	       {
2379 		    fftw_real tmp151;
2380 		    fftw_real tmp152;
2381 		    fftw_real tmp154;
2382 		    fftw_real tmp155;
2383 		    ASSERT_ALIGNED_DOUBLE;
2384 		    tmp151 = tmp123 - tmp126;
2385 		    tmp152 = K707106781 * (tmp141 - tmp140);
2386 		    tmp153 = tmp151 + tmp152;
2387 		    tmp157 = tmp151 - tmp152;
2388 		    tmp154 = K707106781 * (tmp132 - tmp137);
2389 		    tmp155 = tmp146 - tmp143;
2390 		    tmp156 = tmp154 + tmp155;
2391 		    tmp158 = tmp155 - tmp154;
2392 	       }
2393 	       X[6 * iostride] =
2394 		   (K1_662939224 * tmp153) - (K1_111140466 * tmp156);
2395 	       X[22 * iostride] =
2396 		   -((K1_111140466 * tmp153) + (K1_662939224 * tmp156));
2397 	       X[14 * iostride] =
2398 		   (K390180644 * tmp157) - (K1_961570560 * tmp158);
2399 	       X[30 * iostride] =
2400 		   -((K1_961570560 * tmp157) + (K390180644 * tmp158));
2401 	  }
2402      }
2403 }
2404 
/*
 * Twiddle ordering table handed to fftw_hc2hc_backward_32_desc below:
 * the 31 consecutive integers 1 through 31, in ascending order.
 */
static const int twiddle_order[] = {
     1, 2, 3, 4, 5, 6, 7, 8,
     9, 10, 11, 12, 13, 14, 15, 16,
     17, 18, 19, 20, 21, 22, 23, 24,
     25, 26, 27, 28, 29, 30, 31
};
/*
 * Externally visible descriptor for the fftw_hc2hc_backward_32 codelet
 * defined above.
 *
 * The initializer is positional, so the order of the values must match
 * the member order of fftw_codelet_desc, whose declaration is not in this
 * file.  NOTE(review): the per-value notes below are inferred from the
 * values themselves -- confirm them against that declaration.
 */
fftw_codelet_desc fftw_hc2hc_backward_32_desc = {
     /* The codelet's name as a string. */
     "fftw_hc2hc_backward_32",
     /* Address of the codelet, cast to an unprototyped function pointer. */
     (void (*)()) fftw_hc2hc_backward_32,
     /* Presumably the transform size (genfft was run with
        "-hc2hc-backward 32") -- confirm. */
     32,
     FFTW_BACKWARD,
     FFTW_HC2HC,
     /* NOTE(review): the meaning of 718 is not evident from this file. */
     718,
     /* Equals the number of entries in twiddle_order. */
     31,
     twiddle_order,
};
2418