1 /*
2  * Copyright (c) 1997-1999, 2003 Massachusetts Institute of Technology
3  *
4  * This program is free software; you can redistribute it and/or modify
5  * it under the terms of the GNU General Public License as published by
6  * the Free Software Foundation; either version 2 of the License, or
7  * (at your option) any later version.
8  *
9  * This program is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12  * GNU General Public License for more details.
13  *
14  * You should have received a copy of the GNU General Public License
15  * along with this program; if not, write to the Free Software
16  * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
17  *
18  */
19 
20 /* This file was automatically generated --- DO NOT EDIT */
21 /* Generated on Mon Mar 24 02:06:14 EST 2003 */
22 
23 #include "fftw-int.h"
24 #include "fftw.h"
25 
26 /* Generated by: /homee/stevenj/cvs/fftw/gensrc/genfft -magic-alignment-check -magic-twiddle-load-all -magic-variables 4 -magic-loopi -real2hc 128 */
27 
28 /*
29  * This function contains 956 FP additions, 330 FP multiplications,
30  * (or, 812 additions, 186 multiplications, 144 fused multiply/add),
31  * 156 stack variables, and 256 memory accesses
32  */
/*
 * Numeric constants referenced by the codelet below (for example
 * K707106781, K923879532 and K382683432 appear in its butterflies).
 * Each name is the letter K followed by the first nine decimal digits of
 * the value.  Every value is the sine or cosine of a multiple of pi/64;
 * the angle is noted next to each literal.
 */
33 static const fftw_real K242980179 =
34 FFTW_KONST(+0.242980179903263889948274162077471118320990783); /* sin(5*pi/64) */
35 static const fftw_real K970031253 =
36 FFTW_KONST(+0.970031253194543992603984207286100251456865962); /* cos(5*pi/64) */
37 static const fftw_real K514102744 =
38 FFTW_KONST(+0.514102744193221726593693838968815772608049120); /* sin(11*pi/64) */
39 static const fftw_real K857728610 =
40 FFTW_KONST(+0.857728610000272069902269984284770137042490799); /* cos(11*pi/64) */
41 static const fftw_real K595699304 =
42 FFTW_KONST(+0.595699304492433343467036528829969889511926338); /* sin(13*pi/64) */
43 static const fftw_real K803207531 =
44 FFTW_KONST(+0.803207531480644909806676512963141923879569427); /* cos(13*pi/64) */
45 static const fftw_real K146730474 =
46 FFTW_KONST(+0.146730474455361751658850129646717819706215317); /* sin(3*pi/64) */
47 static const fftw_real K989176509 =
48 FFTW_KONST(+0.989176509964780973451673738016243063983689533); /* cos(3*pi/64) */
49 static const fftw_real K471396736 =
50 FFTW_KONST(+0.471396736825997648556387625905254377657460319); /* sin(5*pi/32) */
51 static const fftw_real K881921264 =
52 FFTW_KONST(+0.881921264348355029712756863660388349508442621); /* cos(5*pi/32) */
53 static const fftw_real K956940335 =
54 FFTW_KONST(+0.956940335732208864935797886980269969482849206); /* cos(3*pi/32) */
55 static const fftw_real K290284677 =
56 FFTW_KONST(+0.290284677254462367636192375817395274691476278); /* sin(3*pi/32) */
57 static const fftw_real K336889853 =
58 FFTW_KONST(+0.336889853392220050689253212619147570477766780); /* sin(7*pi/64) */
59 static const fftw_real K941544065 =
60 FFTW_KONST(+0.941544065183020778412509402599502357185589796); /* cos(7*pi/64) */
61 static const fftw_real K427555093 =
62 FFTW_KONST(+0.427555093430282094320966856888798534304578629); /* sin(9*pi/64) */
63 static const fftw_real K903989293 =
64 FFTW_KONST(+0.903989293123443331586200297230537048710132025); /* cos(9*pi/64) */
65 static const fftw_real K634393284 =
66 FFTW_KONST(+0.634393284163645498215171613225493370675687095); /* sin(7*pi/32) */
67 static const fftw_real K773010453 =
68 FFTW_KONST(+0.773010453362736960810906609758469800971041293); /* cos(7*pi/32) */
69 static const fftw_real K671558954 =
70 FFTW_KONST(+0.671558954847018400625376850427421803228750632); /* sin(15*pi/64) */
71 static const fftw_real K740951125 =
72 FFTW_KONST(+0.740951125354959091175616897495162729728955309); /* cos(15*pi/64) */
73 static const fftw_real K049067674 =
74 FFTW_KONST(+0.049067674327418014254954976942682658314745363); /* sin(pi/64) */
75 static const fftw_real K998795456 =
76 FFTW_KONST(+0.998795456205172392714771604759100694443203615); /* cos(pi/64) */
77 static const fftw_real K995184726 =
78 FFTW_KONST(+0.995184726672196886244836953109479921575474869); /* cos(pi/32) */
79 static const fftw_real K098017140 =
80 FFTW_KONST(+0.098017140329560601994195563888641845861136673); /* sin(pi/32) */
81 static const fftw_real K555570233 =
82 FFTW_KONST(+0.555570233019602224742830813948532874374937191); /* sin(3*pi/16) */
83 static const fftw_real K831469612 =
84 FFTW_KONST(+0.831469612302545237078788377617905756738560812); /* cos(3*pi/16) */
85 static const fftw_real K195090322 =
86 FFTW_KONST(+0.195090322016128267848284868477022240927691618); /* sin(pi/16) */
87 static const fftw_real K980785280 =
88 FFTW_KONST(+0.980785280403230449126182236134239036973933731); /* cos(pi/16) */
89 static const fftw_real K382683432 =
90 FFTW_KONST(+0.382683432365089771728459984030398866761344562); /* sin(pi/8) */
91 static const fftw_real K923879532 =
92 FFTW_KONST(+0.923879532511286756128183189396788286822416626); /* cos(pi/8) */
93 static const fftw_real K707106781 =
94 FFTW_KONST(+0.707106781186547524400844362104849039284835938); /* cos(pi/4) = sqrt(2)/2 */
95 
96 /*
97  * Generator Id's :
98  * $Id: exprdag.ml,v 1.43 2003/03/16 23:43:46 stevenj Exp $
99  * $Id: fft.ml,v 1.44 2003/03/16 23:43:46 stevenj Exp $
100  * $Id: to_c.ml,v 1.26 2003/03/16 23:43:46 stevenj Exp $
101  */
102 
fftw_real2hc_128(const fftw_real * input,fftw_real * real_output,fftw_real * imag_output,int istride,int real_ostride,int imag_ostride)103 void fftw_real2hc_128(const fftw_real *input, fftw_real *real_output,
104 		      fftw_real *imag_output, int istride,
105 		      int real_ostride, int imag_ostride)
106 {
107      fftw_real tmp783;
108      fftw_real tmp15;
109      fftw_real tmp625;
110      fftw_real tmp862;
111      fftw_real tmp131;
112      fftw_real tmp461;
113      fftw_real tmp364;
114      fftw_real tmp530;
115      fftw_real tmp46;
116      fftw_real tmp626;
117      fftw_real tmp790;
118      fftw_real tmp865;
119      fftw_real tmp148;
120      fftw_real tmp369;
121      fftw_real tmp466;
122      fftw_real tmp533;
123      fftw_real tmp30;
124      fftw_real tmp708;
125      fftw_real tmp786;
126      fftw_real tmp863;
127      fftw_real tmp138;
128      fftw_real tmp531;
129      fftw_real tmp367;
130      fftw_real tmp462;
131      fftw_real tmp307;
132      fftw_real tmp419;
133      fftw_real tmp509;
134      fftw_real tmp583;
135      fftw_real tmp352;
136      fftw_real tmp423;
137      fftw_real tmp520;
138      fftw_real tmp587;
139      fftw_real tmp677;
140      fftw_real tmp747;
141      fftw_real tmp841;
142      fftw_real tmp915;
143      fftw_real tmp852;
144      fftw_real tmp919;
145      fftw_real tmp700;
146      fftw_real tmp748;
147      fftw_real tmp750;
148      fftw_real tmp692;
149      fftw_real tmp701;
150      fftw_real tmp751;
151      fftw_real tmp855;
152      fftw_real tmp916;
153      fftw_real tmp848;
154      fftw_real tmp918;
155      fftw_real tmp324;
156      fftw_real tmp353;
157      fftw_real tmp512;
158      fftw_real tmp521;
159      fftw_real tmp515;
160      fftw_real tmp522;
161      fftw_real tmp341;
162      fftw_real tmp354;
163      fftw_real tmp61;
164      fftw_real tmp627;
165      fftw_real tmp793;
166      fftw_real tmp866;
167      fftw_real tmp157;
168      fftw_real tmp370;
169      fftw_real tmp469;
170      fftw_real tmp534;
171      fftw_real tmp109;
172      fftw_real tmp633;
173      fftw_real tmp809;
174      fftw_real tmp900;
175      fftw_real tmp812;
176      fftw_real tmp901;
177      fftw_real tmp484;
178      fftw_real tmp569;
179      fftw_real tmp193;
180      fftw_real tmp405;
181      fftw_real tmp481;
182      fftw_real tmp568;
183      fftw_real tmp200;
184      fftw_real tmp404;
185      fftw_real tmp124;
186      fftw_real tmp634;
187      fftw_real tmp78;
188      fftw_real tmp630;
189      fftw_real tmp800;
190      fftw_real tmp904;
191      fftw_real tmp803;
192      fftw_real tmp903;
193      fftw_real tmp477;
194      fftw_real tmp571;
195      fftw_real tmp172;
196      fftw_real tmp407;
197      fftw_real tmp474;
198      fftw_real tmp572;
199      fftw_real tmp179;
200      fftw_real tmp408;
201      fftw_real tmp93;
202      fftw_real tmp631;
203      fftw_real tmp230;
204      fftw_real tmp415;
205      fftw_real tmp490;
206      fftw_real tmp579;
207      fftw_real tmp275;
208      fftw_real tmp413;
209      fftw_real tmp501;
210      fftw_real tmp577;
211      fftw_real tmp644;
212      fftw_real tmp740;
213      fftw_real tmp820;
214      fftw_real tmp911;
215      fftw_real tmp831;
216      fftw_real tmp909;
217      fftw_real tmp667;
218      fftw_real tmp741;
219      fftw_real tmp743;
220      fftw_real tmp659;
221      fftw_real tmp668;
222      fftw_real tmp744;
223      fftw_real tmp834;
224      fftw_real tmp912;
225      fftw_real tmp827;
226      fftw_real tmp908;
227      fftw_real tmp247;
228      fftw_real tmp276;
229      fftw_real tmp493;
230      fftw_real tmp502;
231      fftw_real tmp496;
232      fftw_real tmp503;
233      fftw_real tmp264;
234      fftw_real tmp277;
235      ASSERT_ALIGNED_DOUBLE;
236      {
237 	  fftw_real tmp3;
238 	  fftw_real tmp127;
239 	  fftw_real tmp13;
240 	  fftw_real tmp129;
241 	  fftw_real tmp6;
242 	  fftw_real tmp363;
243 	  fftw_real tmp10;
244 	  fftw_real tmp128;
245 	  ASSERT_ALIGNED_DOUBLE;
246 	  {
247 	       fftw_real tmp1;
248 	       fftw_real tmp2;
249 	       fftw_real tmp11;
250 	       fftw_real tmp12;
251 	       ASSERT_ALIGNED_DOUBLE;
252 	       tmp1 = input[0];
253 	       tmp2 = input[64 * istride];
254 	       tmp3 = tmp1 + tmp2;
255 	       tmp127 = tmp1 - tmp2;
256 	       tmp11 = input[112 * istride];
257 	       tmp12 = input[48 * istride];
258 	       tmp13 = tmp11 + tmp12;
259 	       tmp129 = tmp11 - tmp12;
260 	  }
261 	  {
262 	       fftw_real tmp4;
263 	       fftw_real tmp5;
264 	       fftw_real tmp8;
265 	       fftw_real tmp9;
266 	       ASSERT_ALIGNED_DOUBLE;
267 	       tmp4 = input[32 * istride];
268 	       tmp5 = input[96 * istride];
269 	       tmp6 = tmp4 + tmp5;
270 	       tmp363 = tmp4 - tmp5;
271 	       tmp8 = input[16 * istride];
272 	       tmp9 = input[80 * istride];
273 	       tmp10 = tmp8 + tmp9;
274 	       tmp128 = tmp8 - tmp9;
275 	  }
276 	  {
277 	       fftw_real tmp7;
278 	       fftw_real tmp14;
279 	       fftw_real tmp130;
280 	       fftw_real tmp362;
281 	       ASSERT_ALIGNED_DOUBLE;
282 	       tmp783 = tmp3 - tmp6;
283 	       tmp7 = tmp3 + tmp6;
284 	       tmp14 = tmp10 + tmp13;
285 	       tmp15 = tmp7 + tmp14;
286 	       tmp625 = tmp7 - tmp14;
287 	       tmp862 = tmp13 - tmp10;
288 	       tmp130 = K707106781 * (tmp128 + tmp129);
289 	       tmp131 = tmp127 + tmp130;
290 	       tmp461 = tmp127 - tmp130;
291 	       tmp362 = K707106781 * (tmp129 - tmp128);
292 	       tmp364 = tmp362 - tmp363;
293 	       tmp530 = tmp363 + tmp362;
294 	  }
295      }
296      {
297 	  fftw_real tmp34;
298 	  fftw_real tmp140;
299 	  fftw_real tmp37;
300 	  fftw_real tmp146;
301 	  fftw_real tmp41;
302 	  fftw_real tmp145;
303 	  fftw_real tmp143;
304 	  fftw_real tmp44;
305 	  ASSERT_ALIGNED_DOUBLE;
306 	  {
307 	       fftw_real tmp32;
308 	       fftw_real tmp33;
309 	       fftw_real tmp35;
310 	       fftw_real tmp36;
311 	       ASSERT_ALIGNED_DOUBLE;
312 	       tmp32 = input[4 * istride];
313 	       tmp33 = input[68 * istride];
314 	       tmp34 = tmp32 + tmp33;
315 	       tmp140 = tmp32 - tmp33;
316 	       tmp35 = input[36 * istride];
317 	       tmp36 = input[100 * istride];
318 	       tmp37 = tmp35 + tmp36;
319 	       tmp146 = tmp35 - tmp36;
320 	       {
321 		    fftw_real tmp39;
322 		    fftw_real tmp40;
323 		    fftw_real tmp141;
324 		    fftw_real tmp42;
325 		    fftw_real tmp43;
326 		    fftw_real tmp142;
327 		    ASSERT_ALIGNED_DOUBLE;
328 		    tmp39 = input[20 * istride];
329 		    tmp40 = input[84 * istride];
330 		    tmp141 = tmp39 - tmp40;
331 		    tmp42 = input[116 * istride];
332 		    tmp43 = input[52 * istride];
333 		    tmp142 = tmp42 - tmp43;
334 		    tmp41 = tmp39 + tmp40;
335 		    tmp145 = K707106781 * (tmp142 - tmp141);
336 		    tmp143 = K707106781 * (tmp141 + tmp142);
337 		    tmp44 = tmp42 + tmp43;
338 	       }
339 	  }
340 	  {
341 	       fftw_real tmp38;
342 	       fftw_real tmp45;
343 	       fftw_real tmp788;
344 	       fftw_real tmp789;
345 	       ASSERT_ALIGNED_DOUBLE;
346 	       tmp38 = tmp34 + tmp37;
347 	       tmp45 = tmp41 + tmp44;
348 	       tmp46 = tmp38 + tmp45;
349 	       tmp626 = tmp38 - tmp45;
350 	       tmp788 = tmp34 - tmp37;
351 	       tmp789 = tmp44 - tmp41;
352 	       tmp790 = (K923879532 * tmp788) + (K382683432 * tmp789);
353 	       tmp865 = (K923879532 * tmp789) - (K382683432 * tmp788);
354 	  }
355 	  {
356 	       fftw_real tmp144;
357 	       fftw_real tmp147;
358 	       fftw_real tmp464;
359 	       fftw_real tmp465;
360 	       ASSERT_ALIGNED_DOUBLE;
361 	       tmp144 = tmp140 + tmp143;
362 	       tmp147 = tmp145 - tmp146;
363 	       tmp148 = (K980785280 * tmp144) + (K195090322 * tmp147);
364 	       tmp369 = (K980785280 * tmp147) - (K195090322 * tmp144);
365 	       tmp464 = tmp140 - tmp143;
366 	       tmp465 = tmp146 + tmp145;
367 	       tmp466 = (K831469612 * tmp464) + (K555570233 * tmp465);
368 	       tmp533 = (K831469612 * tmp465) - (K555570233 * tmp464);
369 	  }
370      }
371      {
372 	  fftw_real tmp18;
373 	  fftw_real tmp132;
374 	  fftw_real tmp28;
375 	  fftw_real tmp136;
376 	  fftw_real tmp21;
377 	  fftw_real tmp133;
378 	  fftw_real tmp25;
379 	  fftw_real tmp135;
380 	  ASSERT_ALIGNED_DOUBLE;
381 	  {
382 	       fftw_real tmp16;
383 	       fftw_real tmp17;
384 	       fftw_real tmp26;
385 	       fftw_real tmp27;
386 	       ASSERT_ALIGNED_DOUBLE;
387 	       tmp16 = input[8 * istride];
388 	       tmp17 = input[72 * istride];
389 	       tmp18 = tmp16 + tmp17;
390 	       tmp132 = tmp16 - tmp17;
391 	       tmp26 = input[24 * istride];
392 	       tmp27 = input[88 * istride];
393 	       tmp28 = tmp26 + tmp27;
394 	       tmp136 = tmp26 - tmp27;
395 	  }
396 	  {
397 	       fftw_real tmp19;
398 	       fftw_real tmp20;
399 	       fftw_real tmp23;
400 	       fftw_real tmp24;
401 	       ASSERT_ALIGNED_DOUBLE;
402 	       tmp19 = input[40 * istride];
403 	       tmp20 = input[104 * istride];
404 	       tmp21 = tmp19 + tmp20;
405 	       tmp133 = tmp19 - tmp20;
406 	       tmp23 = input[120 * istride];
407 	       tmp24 = input[56 * istride];
408 	       tmp25 = tmp23 + tmp24;
409 	       tmp135 = tmp23 - tmp24;
410 	  }
411 	  {
412 	       fftw_real tmp22;
413 	       fftw_real tmp29;
414 	       fftw_real tmp784;
415 	       fftw_real tmp785;
416 	       ASSERT_ALIGNED_DOUBLE;
417 	       tmp22 = tmp18 + tmp21;
418 	       tmp29 = tmp25 + tmp28;
419 	       tmp30 = tmp22 + tmp29;
420 	       tmp708 = tmp29 - tmp22;
421 	       tmp784 = tmp18 - tmp21;
422 	       tmp785 = tmp25 - tmp28;
423 	       tmp786 = K707106781 * (tmp784 + tmp785);
424 	       tmp863 = K707106781 * (tmp785 - tmp784);
425 	  }
426 	  {
427 	       fftw_real tmp134;
428 	       fftw_real tmp137;
429 	       fftw_real tmp365;
430 	       fftw_real tmp366;
431 	       ASSERT_ALIGNED_DOUBLE;
432 	       tmp134 = (K923879532 * tmp132) - (K382683432 * tmp133);
433 	       tmp137 = (K923879532 * tmp135) + (K382683432 * tmp136);
434 	       tmp138 = tmp134 + tmp137;
435 	       tmp531 = tmp137 - tmp134;
436 	       tmp365 = (K382683432 * tmp135) - (K923879532 * tmp136);
437 	       tmp366 = (K382683432 * tmp132) + (K923879532 * tmp133);
438 	       tmp367 = tmp365 - tmp366;
439 	       tmp462 = tmp366 + tmp365;
440 	  }
441      }
442      {
443 	  fftw_real tmp283;
444 	  fftw_real tmp671;
445 	  fftw_real tmp347;
446 	  fftw_real tmp672;
447 	  fftw_real tmp290;
448 	  fftw_real tmp344;
449 	  fftw_real tmp674;
450 	  fftw_real tmp675;
451 	  fftw_real tmp697;
452 	  fftw_real tmp698;
453 	  fftw_real tmp298;
454 	  fftw_real tmp350;
455 	  fftw_real tmp838;
456 	  fftw_real tmp694;
457 	  fftw_real tmp695;
458 	  fftw_real tmp305;
459 	  fftw_real tmp349;
460 	  fftw_real tmp839;
461 	  ASSERT_ALIGNED_DOUBLE;
462 	  {
463 	       fftw_real tmp281;
464 	       fftw_real tmp282;
465 	       fftw_real tmp345;
466 	       fftw_real tmp346;
467 	       ASSERT_ALIGNED_DOUBLE;
468 	       tmp281 = input[127 * istride];
469 	       tmp282 = input[63 * istride];
470 	       tmp283 = tmp281 - tmp282;
471 	       tmp671 = tmp281 + tmp282;
472 	       tmp345 = input[31 * istride];
473 	       tmp346 = input[95 * istride];
474 	       tmp347 = tmp345 - tmp346;
475 	       tmp672 = tmp345 + tmp346;
476 	  }
477 	  {
478 	       fftw_real tmp284;
479 	       fftw_real tmp285;
480 	       fftw_real tmp286;
481 	       fftw_real tmp287;
482 	       fftw_real tmp288;
483 	       fftw_real tmp289;
484 	       ASSERT_ALIGNED_DOUBLE;
485 	       tmp284 = input[15 * istride];
486 	       tmp285 = input[79 * istride];
487 	       tmp286 = tmp284 - tmp285;
488 	       tmp287 = input[111 * istride];
489 	       tmp288 = input[47 * istride];
490 	       tmp289 = tmp287 - tmp288;
491 	       tmp290 = K707106781 * (tmp286 + tmp289);
492 	       tmp344 = K707106781 * (tmp289 - tmp286);
493 	       tmp674 = tmp284 + tmp285;
494 	       tmp675 = tmp287 + tmp288;
495 	  }
496 	  {
497 	       fftw_real tmp294;
498 	       fftw_real tmp297;
499 	       fftw_real tmp301;
500 	       fftw_real tmp304;
501 	       ASSERT_ALIGNED_DOUBLE;
502 	       {
503 		    fftw_real tmp292;
504 		    fftw_real tmp293;
505 		    fftw_real tmp295;
506 		    fftw_real tmp296;
507 		    ASSERT_ALIGNED_DOUBLE;
508 		    tmp292 = input[7 * istride];
509 		    tmp293 = input[71 * istride];
510 		    tmp294 = tmp292 - tmp293;
511 		    tmp697 = tmp292 + tmp293;
512 		    tmp295 = input[39 * istride];
513 		    tmp296 = input[103 * istride];
514 		    tmp297 = tmp295 - tmp296;
515 		    tmp698 = tmp295 + tmp296;
516 	       }
517 	       tmp298 = (K923879532 * tmp294) - (K382683432 * tmp297);
518 	       tmp350 = (K382683432 * tmp294) + (K923879532 * tmp297);
519 	       tmp838 = tmp697 - tmp698;
520 	       {
521 		    fftw_real tmp299;
522 		    fftw_real tmp300;
523 		    fftw_real tmp302;
524 		    fftw_real tmp303;
525 		    ASSERT_ALIGNED_DOUBLE;
526 		    tmp299 = input[119 * istride];
527 		    tmp300 = input[55 * istride];
528 		    tmp301 = tmp299 - tmp300;
529 		    tmp694 = tmp299 + tmp300;
530 		    tmp302 = input[23 * istride];
531 		    tmp303 = input[87 * istride];
532 		    tmp304 = tmp302 - tmp303;
533 		    tmp695 = tmp302 + tmp303;
534 	       }
535 	       tmp305 = (K923879532 * tmp301) + (K382683432 * tmp304);
536 	       tmp349 = (K382683432 * tmp301) - (K923879532 * tmp304);
537 	       tmp839 = tmp694 - tmp695;
538 	  }
539 	  {
540 	       fftw_real tmp291;
541 	       fftw_real tmp306;
542 	       fftw_real tmp507;
543 	       fftw_real tmp508;
544 	       ASSERT_ALIGNED_DOUBLE;
545 	       tmp291 = tmp283 + tmp290;
546 	       tmp306 = tmp298 + tmp305;
547 	       tmp307 = tmp291 + tmp306;
548 	       tmp419 = tmp291 - tmp306;
549 	       tmp507 = tmp283 - tmp290;
550 	       tmp508 = tmp350 + tmp349;
551 	       tmp509 = tmp507 + tmp508;
552 	       tmp583 = tmp507 - tmp508;
553 	  }
554 	  {
555 	       fftw_real tmp348;
556 	       fftw_real tmp351;
557 	       fftw_real tmp518;
558 	       fftw_real tmp519;
559 	       ASSERT_ALIGNED_DOUBLE;
560 	       tmp348 = tmp344 - tmp347;
561 	       tmp351 = tmp349 - tmp350;
562 	       tmp352 = tmp348 + tmp351;
563 	       tmp423 = tmp351 - tmp348;
564 	       tmp518 = tmp347 + tmp344;
565 	       tmp519 = tmp305 - tmp298;
566 	       tmp520 = tmp518 + tmp519;
567 	       tmp587 = tmp519 - tmp518;
568 	  }
569 	  {
570 	       fftw_real tmp673;
571 	       fftw_real tmp676;
572 	       fftw_real tmp837;
573 	       fftw_real tmp840;
574 	       ASSERT_ALIGNED_DOUBLE;
575 	       tmp673 = tmp671 + tmp672;
576 	       tmp676 = tmp674 + tmp675;
577 	       tmp677 = tmp673 - tmp676;
578 	       tmp747 = tmp673 + tmp676;
579 	       tmp837 = tmp671 - tmp672;
580 	       tmp840 = K707106781 * (tmp838 + tmp839);
581 	       tmp841 = tmp837 + tmp840;
582 	       tmp915 = tmp837 - tmp840;
583 	  }
584 	  {
585 	       fftw_real tmp850;
586 	       fftw_real tmp851;
587 	       fftw_real tmp696;
588 	       fftw_real tmp699;
589 	       ASSERT_ALIGNED_DOUBLE;
590 	       tmp850 = tmp675 - tmp674;
591 	       tmp851 = K707106781 * (tmp839 - tmp838);
592 	       tmp852 = tmp850 + tmp851;
593 	       tmp919 = tmp851 - tmp850;
594 	       tmp696 = tmp694 + tmp695;
595 	       tmp699 = tmp697 + tmp698;
596 	       tmp700 = tmp696 - tmp699;
597 	       tmp748 = tmp699 + tmp696;
598 	  }
599      }
600      {
601 	  fftw_real tmp310;
602 	  fftw_real tmp842;
603 	  fftw_real tmp680;
604 	  fftw_real tmp322;
605 	  fftw_real tmp334;
606 	  fftw_real tmp336;
607 	  fftw_real tmp690;
608 	  fftw_real tmp846;
609 	  fftw_real tmp327;
610 	  fftw_real tmp845;
611 	  fftw_real tmp687;
612 	  fftw_real tmp339;
613 	  fftw_real tmp317;
614 	  fftw_real tmp319;
615 	  fftw_real tmp683;
616 	  fftw_real tmp843;
617 	  fftw_real tmp510;
618 	  fftw_real tmp511;
619 	  ASSERT_ALIGNED_DOUBLE;
620 	  {
621 	       fftw_real tmp308;
622 	       fftw_real tmp309;
623 	       fftw_real tmp678;
624 	       fftw_real tmp320;
625 	       fftw_real tmp321;
626 	       fftw_real tmp679;
627 	       ASSERT_ALIGNED_DOUBLE;
628 	       tmp308 = input[3 * istride];
629 	       tmp309 = input[67 * istride];
630 	       tmp678 = tmp308 + tmp309;
631 	       tmp320 = input[35 * istride];
632 	       tmp321 = input[99 * istride];
633 	       tmp679 = tmp320 + tmp321;
634 	       tmp310 = tmp308 - tmp309;
635 	       tmp842 = tmp678 - tmp679;
636 	       tmp680 = tmp678 + tmp679;
637 	       tmp322 = tmp320 - tmp321;
638 	  }
639 	  {
640 	       fftw_real tmp330;
641 	       fftw_real tmp688;
642 	       fftw_real tmp333;
643 	       fftw_real tmp689;
644 	       ASSERT_ALIGNED_DOUBLE;
645 	       {
646 		    fftw_real tmp328;
647 		    fftw_real tmp329;
648 		    fftw_real tmp331;
649 		    fftw_real tmp332;
650 		    ASSERT_ALIGNED_DOUBLE;
651 		    tmp328 = input[11 * istride];
652 		    tmp329 = input[75 * istride];
653 		    tmp330 = tmp328 - tmp329;
654 		    tmp688 = tmp328 + tmp329;
655 		    tmp331 = input[107 * istride];
656 		    tmp332 = input[43 * istride];
657 		    tmp333 = tmp331 - tmp332;
658 		    tmp689 = tmp331 + tmp332;
659 	       }
660 	       tmp334 = K707106781 * (tmp330 + tmp333);
661 	       tmp336 = K707106781 * (tmp333 - tmp330);
662 	       tmp690 = tmp688 + tmp689;
663 	       tmp846 = tmp689 - tmp688;
664 	  }
665 	  {
666 	       fftw_real tmp325;
667 	       fftw_real tmp326;
668 	       fftw_real tmp685;
669 	       fftw_real tmp337;
670 	       fftw_real tmp338;
671 	       fftw_real tmp686;
672 	       ASSERT_ALIGNED_DOUBLE;
673 	       tmp325 = input[123 * istride];
674 	       tmp326 = input[59 * istride];
675 	       tmp685 = tmp325 + tmp326;
676 	       tmp337 = input[27 * istride];
677 	       tmp338 = input[91 * istride];
678 	       tmp686 = tmp337 + tmp338;
679 	       tmp327 = tmp325 - tmp326;
680 	       tmp845 = tmp685 - tmp686;
681 	       tmp687 = tmp685 + tmp686;
682 	       tmp339 = tmp337 - tmp338;
683 	  }
684 	  {
685 	       fftw_real tmp313;
686 	       fftw_real tmp681;
687 	       fftw_real tmp316;
688 	       fftw_real tmp682;
689 	       ASSERT_ALIGNED_DOUBLE;
690 	       {
691 		    fftw_real tmp311;
692 		    fftw_real tmp312;
693 		    fftw_real tmp314;
694 		    fftw_real tmp315;
695 		    ASSERT_ALIGNED_DOUBLE;
696 		    tmp311 = input[19 * istride];
697 		    tmp312 = input[83 * istride];
698 		    tmp313 = tmp311 - tmp312;
699 		    tmp681 = tmp311 + tmp312;
700 		    tmp314 = input[115 * istride];
701 		    tmp315 = input[51 * istride];
702 		    tmp316 = tmp314 - tmp315;
703 		    tmp682 = tmp314 + tmp315;
704 	       }
705 	       tmp317 = K707106781 * (tmp313 + tmp316);
706 	       tmp319 = K707106781 * (tmp316 - tmp313);
707 	       tmp683 = tmp681 + tmp682;
708 	       tmp843 = tmp682 - tmp681;
709 	  }
710 	  {
711 	       fftw_real tmp684;
712 	       fftw_real tmp691;
713 	       fftw_real tmp853;
714 	       fftw_real tmp854;
715 	       ASSERT_ALIGNED_DOUBLE;
716 	       tmp750 = tmp680 + tmp683;
717 	       tmp684 = tmp680 - tmp683;
718 	       tmp691 = tmp687 - tmp690;
719 	       tmp692 = K707106781 * (tmp684 + tmp691);
720 	       tmp701 = K707106781 * (tmp691 - tmp684);
721 	       tmp751 = tmp687 + tmp690;
722 	       tmp853 = (K923879532 * tmp843) - (K382683432 * tmp842);
723 	       tmp854 = (K382683432 * tmp845) + (K923879532 * tmp846);
724 	       tmp855 = tmp853 + tmp854;
725 	       tmp916 = tmp854 - tmp853;
726 	  }
727 	  {
728 	       fftw_real tmp844;
729 	       fftw_real tmp847;
730 	       fftw_real tmp318;
731 	       fftw_real tmp323;
732 	       ASSERT_ALIGNED_DOUBLE;
733 	       tmp844 = (K923879532 * tmp842) + (K382683432 * tmp843);
734 	       tmp847 = (K923879532 * tmp845) - (K382683432 * tmp846);
735 	       tmp848 = tmp844 + tmp847;
736 	       tmp918 = tmp847 - tmp844;
737 	       tmp318 = tmp310 + tmp317;
738 	       tmp323 = tmp319 - tmp322;
739 	       tmp324 = (K980785280 * tmp318) + (K195090322 * tmp323);
740 	       tmp353 = (K980785280 * tmp323) - (K195090322 * tmp318);
741 	  }
742 	  tmp510 = tmp310 - tmp317;
743 	  tmp511 = tmp322 + tmp319;
744 	  tmp512 = (K831469612 * tmp510) + (K555570233 * tmp511);
745 	  tmp521 = (K831469612 * tmp511) - (K555570233 * tmp510);
746 	  {
747 	       fftw_real tmp513;
748 	       fftw_real tmp514;
749 	       fftw_real tmp335;
750 	       fftw_real tmp340;
751 	       ASSERT_ALIGNED_DOUBLE;
752 	       tmp513 = tmp327 - tmp334;
753 	       tmp514 = tmp339 + tmp336;
754 	       tmp515 = (K831469612 * tmp513) - (K555570233 * tmp514);
755 	       tmp522 = (K555570233 * tmp513) + (K831469612 * tmp514);
756 	       tmp335 = tmp327 + tmp334;
757 	       tmp340 = tmp336 - tmp339;
758 	       tmp341 = (K980785280 * tmp335) - (K195090322 * tmp340);
759 	       tmp354 = (K195090322 * tmp335) + (K980785280 * tmp340);
760 	  }
761      }
762      {
763 	  fftw_real tmp49;
764 	  fftw_real tmp149;
765 	  fftw_real tmp52;
766 	  fftw_real tmp155;
767 	  fftw_real tmp56;
768 	  fftw_real tmp154;
769 	  fftw_real tmp152;
770 	  fftw_real tmp59;
771 	  ASSERT_ALIGNED_DOUBLE;
772 	  {
773 	       fftw_real tmp47;
774 	       fftw_real tmp48;
775 	       fftw_real tmp50;
776 	       fftw_real tmp51;
777 	       ASSERT_ALIGNED_DOUBLE;
778 	       tmp47 = input[124 * istride];
779 	       tmp48 = input[60 * istride];
780 	       tmp49 = tmp47 + tmp48;
781 	       tmp149 = tmp47 - tmp48;
782 	       tmp50 = input[28 * istride];
783 	       tmp51 = input[92 * istride];
784 	       tmp52 = tmp50 + tmp51;
785 	       tmp155 = tmp50 - tmp51;
786 	       {
787 		    fftw_real tmp54;
788 		    fftw_real tmp55;
789 		    fftw_real tmp150;
790 		    fftw_real tmp57;
791 		    fftw_real tmp58;
792 		    fftw_real tmp151;
793 		    ASSERT_ALIGNED_DOUBLE;
794 		    tmp54 = input[12 * istride];
795 		    tmp55 = input[76 * istride];
796 		    tmp150 = tmp54 - tmp55;
797 		    tmp57 = input[108 * istride];
798 		    tmp58 = input[44 * istride];
799 		    tmp151 = tmp57 - tmp58;
800 		    tmp56 = tmp54 + tmp55;
801 		    tmp154 = K707106781 * (tmp151 - tmp150);
802 		    tmp152 = K707106781 * (tmp150 + tmp151);
803 		    tmp59 = tmp57 + tmp58;
804 	       }
805 	  }
806 	  {
807 	       fftw_real tmp53;
808 	       fftw_real tmp60;
809 	       fftw_real tmp791;
810 	       fftw_real tmp792;
811 	       ASSERT_ALIGNED_DOUBLE;
812 	       tmp53 = tmp49 + tmp52;
813 	       tmp60 = tmp56 + tmp59;
814 	       tmp61 = tmp53 + tmp60;
815 	       tmp627 = tmp53 - tmp60;
816 	       tmp791 = tmp49 - tmp52;
817 	       tmp792 = tmp59 - tmp56;
818 	       tmp793 = (K923879532 * tmp791) - (K382683432 * tmp792);
819 	       tmp866 = (K382683432 * tmp791) + (K923879532 * tmp792);
820 	  }
821 	  {
822 	       fftw_real tmp153;
823 	       fftw_real tmp156;
824 	       fftw_real tmp467;
825 	       fftw_real tmp468;
826 	       ASSERT_ALIGNED_DOUBLE;
827 	       tmp153 = tmp149 + tmp152;
828 	       tmp156 = tmp154 - tmp155;
829 	       tmp157 = (K980785280 * tmp153) - (K195090322 * tmp156);
830 	       tmp370 = (K195090322 * tmp153) + (K980785280 * tmp156);
831 	       tmp467 = tmp149 - tmp152;
832 	       tmp468 = tmp155 + tmp154;
833 	       tmp469 = (K831469612 * tmp467) - (K555570233 * tmp468);
834 	       tmp534 = (K555570233 * tmp467) + (K831469612 * tmp468);
835 	  }
836      }
837      {
838 	  fftw_real tmp97;
839 	  fftw_real tmp181;
840 	  fftw_real tmp119;
841 	  fftw_real tmp122;
842 	  fftw_real tmp191;
843 	  fftw_real tmp197;
844 	  fftw_real tmp807;
845 	  fftw_real tmp100;
846 	  fftw_real tmp195;
847 	  fftw_real tmp104;
848 	  fftw_real tmp194;
849 	  fftw_real tmp184;
850 	  fftw_real tmp107;
851 	  fftw_real tmp112;
852 	  fftw_real tmp115;
853 	  fftw_real tmp188;
854 	  fftw_real tmp198;
855 	  fftw_real tmp806;
856 	  ASSERT_ALIGNED_DOUBLE;
857 	  {
858 	       fftw_real tmp95;
859 	       fftw_real tmp96;
860 	       fftw_real tmp189;
861 	       fftw_real tmp190;
862 	       ASSERT_ALIGNED_DOUBLE;
863 	       tmp95 = input[126 * istride];
864 	       tmp96 = input[62 * istride];
865 	       tmp97 = tmp95 + tmp96;
866 	       tmp181 = tmp95 - tmp96;
867 	       {
868 		    fftw_real tmp117;
869 		    fftw_real tmp118;
870 		    fftw_real tmp120;
871 		    fftw_real tmp121;
872 		    ASSERT_ALIGNED_DOUBLE;
873 		    tmp117 = input[118 * istride];
874 		    tmp118 = input[54 * istride];
875 		    tmp119 = tmp117 + tmp118;
876 		    tmp189 = tmp117 - tmp118;
877 		    tmp120 = input[22 * istride];
878 		    tmp121 = input[86 * istride];
879 		    tmp122 = tmp120 + tmp121;
880 		    tmp190 = tmp120 - tmp121;
881 	       }
882 	       tmp191 = (K923879532 * tmp189) + (K382683432 * tmp190);
883 	       tmp197 = (K382683432 * tmp189) - (K923879532 * tmp190);
884 	       tmp807 = tmp119 - tmp122;
885 	  }
886 	  {
887 	       fftw_real tmp98;
888 	       fftw_real tmp99;
889 	       fftw_real tmp186;
890 	       fftw_real tmp187;
891 	       ASSERT_ALIGNED_DOUBLE;
892 	       tmp98 = input[30 * istride];
893 	       tmp99 = input[94 * istride];
894 	       tmp100 = tmp98 + tmp99;
895 	       tmp195 = tmp98 - tmp99;
896 	       {
897 		    fftw_real tmp102;
898 		    fftw_real tmp103;
899 		    fftw_real tmp182;
900 		    fftw_real tmp105;
901 		    fftw_real tmp106;
902 		    fftw_real tmp183;
903 		    ASSERT_ALIGNED_DOUBLE;
904 		    tmp102 = input[14 * istride];
905 		    tmp103 = input[78 * istride];
906 		    tmp182 = tmp102 - tmp103;
907 		    tmp105 = input[110 * istride];
908 		    tmp106 = input[46 * istride];
909 		    tmp183 = tmp105 - tmp106;
910 		    tmp104 = tmp102 + tmp103;
911 		    tmp194 = K707106781 * (tmp183 - tmp182);
912 		    tmp184 = K707106781 * (tmp182 + tmp183);
913 		    tmp107 = tmp105 + tmp106;
914 	       }
915 	       {
916 		    fftw_real tmp110;
917 		    fftw_real tmp111;
918 		    fftw_real tmp113;
919 		    fftw_real tmp114;
920 		    ASSERT_ALIGNED_DOUBLE;
921 		    tmp110 = input[6 * istride];
922 		    tmp111 = input[70 * istride];
923 		    tmp112 = tmp110 + tmp111;
924 		    tmp186 = tmp110 - tmp111;
925 		    tmp113 = input[38 * istride];
926 		    tmp114 = input[102 * istride];
927 		    tmp115 = tmp113 + tmp114;
928 		    tmp187 = tmp113 - tmp114;
929 	       }
930 	       tmp188 = (K923879532 * tmp186) - (K382683432 * tmp187);
931 	       tmp198 = (K382683432 * tmp186) + (K923879532 * tmp187);
932 	       tmp806 = tmp112 - tmp115;
933 	  }
934 	  {
935 	       fftw_real tmp101;
936 	       fftw_real tmp108;
937 	       fftw_real tmp805;
938 	       fftw_real tmp808;
939 	       ASSERT_ALIGNED_DOUBLE;
940 	       tmp101 = tmp97 + tmp100;
941 	       tmp108 = tmp104 + tmp107;
942 	       tmp109 = tmp101 + tmp108;
943 	       tmp633 = tmp101 - tmp108;
944 	       tmp805 = tmp97 - tmp100;
945 	       tmp808 = K707106781 * (tmp806 + tmp807);
946 	       tmp809 = tmp805 + tmp808;
947 	       tmp900 = tmp805 - tmp808;
948 	  }
949 	  {
950 	       fftw_real tmp810;
951 	       fftw_real tmp811;
952 	       fftw_real tmp482;
953 	       fftw_real tmp483;
954 	       ASSERT_ALIGNED_DOUBLE;
955 	       tmp810 = tmp107 - tmp104;
956 	       tmp811 = K707106781 * (tmp807 - tmp806);
957 	       tmp812 = tmp810 + tmp811;
958 	       tmp901 = tmp811 - tmp810;
959 	       tmp482 = tmp195 + tmp194;
960 	       tmp483 = tmp191 - tmp188;
961 	       tmp484 = tmp482 + tmp483;
962 	       tmp569 = tmp483 - tmp482;
963 	  }
964 	  {
965 	       fftw_real tmp185;
966 	       fftw_real tmp192;
967 	       fftw_real tmp479;
968 	       fftw_real tmp480;
969 	       ASSERT_ALIGNED_DOUBLE;
970 	       tmp185 = tmp181 + tmp184;
971 	       tmp192 = tmp188 + tmp191;
972 	       tmp193 = tmp185 + tmp192;
973 	       tmp405 = tmp185 - tmp192;
974 	       tmp479 = tmp181 - tmp184;
975 	       tmp480 = tmp198 + tmp197;
976 	       tmp481 = tmp479 + tmp480;
977 	       tmp568 = tmp479 - tmp480;
978 	  }
979 	  {
980 	       fftw_real tmp196;
981 	       fftw_real tmp199;
982 	       fftw_real tmp116;
983 	       fftw_real tmp123;
984 	       ASSERT_ALIGNED_DOUBLE;
985 	       tmp196 = tmp194 - tmp195;
986 	       tmp199 = tmp197 - tmp198;
987 	       tmp200 = tmp196 + tmp199;
988 	       tmp404 = tmp199 - tmp196;
989 	       tmp116 = tmp112 + tmp115;
990 	       tmp123 = tmp119 + tmp122;
991 	       tmp124 = tmp116 + tmp123;
992 	       tmp634 = tmp123 - tmp116;
993 	  }
994      }
995      {
996 	  fftw_real tmp66;
997 	  fftw_real tmp173;
998 	  fftw_real tmp88;
999 	  fftw_real tmp91;
1000 	  fftw_real tmp167;
1001 	  fftw_real tmp177;
1002 	  fftw_real tmp798;
1003 	  fftw_real tmp69;
1004 	  fftw_real tmp163;
1005 	  fftw_real tmp73;
1006 	  fftw_real tmp174;
1007 	  fftw_real tmp162;
1008 	  fftw_real tmp76;
1009 	  fftw_real tmp81;
1010 	  fftw_real tmp84;
1011 	  fftw_real tmp170;
1012 	  fftw_real tmp176;
1013 	  fftw_real tmp797;
1014 	  ASSERT_ALIGNED_DOUBLE;
1015 	  {
1016 	       fftw_real tmp64;
1017 	       fftw_real tmp65;
1018 	       fftw_real tmp165;
1019 	       fftw_real tmp166;
1020 	       ASSERT_ALIGNED_DOUBLE;
1021 	       tmp64 = input[2 * istride];
1022 	       tmp65 = input[66 * istride];
1023 	       tmp66 = tmp64 + tmp65;
1024 	       tmp173 = tmp64 - tmp65;
1025 	       {
1026 		    fftw_real tmp86;
1027 		    fftw_real tmp87;
1028 		    fftw_real tmp89;
1029 		    fftw_real tmp90;
1030 		    ASSERT_ALIGNED_DOUBLE;
1031 		    tmp86 = input[122 * istride];
1032 		    tmp87 = input[58 * istride];
1033 		    tmp88 = tmp86 + tmp87;
1034 		    tmp165 = tmp86 - tmp87;
1035 		    tmp89 = input[26 * istride];
1036 		    tmp90 = input[90 * istride];
1037 		    tmp91 = tmp89 + tmp90;
1038 		    tmp166 = tmp89 - tmp90;
1039 	       }
1040 	       tmp167 = (K382683432 * tmp165) - (K923879532 * tmp166);
1041 	       tmp177 = (K923879532 * tmp165) + (K382683432 * tmp166);
1042 	       tmp798 = tmp88 - tmp91;
1043 	  }
1044 	  {
1045 	       fftw_real tmp67;
1046 	       fftw_real tmp68;
1047 	       fftw_real tmp168;
1048 	       fftw_real tmp169;
1049 	       ASSERT_ALIGNED_DOUBLE;
1050 	       tmp67 = input[34 * istride];
1051 	       tmp68 = input[98 * istride];
1052 	       tmp69 = tmp67 + tmp68;
1053 	       tmp163 = tmp67 - tmp68;
1054 	       {
1055 		    fftw_real tmp71;
1056 		    fftw_real tmp72;
1057 		    fftw_real tmp161;
1058 		    fftw_real tmp74;
1059 		    fftw_real tmp75;
1060 		    fftw_real tmp160;
1061 		    ASSERT_ALIGNED_DOUBLE;
1062 		    tmp71 = input[18 * istride];
1063 		    tmp72 = input[82 * istride];
1064 		    tmp161 = tmp71 - tmp72;
1065 		    tmp74 = input[114 * istride];
1066 		    tmp75 = input[50 * istride];
1067 		    tmp160 = tmp74 - tmp75;
1068 		    tmp73 = tmp71 + tmp72;
1069 		    tmp174 = K707106781 * (tmp161 + tmp160);
1070 		    tmp162 = K707106781 * (tmp160 - tmp161);
1071 		    tmp76 = tmp74 + tmp75;
1072 	       }
1073 	       {
1074 		    fftw_real tmp79;
1075 		    fftw_real tmp80;
1076 		    fftw_real tmp82;
1077 		    fftw_real tmp83;
1078 		    ASSERT_ALIGNED_DOUBLE;
1079 		    tmp79 = input[10 * istride];
1080 		    tmp80 = input[74 * istride];
1081 		    tmp81 = tmp79 + tmp80;
1082 		    tmp168 = tmp79 - tmp80;
1083 		    tmp82 = input[42 * istride];
1084 		    tmp83 = input[106 * istride];
1085 		    tmp84 = tmp82 + tmp83;
1086 		    tmp169 = tmp82 - tmp83;
1087 	       }
1088 	       tmp170 = (K382683432 * tmp168) + (K923879532 * tmp169);
1089 	       tmp176 = (K923879532 * tmp168) - (K382683432 * tmp169);
1090 	       tmp797 = tmp81 - tmp84;
1091 	  }
1092 	  {
1093 	       fftw_real tmp70;
1094 	       fftw_real tmp77;
1095 	       fftw_real tmp796;
1096 	       fftw_real tmp799;
1097 	       ASSERT_ALIGNED_DOUBLE;
1098 	       tmp70 = tmp66 + tmp69;
1099 	       tmp77 = tmp73 + tmp76;
1100 	       tmp78 = tmp70 + tmp77;
1101 	       tmp630 = tmp70 - tmp77;
1102 	       tmp796 = tmp66 - tmp69;
1103 	       tmp799 = K707106781 * (tmp797 + tmp798);
1104 	       tmp800 = tmp796 + tmp799;
1105 	       tmp904 = tmp796 - tmp799;
1106 	  }
1107 	  {
1108 	       fftw_real tmp801;
1109 	       fftw_real tmp802;
1110 	       fftw_real tmp475;
1111 	       fftw_real tmp476;
1112 	       ASSERT_ALIGNED_DOUBLE;
1113 	       tmp801 = tmp76 - tmp73;
1114 	       tmp802 = K707106781 * (tmp798 - tmp797);
1115 	       tmp803 = tmp801 + tmp802;
1116 	       tmp903 = tmp802 - tmp801;
1117 	       tmp475 = tmp163 + tmp162;
1118 	       tmp476 = tmp177 - tmp176;
1119 	       tmp477 = tmp475 + tmp476;
1120 	       tmp571 = tmp476 - tmp475;
1121 	  }
1122 	  {
1123 	       fftw_real tmp164;
1124 	       fftw_real tmp171;
1125 	       fftw_real tmp472;
1126 	       fftw_real tmp473;
1127 	       ASSERT_ALIGNED_DOUBLE;
1128 	       tmp164 = tmp162 - tmp163;
1129 	       tmp171 = tmp167 - tmp170;
1130 	       tmp172 = tmp164 + tmp171;
1131 	       tmp407 = tmp171 - tmp164;
1132 	       tmp472 = tmp173 - tmp174;
1133 	       tmp473 = tmp170 + tmp167;
1134 	       tmp474 = tmp472 + tmp473;
1135 	       tmp572 = tmp472 - tmp473;
1136 	  }
1137 	  {
1138 	       fftw_real tmp175;
1139 	       fftw_real tmp178;
1140 	       fftw_real tmp85;
1141 	       fftw_real tmp92;
1142 	       ASSERT_ALIGNED_DOUBLE;
1143 	       tmp175 = tmp173 + tmp174;
1144 	       tmp178 = tmp176 + tmp177;
1145 	       tmp179 = tmp175 + tmp178;
1146 	       tmp408 = tmp175 - tmp178;
1147 	       tmp85 = tmp81 + tmp84;
1148 	       tmp92 = tmp88 + tmp91;
1149 	       tmp93 = tmp85 + tmp92;
1150 	       tmp631 = tmp92 - tmp85;
1151 	  }
1152      }
1153      {
1154 	  fftw_real tmp206;
1155 	  fftw_real tmp638;
1156 	  fftw_real tmp270;
1157 	  fftw_real tmp639;
1158 	  fftw_real tmp213;
1159 	  fftw_real tmp267;
1160 	  fftw_real tmp641;
1161 	  fftw_real tmp642;
1162 	  fftw_real tmp664;
1163 	  fftw_real tmp665;
1164 	  fftw_real tmp221;
1165 	  fftw_real tmp273;
1166 	  fftw_real tmp817;
1167 	  fftw_real tmp661;
1168 	  fftw_real tmp662;
1169 	  fftw_real tmp228;
1170 	  fftw_real tmp272;
1171 	  fftw_real tmp818;
1172 	  ASSERT_ALIGNED_DOUBLE;
1173 	  {
1174 	       fftw_real tmp204;
1175 	       fftw_real tmp205;
1176 	       fftw_real tmp268;
1177 	       fftw_real tmp269;
1178 	       ASSERT_ALIGNED_DOUBLE;
1179 	       tmp204 = input[istride];
1180 	       tmp205 = input[65 * istride];
1181 	       tmp206 = tmp204 - tmp205;
1182 	       tmp638 = tmp204 + tmp205;
1183 	       tmp268 = input[33 * istride];
1184 	       tmp269 = input[97 * istride];
1185 	       tmp270 = tmp268 - tmp269;
1186 	       tmp639 = tmp268 + tmp269;
1187 	  }
1188 	  {
1189 	       fftw_real tmp207;
1190 	       fftw_real tmp208;
1191 	       fftw_real tmp209;
1192 	       fftw_real tmp210;
1193 	       fftw_real tmp211;
1194 	       fftw_real tmp212;
1195 	       ASSERT_ALIGNED_DOUBLE;
1196 	       tmp207 = input[17 * istride];
1197 	       tmp208 = input[81 * istride];
1198 	       tmp209 = tmp207 - tmp208;
1199 	       tmp210 = input[113 * istride];
1200 	       tmp211 = input[49 * istride];
1201 	       tmp212 = tmp210 - tmp211;
1202 	       tmp213 = K707106781 * (tmp209 + tmp212);
1203 	       tmp267 = K707106781 * (tmp212 - tmp209);
1204 	       tmp641 = tmp207 + tmp208;
1205 	       tmp642 = tmp210 + tmp211;
1206 	  }
1207 	  {
1208 	       fftw_real tmp217;
1209 	       fftw_real tmp220;
1210 	       fftw_real tmp224;
1211 	       fftw_real tmp227;
1212 	       ASSERT_ALIGNED_DOUBLE;
1213 	       {
1214 		    fftw_real tmp215;
1215 		    fftw_real tmp216;
1216 		    fftw_real tmp218;
1217 		    fftw_real tmp219;
1218 		    ASSERT_ALIGNED_DOUBLE;
1219 		    tmp215 = input[9 * istride];
1220 		    tmp216 = input[73 * istride];
1221 		    tmp217 = tmp215 - tmp216;
1222 		    tmp664 = tmp215 + tmp216;
1223 		    tmp218 = input[41 * istride];
1224 		    tmp219 = input[105 * istride];
1225 		    tmp220 = tmp218 - tmp219;
1226 		    tmp665 = tmp218 + tmp219;
1227 	       }
1228 	       tmp221 = (K923879532 * tmp217) - (K382683432 * tmp220);
1229 	       tmp273 = (K382683432 * tmp217) + (K923879532 * tmp220);
1230 	       tmp817 = tmp664 - tmp665;
1231 	       {
1232 		    fftw_real tmp222;
1233 		    fftw_real tmp223;
1234 		    fftw_real tmp225;
1235 		    fftw_real tmp226;
1236 		    ASSERT_ALIGNED_DOUBLE;
1237 		    tmp222 = input[121 * istride];
1238 		    tmp223 = input[57 * istride];
1239 		    tmp224 = tmp222 - tmp223;
1240 		    tmp661 = tmp222 + tmp223;
1241 		    tmp225 = input[25 * istride];
1242 		    tmp226 = input[89 * istride];
1243 		    tmp227 = tmp225 - tmp226;
1244 		    tmp662 = tmp225 + tmp226;
1245 	       }
1246 	       tmp228 = (K923879532 * tmp224) + (K382683432 * tmp227);
1247 	       tmp272 = (K382683432 * tmp224) - (K923879532 * tmp227);
1248 	       tmp818 = tmp661 - tmp662;
1249 	  }
1250 	  {
1251 	       fftw_real tmp214;
1252 	       fftw_real tmp229;
1253 	       fftw_real tmp488;
1254 	       fftw_real tmp489;
1255 	       ASSERT_ALIGNED_DOUBLE;
1256 	       tmp214 = tmp206 + tmp213;
1257 	       tmp229 = tmp221 + tmp228;
1258 	       tmp230 = tmp214 + tmp229;
1259 	       tmp415 = tmp214 - tmp229;
1260 	       tmp488 = tmp206 - tmp213;
1261 	       tmp489 = tmp273 + tmp272;
1262 	       tmp490 = tmp488 + tmp489;
1263 	       tmp579 = tmp488 - tmp489;
1264 	  }
1265 	  {
1266 	       fftw_real tmp271;
1267 	       fftw_real tmp274;
1268 	       fftw_real tmp499;
1269 	       fftw_real tmp500;
1270 	       ASSERT_ALIGNED_DOUBLE;
1271 	       tmp271 = tmp267 - tmp270;
1272 	       tmp274 = tmp272 - tmp273;
1273 	       tmp275 = tmp271 + tmp274;
1274 	       tmp413 = tmp274 - tmp271;
1275 	       tmp499 = tmp270 + tmp267;
1276 	       tmp500 = tmp228 - tmp221;
1277 	       tmp501 = tmp499 + tmp500;
1278 	       tmp577 = tmp500 - tmp499;
1279 	  }
1280 	  {
1281 	       fftw_real tmp640;
1282 	       fftw_real tmp643;
1283 	       fftw_real tmp816;
1284 	       fftw_real tmp819;
1285 	       ASSERT_ALIGNED_DOUBLE;
1286 	       tmp640 = tmp638 + tmp639;
1287 	       tmp643 = tmp641 + tmp642;
1288 	       tmp644 = tmp640 - tmp643;
1289 	       tmp740 = tmp640 + tmp643;
1290 	       tmp816 = tmp638 - tmp639;
1291 	       tmp819 = K707106781 * (tmp817 + tmp818);
1292 	       tmp820 = tmp816 + tmp819;
1293 	       tmp911 = tmp816 - tmp819;
1294 	  }
1295 	  {
1296 	       fftw_real tmp829;
1297 	       fftw_real tmp830;
1298 	       fftw_real tmp663;
1299 	       fftw_real tmp666;
1300 	       ASSERT_ALIGNED_DOUBLE;
1301 	       tmp829 = tmp642 - tmp641;
1302 	       tmp830 = K707106781 * (tmp818 - tmp817);
1303 	       tmp831 = tmp829 + tmp830;
1304 	       tmp909 = tmp830 - tmp829;
1305 	       tmp663 = tmp661 + tmp662;
1306 	       tmp666 = tmp664 + tmp665;
1307 	       tmp667 = tmp663 - tmp666;
1308 	       tmp741 = tmp666 + tmp663;
1309 	  }
1310      }
1311      {
1312 	  fftw_real tmp233;
1313 	  fftw_real tmp821;
1314 	  fftw_real tmp647;
1315 	  fftw_real tmp245;
1316 	  fftw_real tmp257;
1317 	  fftw_real tmp259;
1318 	  fftw_real tmp657;
1319 	  fftw_real tmp825;
1320 	  fftw_real tmp250;
1321 	  fftw_real tmp824;
1322 	  fftw_real tmp654;
1323 	  fftw_real tmp262;
1324 	  fftw_real tmp240;
1325 	  fftw_real tmp242;
1326 	  fftw_real tmp650;
1327 	  fftw_real tmp822;
1328 	  fftw_real tmp491;
1329 	  fftw_real tmp492;
1330 	  ASSERT_ALIGNED_DOUBLE;
1331 	  {
1332 	       fftw_real tmp231;
1333 	       fftw_real tmp232;
1334 	       fftw_real tmp645;
1335 	       fftw_real tmp243;
1336 	       fftw_real tmp244;
1337 	       fftw_real tmp646;
1338 	       ASSERT_ALIGNED_DOUBLE;
1339 	       tmp231 = input[5 * istride];
1340 	       tmp232 = input[69 * istride];
1341 	       tmp645 = tmp231 + tmp232;
1342 	       tmp243 = input[37 * istride];
1343 	       tmp244 = input[101 * istride];
1344 	       tmp646 = tmp243 + tmp244;
1345 	       tmp233 = tmp231 - tmp232;
1346 	       tmp821 = tmp645 - tmp646;
1347 	       tmp647 = tmp645 + tmp646;
1348 	       tmp245 = tmp243 - tmp244;
1349 	  }
1350 	  {
1351 	       fftw_real tmp253;
1352 	       fftw_real tmp655;
1353 	       fftw_real tmp256;
1354 	       fftw_real tmp656;
1355 	       ASSERT_ALIGNED_DOUBLE;
1356 	       {
1357 		    fftw_real tmp251;
1358 		    fftw_real tmp252;
1359 		    fftw_real tmp254;
1360 		    fftw_real tmp255;
1361 		    ASSERT_ALIGNED_DOUBLE;
1362 		    tmp251 = input[13 * istride];
1363 		    tmp252 = input[77 * istride];
1364 		    tmp253 = tmp251 - tmp252;
1365 		    tmp655 = tmp251 + tmp252;
1366 		    tmp254 = input[109 * istride];
1367 		    tmp255 = input[45 * istride];
1368 		    tmp256 = tmp254 - tmp255;
1369 		    tmp656 = tmp254 + tmp255;
1370 	       }
1371 	       tmp257 = K707106781 * (tmp253 + tmp256);
1372 	       tmp259 = K707106781 * (tmp256 - tmp253);
1373 	       tmp657 = tmp655 + tmp656;
1374 	       tmp825 = tmp656 - tmp655;
1375 	  }
1376 	  {
1377 	       fftw_real tmp248;
1378 	       fftw_real tmp249;
1379 	       fftw_real tmp652;
1380 	       fftw_real tmp260;
1381 	       fftw_real tmp261;
1382 	       fftw_real tmp653;
1383 	       ASSERT_ALIGNED_DOUBLE;
1384 	       tmp248 = input[125 * istride];
1385 	       tmp249 = input[61 * istride];
1386 	       tmp652 = tmp248 + tmp249;
1387 	       tmp260 = input[29 * istride];
1388 	       tmp261 = input[93 * istride];
1389 	       tmp653 = tmp260 + tmp261;
1390 	       tmp250 = tmp248 - tmp249;
1391 	       tmp824 = tmp652 - tmp653;
1392 	       tmp654 = tmp652 + tmp653;
1393 	       tmp262 = tmp260 - tmp261;
1394 	  }
1395 	  {
1396 	       fftw_real tmp236;
1397 	       fftw_real tmp648;
1398 	       fftw_real tmp239;
1399 	       fftw_real tmp649;
1400 	       ASSERT_ALIGNED_DOUBLE;
1401 	       {
1402 		    fftw_real tmp234;
1403 		    fftw_real tmp235;
1404 		    fftw_real tmp237;
1405 		    fftw_real tmp238;
1406 		    ASSERT_ALIGNED_DOUBLE;
1407 		    tmp234 = input[21 * istride];
1408 		    tmp235 = input[85 * istride];
1409 		    tmp236 = tmp234 - tmp235;
1410 		    tmp648 = tmp234 + tmp235;
1411 		    tmp237 = input[117 * istride];
1412 		    tmp238 = input[53 * istride];
1413 		    tmp239 = tmp237 - tmp238;
1414 		    tmp649 = tmp237 + tmp238;
1415 	       }
1416 	       tmp240 = K707106781 * (tmp236 + tmp239);
1417 	       tmp242 = K707106781 * (tmp239 - tmp236);
1418 	       tmp650 = tmp648 + tmp649;
1419 	       tmp822 = tmp649 - tmp648;
1420 	  }
1421 	  {
1422 	       fftw_real tmp651;
1423 	       fftw_real tmp658;
1424 	       fftw_real tmp832;
1425 	       fftw_real tmp833;
1426 	       ASSERT_ALIGNED_DOUBLE;
1427 	       tmp743 = tmp647 + tmp650;
1428 	       tmp651 = tmp647 - tmp650;
1429 	       tmp658 = tmp654 - tmp657;
1430 	       tmp659 = K707106781 * (tmp651 + tmp658);
1431 	       tmp668 = K707106781 * (tmp658 - tmp651);
1432 	       tmp744 = tmp654 + tmp657;
1433 	       tmp832 = (K923879532 * tmp822) - (K382683432 * tmp821);
1434 	       tmp833 = (K382683432 * tmp824) + (K923879532 * tmp825);
1435 	       tmp834 = tmp832 + tmp833;
1436 	       tmp912 = tmp833 - tmp832;
1437 	  }
1438 	  {
1439 	       fftw_real tmp823;
1440 	       fftw_real tmp826;
1441 	       fftw_real tmp241;
1442 	       fftw_real tmp246;
1443 	       ASSERT_ALIGNED_DOUBLE;
1444 	       tmp823 = (K923879532 * tmp821) + (K382683432 * tmp822);
1445 	       tmp826 = (K923879532 * tmp824) - (K382683432 * tmp825);
1446 	       tmp827 = tmp823 + tmp826;
1447 	       tmp908 = tmp826 - tmp823;
1448 	       tmp241 = tmp233 + tmp240;
1449 	       tmp246 = tmp242 - tmp245;
1450 	       tmp247 = (K980785280 * tmp241) + (K195090322 * tmp246);
1451 	       tmp276 = (K980785280 * tmp246) - (K195090322 * tmp241);
1452 	  }
1453 	  tmp491 = tmp233 - tmp240;
1454 	  tmp492 = tmp245 + tmp242;
1455 	  tmp493 = (K831469612 * tmp491) + (K555570233 * tmp492);
1456 	  tmp502 = (K831469612 * tmp492) - (K555570233 * tmp491);
1457 	  {
1458 	       fftw_real tmp494;
1459 	       fftw_real tmp495;
1460 	       fftw_real tmp258;
1461 	       fftw_real tmp263;
1462 	       ASSERT_ALIGNED_DOUBLE;
1463 	       tmp494 = tmp250 - tmp257;
1464 	       tmp495 = tmp262 + tmp259;
1465 	       tmp496 = (K831469612 * tmp494) - (K555570233 * tmp495);
1466 	       tmp503 = (K555570233 * tmp494) + (K831469612 * tmp495);
1467 	       tmp258 = tmp250 + tmp257;
1468 	       tmp263 = tmp259 - tmp262;
1469 	       tmp264 = (K980785280 * tmp258) - (K195090322 * tmp263);
1470 	       tmp277 = (K195090322 * tmp258) + (K980785280 * tmp263);
1471 	  }
1472      }
1473      {
1474 	  fftw_real tmp63;
1475 	  fftw_real tmp739;
1476 	  fftw_real tmp753;
1477 	  fftw_real tmp759;
1478 	  fftw_real tmp126;
1479 	  fftw_real tmp755;
1480 	  fftw_real tmp746;
1481 	  fftw_real tmp758;
1482 	  ASSERT_ALIGNED_DOUBLE;
1483 	  {
1484 	       fftw_real tmp31;
1485 	       fftw_real tmp62;
1486 	       fftw_real tmp749;
1487 	       fftw_real tmp752;
1488 	       ASSERT_ALIGNED_DOUBLE;
1489 	       tmp31 = tmp15 + tmp30;
1490 	       tmp62 = tmp46 + tmp61;
1491 	       tmp63 = tmp31 + tmp62;
1492 	       tmp739 = tmp31 - tmp62;
1493 	       tmp749 = tmp747 + tmp748;
1494 	       tmp752 = tmp750 + tmp751;
1495 	       tmp753 = tmp749 - tmp752;
1496 	       tmp759 = tmp749 + tmp752;
1497 	  }
1498 	  {
1499 	       fftw_real tmp94;
1500 	       fftw_real tmp125;
1501 	       fftw_real tmp742;
1502 	       fftw_real tmp745;
1503 	       ASSERT_ALIGNED_DOUBLE;
1504 	       tmp94 = tmp78 + tmp93;
1505 	       tmp125 = tmp109 + tmp124;
1506 	       tmp126 = tmp94 + tmp125;
1507 	       tmp755 = tmp125 - tmp94;
1508 	       tmp742 = tmp740 + tmp741;
1509 	       tmp745 = tmp743 + tmp744;
1510 	       tmp746 = tmp742 - tmp745;
1511 	       tmp758 = tmp742 + tmp745;
1512 	  }
1513 	  {
1514 	       fftw_real tmp757;
1515 	       fftw_real tmp760;
1516 	       fftw_real tmp754;
1517 	       fftw_real tmp756;
1518 	       ASSERT_ALIGNED_DOUBLE;
1519 	       real_output[32 * real_ostride] = tmp63 - tmp126;
1520 	       tmp757 = tmp63 + tmp126;
1521 	       tmp760 = tmp758 + tmp759;
1522 	       real_output[64 * real_ostride] = tmp757 - tmp760;
1523 	       real_output[0] = tmp757 + tmp760;
1524 	       imag_output[32 * imag_ostride] = tmp759 - tmp758;
1525 	       tmp754 = K707106781 * (tmp746 + tmp753);
1526 	       real_output[48 * real_ostride] = tmp739 - tmp754;
1527 	       real_output[16 * real_ostride] = tmp739 + tmp754;
1528 	       tmp756 = K707106781 * (tmp753 - tmp746);
1529 	       imag_output[16 * imag_ostride] = tmp755 + tmp756;
1530 	       imag_output[48 * imag_ostride] = tmp756 - tmp755;
1531 	  }
1532      }
1533      {
1534 	  fftw_real tmp761;
1535 	  fftw_real tmp774;
1536 	  fftw_real tmp764;
1537 	  fftw_real tmp773;
1538 	  fftw_real tmp768;
1539 	  fftw_real tmp778;
1540 	  fftw_real tmp771;
1541 	  fftw_real tmp779;
1542 	  fftw_real tmp762;
1543 	  fftw_real tmp763;
1544 	  ASSERT_ALIGNED_DOUBLE;
1545 	  tmp761 = tmp15 - tmp30;
1546 	  tmp774 = tmp61 - tmp46;
1547 	  tmp762 = tmp78 - tmp93;
1548 	  tmp763 = tmp109 - tmp124;
1549 	  tmp764 = K707106781 * (tmp762 + tmp763);
1550 	  tmp773 = K707106781 * (tmp763 - tmp762);
1551 	  {
1552 	       fftw_real tmp766;
1553 	       fftw_real tmp767;
1554 	       fftw_real tmp769;
1555 	       fftw_real tmp770;
1556 	       ASSERT_ALIGNED_DOUBLE;
1557 	       tmp766 = tmp740 - tmp741;
1558 	       tmp767 = tmp744 - tmp743;
1559 	       tmp768 = (K923879532 * tmp766) + (K382683432 * tmp767);
1560 	       tmp778 = (K923879532 * tmp767) - (K382683432 * tmp766);
1561 	       tmp769 = tmp747 - tmp748;
1562 	       tmp770 = tmp751 - tmp750;
1563 	       tmp771 = (K923879532 * tmp769) - (K382683432 * tmp770);
1564 	       tmp779 = (K382683432 * tmp769) + (K923879532 * tmp770);
1565 	  }
1566 	  {
1567 	       fftw_real tmp765;
1568 	       fftw_real tmp772;
1569 	       fftw_real tmp781;
1570 	       fftw_real tmp782;
1571 	       ASSERT_ALIGNED_DOUBLE;
1572 	       tmp765 = tmp761 + tmp764;
1573 	       tmp772 = tmp768 + tmp771;
1574 	       real_output[56 * real_ostride] = tmp765 - tmp772;
1575 	       real_output[8 * real_ostride] = tmp765 + tmp772;
1576 	       tmp781 = tmp761 - tmp764;
1577 	       tmp782 = tmp779 - tmp778;
1578 	       real_output[40 * real_ostride] = tmp781 - tmp782;
1579 	       real_output[24 * real_ostride] = tmp781 + tmp782;
1580 	  }
1581 	  {
1582 	       fftw_real tmp777;
1583 	       fftw_real tmp780;
1584 	       fftw_real tmp775;
1585 	       fftw_real tmp776;
1586 	       ASSERT_ALIGNED_DOUBLE;
1587 	       tmp777 = tmp774 + tmp773;
1588 	       tmp780 = tmp778 + tmp779;
1589 	       imag_output[8 * imag_ostride] = tmp777 + tmp780;
1590 	       imag_output[56 * imag_ostride] = tmp780 - tmp777;
1591 	       tmp775 = tmp773 - tmp774;
1592 	       tmp776 = tmp771 - tmp768;
1593 	       imag_output[24 * imag_ostride] = tmp775 + tmp776;
1594 	       imag_output[40 * imag_ostride] = tmp776 - tmp775;
1595 	  }
1596      }
1597      {
1598 	  fftw_real tmp159;
1599 	  fftw_real tmp381;
1600 	  fftw_real tmp202;
1601 	  fftw_real tmp391;
1602 	  fftw_real tmp372;
1603 	  fftw_real tmp392;
1604 	  fftw_real tmp361;
1605 	  fftw_real tmp382;
1606 	  fftw_real tmp357;
1607 	  fftw_real tmp377;
1608 	  fftw_real tmp389;
1609 	  fftw_real tmp397;
1610 	  fftw_real tmp280;
1611 	  fftw_real tmp376;
1612 	  fftw_real tmp386;
1613 	  fftw_real tmp396;
1614 	  ASSERT_ALIGNED_DOUBLE;
1615 	  {
1616 	       fftw_real tmp139;
1617 	       fftw_real tmp158;
1618 	       fftw_real tmp359;
1619 	       fftw_real tmp360;
1620 	       ASSERT_ALIGNED_DOUBLE;
1621 	       tmp139 = tmp131 + tmp138;
1622 	       tmp158 = tmp148 + tmp157;
1623 	       tmp159 = tmp139 + tmp158;
1624 	       tmp381 = tmp139 - tmp158;
1625 	       {
1626 		    fftw_real tmp180;
1627 		    fftw_real tmp201;
1628 		    fftw_real tmp368;
1629 		    fftw_real tmp371;
1630 		    ASSERT_ALIGNED_DOUBLE;
1631 		    tmp180 = (K098017140 * tmp172) + (K995184726 * tmp179);
1632 		    tmp201 = (K995184726 * tmp193) - (K098017140 * tmp200);
1633 		    tmp202 = tmp180 + tmp201;
1634 		    tmp391 = tmp201 - tmp180;
1635 		    tmp368 = tmp364 + tmp367;
1636 		    tmp371 = tmp369 + tmp370;
1637 		    tmp372 = tmp368 + tmp371;
1638 		    tmp392 = tmp371 - tmp368;
1639 	       }
1640 	       tmp359 = (K995184726 * tmp172) - (K098017140 * tmp179);
1641 	       tmp360 = (K995184726 * tmp200) + (K098017140 * tmp193);
1642 	       tmp361 = tmp359 + tmp360;
1643 	       tmp382 = tmp360 - tmp359;
1644 	       {
1645 		    fftw_real tmp343;
1646 		    fftw_real tmp387;
1647 		    fftw_real tmp356;
1648 		    fftw_real tmp388;
1649 		    fftw_real tmp342;
1650 		    fftw_real tmp355;
1651 		    ASSERT_ALIGNED_DOUBLE;
1652 		    tmp342 = tmp324 + tmp341;
1653 		    tmp343 = tmp307 + tmp342;
1654 		    tmp387 = tmp307 - tmp342;
1655 		    tmp355 = tmp353 + tmp354;
1656 		    tmp356 = tmp352 + tmp355;
1657 		    tmp388 = tmp355 - tmp352;
1658 		    tmp357 = (K998795456 * tmp343) - (K049067674 * tmp356);
1659 		    tmp377 = (K049067674 * tmp343) + (K998795456 * tmp356);
1660 		    tmp389 = (K740951125 * tmp387) - (K671558954 * tmp388);
1661 		    tmp397 = (K671558954 * tmp387) + (K740951125 * tmp388);
1662 	       }
1663 	       {
1664 		    fftw_real tmp266;
1665 		    fftw_real tmp384;
1666 		    fftw_real tmp279;
1667 		    fftw_real tmp385;
1668 		    fftw_real tmp265;
1669 		    fftw_real tmp278;
1670 		    ASSERT_ALIGNED_DOUBLE;
1671 		    tmp265 = tmp247 + tmp264;
1672 		    tmp266 = tmp230 + tmp265;
1673 		    tmp384 = tmp230 - tmp265;
1674 		    tmp278 = tmp276 + tmp277;
1675 		    tmp279 = tmp275 + tmp278;
1676 		    tmp385 = tmp278 - tmp275;
1677 		    tmp280 = (K998795456 * tmp266) + (K049067674 * tmp279);
1678 		    tmp376 = (K998795456 * tmp279) - (K049067674 * tmp266);
1679 		    tmp386 = (K740951125 * tmp384) + (K671558954 * tmp385);
1680 		    tmp396 = (K740951125 * tmp385) - (K671558954 * tmp384);
1681 	       }
1682 	  }
1683 	  {
1684 	       fftw_real tmp203;
1685 	       fftw_real tmp358;
1686 	       fftw_real tmp373;
1687 	       fftw_real tmp374;
1688 	       ASSERT_ALIGNED_DOUBLE;
1689 	       tmp203 = tmp159 + tmp202;
1690 	       tmp358 = tmp280 + tmp357;
1691 	       real_output[63 * real_ostride] = tmp203 - tmp358;
1692 	       real_output[real_ostride] = tmp203 + tmp358;
1693 	       tmp373 = tmp361 - tmp372;
1694 	       tmp374 = tmp357 - tmp280;
1695 	       imag_output[31 * imag_ostride] = tmp373 + tmp374;
1696 	       imag_output[33 * imag_ostride] = tmp374 - tmp373;
1697 	  }
1698 	  {
1699 	       fftw_real tmp375;
1700 	       fftw_real tmp378;
1701 	       fftw_real tmp379;
1702 	       fftw_real tmp380;
1703 	       ASSERT_ALIGNED_DOUBLE;
1704 	       tmp375 = tmp372 + tmp361;
1705 	       tmp378 = tmp376 + tmp377;
1706 	       imag_output[imag_ostride] = tmp375 + tmp378;
1707 	       imag_output[63 * imag_ostride] = tmp378 - tmp375;
1708 	       tmp379 = tmp159 - tmp202;
1709 	       tmp380 = tmp377 - tmp376;
1710 	       real_output[33 * real_ostride] = tmp379 - tmp380;
1711 	       real_output[31 * real_ostride] = tmp379 + tmp380;
1712 	  }
1713 	  {
1714 	       fftw_real tmp383;
1715 	       fftw_real tmp390;
1716 	       fftw_real tmp393;
1717 	       fftw_real tmp394;
1718 	       ASSERT_ALIGNED_DOUBLE;
1719 	       tmp383 = tmp381 + tmp382;
1720 	       tmp390 = tmp386 + tmp389;
1721 	       real_output[49 * real_ostride] = tmp383 - tmp390;
1722 	       real_output[15 * real_ostride] = tmp383 + tmp390;
1723 	       tmp393 = tmp391 - tmp392;
1724 	       tmp394 = tmp389 - tmp386;
1725 	       imag_output[17 * imag_ostride] = tmp393 + tmp394;
1726 	       imag_output[47 * imag_ostride] = tmp394 - tmp393;
1727 	  }
1728 	  {
1729 	       fftw_real tmp395;
1730 	       fftw_real tmp398;
1731 	       fftw_real tmp399;
1732 	       fftw_real tmp400;
1733 	       ASSERT_ALIGNED_DOUBLE;
1734 	       tmp395 = tmp392 + tmp391;
1735 	       tmp398 = tmp396 + tmp397;
1736 	       imag_output[15 * imag_ostride] = tmp395 + tmp398;
1737 	       imag_output[49 * imag_ostride] = tmp398 - tmp395;
1738 	       tmp399 = tmp381 - tmp382;
1739 	       tmp400 = tmp397 - tmp396;
1740 	       real_output[47 * real_ostride] = tmp399 - tmp400;
1741 	       real_output[17 * real_ostride] = tmp399 + tmp400;
1742 	  }
1743      }
1744      {
1745 	  fftw_real tmp403;
1746 	  fftw_real tmp441;
1747 	  fftw_real tmp410;
1748 	  fftw_real tmp451;
1749 	  fftw_real tmp432;
1750 	  fftw_real tmp452;
1751 	  fftw_real tmp429;
1752 	  fftw_real tmp442;
1753 	  fftw_real tmp425;
1754 	  fftw_real tmp437;
1755 	  fftw_real tmp449;
1756 	  fftw_real tmp457;
1757 	  fftw_real tmp418;
1758 	  fftw_real tmp436;
1759 	  fftw_real tmp446;
1760 	  fftw_real tmp456;
1761 	  ASSERT_ALIGNED_DOUBLE;
1762 	  {
1763 	       fftw_real tmp401;
1764 	       fftw_real tmp402;
1765 	       fftw_real tmp427;
1766 	       fftw_real tmp428;
1767 	       ASSERT_ALIGNED_DOUBLE;
1768 	       tmp401 = tmp131 - tmp138;
1769 	       tmp402 = tmp370 - tmp369;
1770 	       tmp403 = tmp401 - tmp402;
1771 	       tmp441 = tmp401 + tmp402;
1772 	       {
1773 		    fftw_real tmp406;
1774 		    fftw_real tmp409;
1775 		    fftw_real tmp430;
1776 		    fftw_real tmp431;
1777 		    ASSERT_ALIGNED_DOUBLE;
1778 		    tmp406 = (K773010453 * tmp404) + (K634393284 * tmp405);
1779 		    tmp409 = (K773010453 * tmp407) - (K634393284 * tmp408);
1780 		    tmp410 = tmp406 - tmp409;
1781 		    tmp451 = tmp409 + tmp406;
1782 		    tmp430 = tmp157 - tmp148;
1783 		    tmp431 = tmp367 - tmp364;
1784 		    tmp432 = tmp430 - tmp431;
1785 		    tmp452 = tmp431 + tmp430;
1786 	       }
1787 	       tmp427 = (K773010453 * tmp405) - (K634393284 * tmp404);
1788 	       tmp428 = (K634393284 * tmp407) + (K773010453 * tmp408);
1789 	       tmp429 = tmp427 - tmp428;
1790 	       tmp442 = tmp428 + tmp427;
1791 	       {
1792 		    fftw_real tmp421;
1793 		    fftw_real tmp447;
1794 		    fftw_real tmp424;
1795 		    fftw_real tmp448;
1796 		    fftw_real tmp420;
1797 		    fftw_real tmp422;
1798 		    ASSERT_ALIGNED_DOUBLE;
1799 		    tmp420 = tmp354 - tmp353;
1800 		    tmp421 = tmp419 - tmp420;
1801 		    tmp447 = tmp419 + tmp420;
1802 		    tmp422 = tmp341 - tmp324;
1803 		    tmp424 = tmp422 - tmp423;
1804 		    tmp448 = tmp423 + tmp422;
1805 		    tmp425 = (K903989293 * tmp421) - (K427555093 * tmp424);
1806 		    tmp437 = (K903989293 * tmp424) + (K427555093 * tmp421);
1807 		    tmp449 = (K941544065 * tmp447) - (K336889853 * tmp448);
1808 		    tmp457 = (K941544065 * tmp448) + (K336889853 * tmp447);
1809 	       }
1810 	       {
1811 		    fftw_real tmp414;
1812 		    fftw_real tmp444;
1813 		    fftw_real tmp417;
1814 		    fftw_real tmp445;
1815 		    fftw_real tmp412;
1816 		    fftw_real tmp416;
1817 		    ASSERT_ALIGNED_DOUBLE;
1818 		    tmp412 = tmp264 - tmp247;
1819 		    tmp414 = tmp412 - tmp413;
1820 		    tmp444 = tmp413 + tmp412;
1821 		    tmp416 = tmp277 - tmp276;
1822 		    tmp417 = tmp415 - tmp416;
1823 		    tmp445 = tmp415 + tmp416;
1824 		    tmp418 = (K427555093 * tmp414) + (K903989293 * tmp417);
1825 		    tmp436 = (K903989293 * tmp414) - (K427555093 * tmp417);
1826 		    tmp446 = (K336889853 * tmp444) + (K941544065 * tmp445);
1827 		    tmp456 = (K941544065 * tmp444) - (K336889853 * tmp445);
1828 	       }
1829 	  }
1830 	  {
1831 	       fftw_real tmp411;
1832 	       fftw_real tmp426;
1833 	       fftw_real tmp433;
1834 	       fftw_real tmp434;
1835 	       ASSERT_ALIGNED_DOUBLE;
1836 	       tmp411 = tmp403 + tmp410;
1837 	       tmp426 = tmp418 + tmp425;
1838 	       real_output[55 * real_ostride] = tmp411 - tmp426;
1839 	       real_output[9 * real_ostride] = tmp411 + tmp426;
1840 	       tmp433 = tmp429 - tmp432;
1841 	       tmp434 = tmp425 - tmp418;
1842 	       imag_output[23 * imag_ostride] = tmp433 + tmp434;
1843 	       imag_output[41 * imag_ostride] = tmp434 - tmp433;
1844 	  }
1845 	  {
1846 	       fftw_real tmp435;
1847 	       fftw_real tmp438;
1848 	       fftw_real tmp439;
1849 	       fftw_real tmp440;
1850 	       ASSERT_ALIGNED_DOUBLE;
1851 	       tmp435 = tmp432 + tmp429;
1852 	       tmp438 = tmp436 + tmp437;
1853 	       imag_output[9 * imag_ostride] = tmp435 + tmp438;
1854 	       imag_output[55 * imag_ostride] = tmp438 - tmp435;
1855 	       tmp439 = tmp403 - tmp410;
1856 	       tmp440 = tmp437 - tmp436;
1857 	       real_output[41 * real_ostride] = tmp439 - tmp440;
1858 	       real_output[23 * real_ostride] = tmp439 + tmp440;
1859 	  }
1860 	  {
1861 	       fftw_real tmp443;
1862 	       fftw_real tmp450;
1863 	       fftw_real tmp453;
1864 	       fftw_real tmp454;
1865 	       ASSERT_ALIGNED_DOUBLE;
1866 	       tmp443 = tmp441 + tmp442;
1867 	       tmp450 = tmp446 + tmp449;
1868 	       real_output[57 * real_ostride] = tmp443 - tmp450;
1869 	       real_output[7 * real_ostride] = tmp443 + tmp450;
1870 	       tmp453 = tmp451 - tmp452;
1871 	       tmp454 = tmp449 - tmp446;
1872 	       imag_output[25 * imag_ostride] = tmp453 + tmp454;
1873 	       imag_output[39 * imag_ostride] = tmp454 - tmp453;
1874 	  }
1875 	  {
1876 	       fftw_real tmp455;
1877 	       fftw_real tmp458;
1878 	       fftw_real tmp459;
1879 	       fftw_real tmp460;
1880 	       ASSERT_ALIGNED_DOUBLE;
1881 	       tmp455 = tmp452 + tmp451;
1882 	       tmp458 = tmp456 + tmp457;
1883 	       imag_output[7 * imag_ostride] = tmp455 + tmp458;
1884 	       imag_output[57 * imag_ostride] = tmp458 - tmp455;
1885 	       tmp459 = tmp441 - tmp442;
1886 	       tmp460 = tmp457 - tmp456;
1887 	       real_output[39 * real_ostride] = tmp459 - tmp460;
1888 	       real_output[25 * real_ostride] = tmp459 + tmp460;
1889 	  }
1890      }
1891      {
1892 	  fftw_real tmp629;
1893 	  fftw_real tmp719;
1894 	  fftw_real tmp710;
1895 	  fftw_real tmp730;
1896 	  fftw_real tmp636;
1897 	  fftw_real tmp729;
1898 	  fftw_real tmp707;
1899 	  fftw_real tmp720;
1900 	  fftw_real tmp670;
1901 	  fftw_real tmp714;
1902 	  fftw_real tmp724;
1903 	  fftw_real tmp734;
1904 	  fftw_real tmp703;
1905 	  fftw_real tmp715;
1906 	  fftw_real tmp727;
1907 	  fftw_real tmp735;
1908 	  fftw_real tmp628;
1909 	  fftw_real tmp709;
1910 	  ASSERT_ALIGNED_DOUBLE;
1911 	  tmp628 = K707106781 * (tmp626 + tmp627);
1912 	  tmp629 = tmp625 + tmp628;
1913 	  tmp719 = tmp625 - tmp628;
1914 	  tmp709 = K707106781 * (tmp627 - tmp626);
1915 	  tmp710 = tmp708 + tmp709;
1916 	  tmp730 = tmp709 - tmp708;
1917 	  {
1918 	       fftw_real tmp632;
1919 	       fftw_real tmp635;
1920 	       fftw_real tmp705;
1921 	       fftw_real tmp706;
1922 	       ASSERT_ALIGNED_DOUBLE;
1923 	       tmp632 = (K923879532 * tmp630) + (K382683432 * tmp631);
1924 	       tmp635 = (K923879532 * tmp633) - (K382683432 * tmp634);
1925 	       tmp636 = tmp632 + tmp635;
1926 	       tmp729 = tmp635 - tmp632;
1927 	       tmp705 = (K923879532 * tmp631) - (K382683432 * tmp630);
1928 	       tmp706 = (K382683432 * tmp633) + (K923879532 * tmp634);
1929 	       tmp707 = tmp705 + tmp706;
1930 	       tmp720 = tmp706 - tmp705;
1931 	  }
1932 	  {
1933 	       fftw_real tmp660;
1934 	       fftw_real tmp669;
1935 	       fftw_real tmp722;
1936 	       fftw_real tmp723;
1937 	       ASSERT_ALIGNED_DOUBLE;
1938 	       tmp660 = tmp644 + tmp659;
1939 	       tmp669 = tmp667 + tmp668;
1940 	       tmp670 = (K980785280 * tmp660) + (K195090322 * tmp669);
1941 	       tmp714 = (K980785280 * tmp669) - (K195090322 * tmp660);
1942 	       tmp722 = tmp644 - tmp659;
1943 	       tmp723 = tmp668 - tmp667;
1944 	       tmp724 = (K831469612 * tmp722) + (K555570233 * tmp723);
1945 	       tmp734 = (K831469612 * tmp723) - (K555570233 * tmp722);
1946 	  }
1947 	  {
1948 	       fftw_real tmp693;
1949 	       fftw_real tmp702;
1950 	       fftw_real tmp725;
1951 	       fftw_real tmp726;
1952 	       ASSERT_ALIGNED_DOUBLE;
1953 	       tmp693 = tmp677 + tmp692;
1954 	       tmp702 = tmp700 + tmp701;
1955 	       tmp703 = (K980785280 * tmp693) - (K195090322 * tmp702);
1956 	       tmp715 = (K195090322 * tmp693) + (K980785280 * tmp702);
1957 	       tmp725 = tmp677 - tmp692;
1958 	       tmp726 = tmp701 - tmp700;
1959 	       tmp727 = (K831469612 * tmp725) - (K555570233 * tmp726);
1960 	       tmp735 = (K555570233 * tmp725) + (K831469612 * tmp726);
1961 	  }
1962 	  {
1963 	       fftw_real tmp637;
1964 	       fftw_real tmp704;
1965 	       fftw_real tmp711;
1966 	       fftw_real tmp712;
1967 	       ASSERT_ALIGNED_DOUBLE;
1968 	       tmp637 = tmp629 + tmp636;
1969 	       tmp704 = tmp670 + tmp703;
1970 	       real_output[60 * real_ostride] = tmp637 - tmp704;
1971 	       real_output[4 * real_ostride] = tmp637 + tmp704;
1972 	       tmp711 = tmp707 - tmp710;
1973 	       tmp712 = tmp703 - tmp670;
1974 	       imag_output[28 * imag_ostride] = tmp711 + tmp712;
1975 	       imag_output[36 * imag_ostride] = tmp712 - tmp711;
1976 	  }
1977 	  {
1978 	       fftw_real tmp713;
1979 	       fftw_real tmp716;
1980 	       fftw_real tmp717;
1981 	       fftw_real tmp718;
1982 	       ASSERT_ALIGNED_DOUBLE;
1983 	       tmp713 = tmp710 + tmp707;
1984 	       tmp716 = tmp714 + tmp715;
1985 	       imag_output[4 * imag_ostride] = tmp713 + tmp716;
1986 	       imag_output[60 * imag_ostride] = tmp716 - tmp713;
1987 	       tmp717 = tmp629 - tmp636;
1988 	       tmp718 = tmp715 - tmp714;
1989 	       real_output[36 * real_ostride] = tmp717 - tmp718;
1990 	       real_output[28 * real_ostride] = tmp717 + tmp718;
1991 	  }
1992 	  {
1993 	       fftw_real tmp721;
1994 	       fftw_real tmp728;
1995 	       fftw_real tmp731;
1996 	       fftw_real tmp732;
1997 	       ASSERT_ALIGNED_DOUBLE;
1998 	       tmp721 = tmp719 + tmp720;
1999 	       tmp728 = tmp724 + tmp727;
2000 	       real_output[52 * real_ostride] = tmp721 - tmp728;
2001 	       real_output[12 * real_ostride] = tmp721 + tmp728;
2002 	       tmp731 = tmp729 - tmp730;
2003 	       tmp732 = tmp727 - tmp724;
2004 	       imag_output[20 * imag_ostride] = tmp731 + tmp732;
2005 	       imag_output[44 * imag_ostride] = tmp732 - tmp731;
2006 	  }
2007 	  {
2008 	       fftw_real tmp733;
2009 	       fftw_real tmp736;
2010 	       fftw_real tmp737;
2011 	       fftw_real tmp738;
2012 	       ASSERT_ALIGNED_DOUBLE;
2013 	       tmp733 = tmp730 + tmp729;
2014 	       tmp736 = tmp734 + tmp735;
2015 	       imag_output[12 * imag_ostride] = tmp733 + tmp736;
2016 	       imag_output[52 * imag_ostride] = tmp736 - tmp733;
2017 	       tmp737 = tmp719 - tmp720;
2018 	       tmp738 = tmp735 - tmp734;
2019 	       real_output[44 * real_ostride] = tmp737 - tmp738;
2020 	       real_output[20 * real_ostride] = tmp737 + tmp738;
2021 	  }
2022      }
2023      {
2024 	  fftw_real tmp795;
2025 	  fftw_real tmp877;
2026 	  fftw_real tmp882;
2027 	  fftw_real tmp892;
2028 	  fftw_real tmp885;
2029 	  fftw_real tmp893;
2030 	  fftw_real tmp857;
2031 	  fftw_real tmp873;
2032 	  fftw_real tmp836;
2033 	  fftw_real tmp872;
2034 	  fftw_real tmp861;
2035 	  fftw_real tmp878;
2036 	  fftw_real tmp814;
2037 	  fftw_real tmp887;
2038 	  fftw_real tmp868;
2039 	  fftw_real tmp888;
2040 	  ASSERT_ALIGNED_DOUBLE;
2041 	  {
2042 	       fftw_real tmp787;
2043 	       fftw_real tmp794;
2044 	       fftw_real tmp880;
2045 	       fftw_real tmp881;
2046 	       ASSERT_ALIGNED_DOUBLE;
2047 	       tmp787 = tmp783 + tmp786;
2048 	       tmp794 = tmp790 + tmp793;
2049 	       tmp795 = tmp787 + tmp794;
2050 	       tmp877 = tmp787 - tmp794;
2051 	       tmp880 = tmp820 - tmp827;
2052 	       tmp881 = tmp834 - tmp831;
2053 	       tmp882 = (K773010453 * tmp880) + (K634393284 * tmp881);
2054 	       tmp892 = (K773010453 * tmp881) - (K634393284 * tmp880);
2055 	  }
2056 	  {
2057 	       fftw_real tmp883;
2058 	       fftw_real tmp884;
2059 	       fftw_real tmp849;
2060 	       fftw_real tmp856;
2061 	       ASSERT_ALIGNED_DOUBLE;
2062 	       tmp883 = tmp841 - tmp848;
2063 	       tmp884 = tmp855 - tmp852;
2064 	       tmp885 = (K773010453 * tmp883) - (K634393284 * tmp884);
2065 	       tmp893 = (K634393284 * tmp883) + (K773010453 * tmp884);
2066 	       tmp849 = tmp841 + tmp848;
2067 	       tmp856 = tmp852 + tmp855;
2068 	       tmp857 = (K995184726 * tmp849) - (K098017140 * tmp856);
2069 	       tmp873 = (K098017140 * tmp849) + (K995184726 * tmp856);
2070 	  }
2071 	  {
2072 	       fftw_real tmp828;
2073 	       fftw_real tmp835;
2074 	       fftw_real tmp859;
2075 	       fftw_real tmp860;
2076 	       ASSERT_ALIGNED_DOUBLE;
2077 	       tmp828 = tmp820 + tmp827;
2078 	       tmp835 = tmp831 + tmp834;
2079 	       tmp836 = (K995184726 * tmp828) + (K098017140 * tmp835);
2080 	       tmp872 = (K995184726 * tmp835) - (K098017140 * tmp828);
2081 	       tmp859 = (K980785280 * tmp803) - (K195090322 * tmp800);
2082 	       tmp860 = (K195090322 * tmp809) + (K980785280 * tmp812);
2083 	       tmp861 = tmp859 + tmp860;
2084 	       tmp878 = tmp860 - tmp859;
2085 	  }
2086 	  {
2087 	       fftw_real tmp804;
2088 	       fftw_real tmp813;
2089 	       fftw_real tmp864;
2090 	       fftw_real tmp867;
2091 	       ASSERT_ALIGNED_DOUBLE;
2092 	       tmp804 = (K980785280 * tmp800) + (K195090322 * tmp803);
2093 	       tmp813 = (K980785280 * tmp809) - (K195090322 * tmp812);
2094 	       tmp814 = tmp804 + tmp813;
2095 	       tmp887 = tmp813 - tmp804;
2096 	       tmp864 = tmp862 + tmp863;
2097 	       tmp867 = tmp865 + tmp866;
2098 	       tmp868 = tmp864 + tmp867;
2099 	       tmp888 = tmp867 - tmp864;
2100 	  }
2101 	  {
2102 	       fftw_real tmp815;
2103 	       fftw_real tmp858;
2104 	       fftw_real tmp869;
2105 	       fftw_real tmp870;
2106 	       ASSERT_ALIGNED_DOUBLE;
2107 	       tmp815 = tmp795 + tmp814;
2108 	       tmp858 = tmp836 + tmp857;
2109 	       real_output[62 * real_ostride] = tmp815 - tmp858;
2110 	       real_output[2 * real_ostride] = tmp815 + tmp858;
2111 	       tmp869 = tmp861 - tmp868;
2112 	       tmp870 = tmp857 - tmp836;
2113 	       imag_output[30 * imag_ostride] = tmp869 + tmp870;
2114 	       imag_output[34 * imag_ostride] = tmp870 - tmp869;
2115 	  }
2116 	  {
2117 	       fftw_real tmp871;
2118 	       fftw_real tmp874;
2119 	       fftw_real tmp875;
2120 	       fftw_real tmp876;
2121 	       ASSERT_ALIGNED_DOUBLE;
2122 	       tmp871 = tmp868 + tmp861;
2123 	       tmp874 = tmp872 + tmp873;
2124 	       imag_output[2 * imag_ostride] = tmp871 + tmp874;
2125 	       imag_output[62 * imag_ostride] = tmp874 - tmp871;
2126 	       tmp875 = tmp795 - tmp814;
2127 	       tmp876 = tmp873 - tmp872;
2128 	       real_output[34 * real_ostride] = tmp875 - tmp876;
2129 	       real_output[30 * real_ostride] = tmp875 + tmp876;
2130 	  }
2131 	  {
2132 	       fftw_real tmp879;
2133 	       fftw_real tmp886;
2134 	       fftw_real tmp889;
2135 	       fftw_real tmp890;
2136 	       ASSERT_ALIGNED_DOUBLE;
2137 	       tmp879 = tmp877 + tmp878;
2138 	       tmp886 = tmp882 + tmp885;
2139 	       real_output[50 * real_ostride] = tmp879 - tmp886;
2140 	       real_output[14 * real_ostride] = tmp879 + tmp886;
2141 	       tmp889 = tmp887 - tmp888;
2142 	       tmp890 = tmp885 - tmp882;
2143 	       imag_output[18 * imag_ostride] = tmp889 + tmp890;
2144 	       imag_output[46 * imag_ostride] = tmp890 - tmp889;
2145 	  }
2146 	  {
2147 	       fftw_real tmp891;
2148 	       fftw_real tmp894;
2149 	       fftw_real tmp895;
2150 	       fftw_real tmp896;
2151 	       ASSERT_ALIGNED_DOUBLE;
2152 	       tmp891 = tmp888 + tmp887;
2153 	       tmp894 = tmp892 + tmp893;
2154 	       imag_output[14 * imag_ostride] = tmp891 + tmp894;
2155 	       imag_output[50 * imag_ostride] = tmp894 - tmp891;
2156 	       tmp895 = tmp877 - tmp878;
2157 	       tmp896 = tmp893 - tmp892;
2158 	       real_output[46 * real_ostride] = tmp895 - tmp896;
2159 	       real_output[18 * real_ostride] = tmp895 + tmp896;
2160 	  }
2161      }
2162      {
2163 	  fftw_real tmp899;
2164 	  fftw_real tmp937;
2165 	  fftw_real tmp942;
2166 	  fftw_real tmp952;
2167 	  fftw_real tmp945;
2168 	  fftw_real tmp953;
2169 	  fftw_real tmp921;
2170 	  fftw_real tmp933;
2171 	  fftw_real tmp914;
2172 	  fftw_real tmp932;
2173 	  fftw_real tmp925;
2174 	  fftw_real tmp938;
2175 	  fftw_real tmp906;
2176 	  fftw_real tmp947;
2177 	  fftw_real tmp928;
2178 	  fftw_real tmp948;
2179 	  ASSERT_ALIGNED_DOUBLE;
2180 	  {
2181 	       fftw_real tmp897;
2182 	       fftw_real tmp898;
2183 	       fftw_real tmp940;
2184 	       fftw_real tmp941;
2185 	       ASSERT_ALIGNED_DOUBLE;
2186 	       tmp897 = tmp783 - tmp786;
2187 	       tmp898 = tmp866 - tmp865;
2188 	       tmp899 = tmp897 - tmp898;
2189 	       tmp937 = tmp897 + tmp898;
2190 	       tmp940 = tmp909 + tmp908;
2191 	       tmp941 = tmp911 + tmp912;
2192 	       tmp942 = (K290284677 * tmp940) + (K956940335 * tmp941);
2193 	       tmp952 = (K956940335 * tmp940) - (K290284677 * tmp941);
2194 	  }
2195 	  {
2196 	       fftw_real tmp943;
2197 	       fftw_real tmp944;
2198 	       fftw_real tmp917;
2199 	       fftw_real tmp920;
2200 	       ASSERT_ALIGNED_DOUBLE;
2201 	       tmp943 = tmp915 + tmp916;
2202 	       tmp944 = tmp919 + tmp918;
2203 	       tmp945 = (K956940335 * tmp943) - (K290284677 * tmp944);
2204 	       tmp953 = (K956940335 * tmp944) + (K290284677 * tmp943);
2205 	       tmp917 = tmp915 - tmp916;
2206 	       tmp920 = tmp918 - tmp919;
2207 	       tmp921 = (K881921264 * tmp917) - (K471396736 * tmp920);
2208 	       tmp933 = (K881921264 * tmp920) + (K471396736 * tmp917);
2209 	  }
2210 	  {
2211 	       fftw_real tmp910;
2212 	       fftw_real tmp913;
2213 	       fftw_real tmp923;
2214 	       fftw_real tmp924;
2215 	       ASSERT_ALIGNED_DOUBLE;
2216 	       tmp910 = tmp908 - tmp909;
2217 	       tmp913 = tmp911 - tmp912;
2218 	       tmp914 = (K471396736 * tmp910) + (K881921264 * tmp913);
2219 	       tmp932 = (K881921264 * tmp910) - (K471396736 * tmp913);
2220 	       tmp923 = (K831469612 * tmp900) - (K555570233 * tmp901);
2221 	       tmp924 = (K831469612 * tmp904) + (K555570233 * tmp903);
2222 	       tmp925 = tmp923 - tmp924;
2223 	       tmp938 = tmp924 + tmp923;
2224 	  }
2225 	  {
2226 	       fftw_real tmp902;
2227 	       fftw_real tmp905;
2228 	       fftw_real tmp926;
2229 	       fftw_real tmp927;
2230 	       ASSERT_ALIGNED_DOUBLE;
2231 	       tmp902 = (K555570233 * tmp900) + (K831469612 * tmp901);
2232 	       tmp905 = (K831469612 * tmp903) - (K555570233 * tmp904);
2233 	       tmp906 = tmp902 - tmp905;
2234 	       tmp947 = tmp905 + tmp902;
2235 	       tmp926 = tmp793 - tmp790;
2236 	       tmp927 = tmp863 - tmp862;
2237 	       tmp928 = tmp926 - tmp927;
2238 	       tmp948 = tmp927 + tmp926;
2239 	  }
2240 	  {
2241 	       fftw_real tmp907;
2242 	       fftw_real tmp922;
2243 	       fftw_real tmp929;
2244 	       fftw_real tmp930;
2245 	       ASSERT_ALIGNED_DOUBLE;
2246 	       tmp907 = tmp899 + tmp906;
2247 	       tmp922 = tmp914 + tmp921;
2248 	       real_output[54 * real_ostride] = tmp907 - tmp922;
2249 	       real_output[10 * real_ostride] = tmp907 + tmp922;
2250 	       tmp929 = tmp925 - tmp928;
2251 	       tmp930 = tmp921 - tmp914;
2252 	       imag_output[22 * imag_ostride] = tmp929 + tmp930;
2253 	       imag_output[42 * imag_ostride] = tmp930 - tmp929;
2254 	  }
2255 	  {
2256 	       fftw_real tmp931;
2257 	       fftw_real tmp934;
2258 	       fftw_real tmp935;
2259 	       fftw_real tmp936;
2260 	       ASSERT_ALIGNED_DOUBLE;
2261 	       tmp931 = tmp928 + tmp925;
2262 	       tmp934 = tmp932 + tmp933;
2263 	       imag_output[10 * imag_ostride] = tmp931 + tmp934;
2264 	       imag_output[54 * imag_ostride] = tmp934 - tmp931;
2265 	       tmp935 = tmp899 - tmp906;
2266 	       tmp936 = tmp933 - tmp932;
2267 	       real_output[42 * real_ostride] = tmp935 - tmp936;
2268 	       real_output[22 * real_ostride] = tmp935 + tmp936;
2269 	  }
2270 	  {
2271 	       fftw_real tmp939;
2272 	       fftw_real tmp946;
2273 	       fftw_real tmp949;
2274 	       fftw_real tmp950;
2275 	       ASSERT_ALIGNED_DOUBLE;
2276 	       tmp939 = tmp937 + tmp938;
2277 	       tmp946 = tmp942 + tmp945;
2278 	       real_output[58 * real_ostride] = tmp939 - tmp946;
2279 	       real_output[6 * real_ostride] = tmp939 + tmp946;
2280 	       tmp949 = tmp947 - tmp948;
2281 	       tmp950 = tmp945 - tmp942;
2282 	       imag_output[26 * imag_ostride] = tmp949 + tmp950;
2283 	       imag_output[38 * imag_ostride] = tmp950 - tmp949;
2284 	  }
2285 	  {
2286 	       fftw_real tmp951;
2287 	       fftw_real tmp954;
2288 	       fftw_real tmp955;
2289 	       fftw_real tmp956;
2290 	       ASSERT_ALIGNED_DOUBLE;
2291 	       tmp951 = tmp948 + tmp947;
2292 	       tmp954 = tmp952 + tmp953;
2293 	       imag_output[6 * imag_ostride] = tmp951 + tmp954;
2294 	       imag_output[58 * imag_ostride] = tmp954 - tmp951;
2295 	       tmp955 = tmp937 - tmp938;
2296 	       tmp956 = tmp953 - tmp952;
2297 	       real_output[38 * real_ostride] = tmp955 - tmp956;
2298 	       real_output[26 * real_ostride] = tmp955 + tmp956;
2299 	  }
2300      }
2301      {
2302 	  fftw_real tmp471;
2303 	  fftw_real tmp545;
2304 	  fftw_real tmp486;
2305 	  fftw_real tmp555;
2306 	  fftw_real tmp536;
2307 	  fftw_real tmp556;
2308 	  fftw_real tmp529;
2309 	  fftw_real tmp546;
2310 	  fftw_real tmp525;
2311 	  fftw_real tmp541;
2312 	  fftw_real tmp553;
2313 	  fftw_real tmp561;
2314 	  fftw_real tmp506;
2315 	  fftw_real tmp540;
2316 	  fftw_real tmp550;
2317 	  fftw_real tmp560;
2318 	  ASSERT_ALIGNED_DOUBLE;
2319 	  {
2320 	       fftw_real tmp463;
2321 	       fftw_real tmp470;
2322 	       fftw_real tmp527;
2323 	       fftw_real tmp528;
2324 	       ASSERT_ALIGNED_DOUBLE;
2325 	       tmp463 = tmp461 + tmp462;
2326 	       tmp470 = tmp466 + tmp469;
2327 	       tmp471 = tmp463 + tmp470;
2328 	       tmp545 = tmp463 - tmp470;
2329 	       {
2330 		    fftw_real tmp478;
2331 		    fftw_real tmp485;
2332 		    fftw_real tmp532;
2333 		    fftw_real tmp535;
2334 		    ASSERT_ALIGNED_DOUBLE;
2335 		    tmp478 = (K956940335 * tmp474) + (K290284677 * tmp477);
2336 		    tmp485 = (K956940335 * tmp481) - (K290284677 * tmp484);
2337 		    tmp486 = tmp478 + tmp485;
2338 		    tmp555 = tmp485 - tmp478;
2339 		    tmp532 = tmp530 + tmp531;
2340 		    tmp535 = tmp533 + tmp534;
2341 		    tmp536 = tmp532 + tmp535;
2342 		    tmp556 = tmp535 - tmp532;
2343 	       }
2344 	       tmp527 = (K956940335 * tmp477) - (K290284677 * tmp474);
2345 	       tmp528 = (K290284677 * tmp481) + (K956940335 * tmp484);
2346 	       tmp529 = tmp527 + tmp528;
2347 	       tmp546 = tmp528 - tmp527;
2348 	       {
2349 		    fftw_real tmp517;
2350 		    fftw_real tmp551;
2351 		    fftw_real tmp524;
2352 		    fftw_real tmp552;
2353 		    fftw_real tmp516;
2354 		    fftw_real tmp523;
2355 		    ASSERT_ALIGNED_DOUBLE;
2356 		    tmp516 = tmp512 + tmp515;
2357 		    tmp517 = tmp509 + tmp516;
2358 		    tmp551 = tmp509 - tmp516;
2359 		    tmp523 = tmp521 + tmp522;
2360 		    tmp524 = tmp520 + tmp523;
2361 		    tmp552 = tmp523 - tmp520;
2362 		    tmp525 = (K989176509 * tmp517) - (K146730474 * tmp524);
2363 		    tmp541 = (K146730474 * tmp517) + (K989176509 * tmp524);
2364 		    tmp553 = (K803207531 * tmp551) - (K595699304 * tmp552);
2365 		    tmp561 = (K595699304 * tmp551) + (K803207531 * tmp552);
2366 	       }
2367 	       {
2368 		    fftw_real tmp498;
2369 		    fftw_real tmp548;
2370 		    fftw_real tmp505;
2371 		    fftw_real tmp549;
2372 		    fftw_real tmp497;
2373 		    fftw_real tmp504;
2374 		    ASSERT_ALIGNED_DOUBLE;
2375 		    tmp497 = tmp493 + tmp496;
2376 		    tmp498 = tmp490 + tmp497;
2377 		    tmp548 = tmp490 - tmp497;
2378 		    tmp504 = tmp502 + tmp503;
2379 		    tmp505 = tmp501 + tmp504;
2380 		    tmp549 = tmp504 - tmp501;
2381 		    tmp506 = (K989176509 * tmp498) + (K146730474 * tmp505);
2382 		    tmp540 = (K989176509 * tmp505) - (K146730474 * tmp498);
2383 		    tmp550 = (K803207531 * tmp548) + (K595699304 * tmp549);
2384 		    tmp560 = (K803207531 * tmp549) - (K595699304 * tmp548);
2385 	       }
2386 	  }
2387 	  {
2388 	       fftw_real tmp487;
2389 	       fftw_real tmp526;
2390 	       fftw_real tmp537;
2391 	       fftw_real tmp538;
2392 	       ASSERT_ALIGNED_DOUBLE;
2393 	       tmp487 = tmp471 + tmp486;
2394 	       tmp526 = tmp506 + tmp525;
2395 	       real_output[61 * real_ostride] = tmp487 - tmp526;
2396 	       real_output[3 * real_ostride] = tmp487 + tmp526;
2397 	       tmp537 = tmp529 - tmp536;
2398 	       tmp538 = tmp525 - tmp506;
2399 	       imag_output[29 * imag_ostride] = tmp537 + tmp538;
2400 	       imag_output[35 * imag_ostride] = tmp538 - tmp537;
2401 	  }
2402 	  {
2403 	       fftw_real tmp539;
2404 	       fftw_real tmp542;
2405 	       fftw_real tmp543;
2406 	       fftw_real tmp544;
2407 	       ASSERT_ALIGNED_DOUBLE;
2408 	       tmp539 = tmp536 + tmp529;
2409 	       tmp542 = tmp540 + tmp541;
2410 	       imag_output[3 * imag_ostride] = tmp539 + tmp542;
2411 	       imag_output[61 * imag_ostride] = tmp542 - tmp539;
2412 	       tmp543 = tmp471 - tmp486;
2413 	       tmp544 = tmp541 - tmp540;
2414 	       real_output[35 * real_ostride] = tmp543 - tmp544;
2415 	       real_output[29 * real_ostride] = tmp543 + tmp544;
2416 	  }
2417 	  {
2418 	       fftw_real tmp547;
2419 	       fftw_real tmp554;
2420 	       fftw_real tmp557;
2421 	       fftw_real tmp558;
2422 	       ASSERT_ALIGNED_DOUBLE;
2423 	       tmp547 = tmp545 + tmp546;
2424 	       tmp554 = tmp550 + tmp553;
2425 	       real_output[51 * real_ostride] = tmp547 - tmp554;
2426 	       real_output[13 * real_ostride] = tmp547 + tmp554;
2427 	       tmp557 = tmp555 - tmp556;
2428 	       tmp558 = tmp553 - tmp550;
2429 	       imag_output[19 * imag_ostride] = tmp557 + tmp558;
2430 	       imag_output[45 * imag_ostride] = tmp558 - tmp557;
2431 	  }
2432 	  {
2433 	       fftw_real tmp559;
2434 	       fftw_real tmp562;
2435 	       fftw_real tmp563;
2436 	       fftw_real tmp564;
2437 	       ASSERT_ALIGNED_DOUBLE;
2438 	       tmp559 = tmp556 + tmp555;
2439 	       tmp562 = tmp560 + tmp561;
2440 	       imag_output[13 * imag_ostride] = tmp559 + tmp562;
2441 	       imag_output[51 * imag_ostride] = tmp562 - tmp559;
2442 	       tmp563 = tmp545 - tmp546;
2443 	       tmp564 = tmp561 - tmp560;
2444 	       real_output[45 * real_ostride] = tmp563 - tmp564;
2445 	       real_output[19 * real_ostride] = tmp563 + tmp564;
2446 	  }
2447      }
2448      {
2449 	  fftw_real tmp567;
2450 	  fftw_real tmp605;
2451 	  fftw_real tmp574;
2452 	  fftw_real tmp615;
2453 	  fftw_real tmp596;
2454 	  fftw_real tmp616;
2455 	  fftw_real tmp593;
2456 	  fftw_real tmp606;
2457 	  fftw_real tmp589;
2458 	  fftw_real tmp601;
2459 	  fftw_real tmp613;
2460 	  fftw_real tmp621;
2461 	  fftw_real tmp582;
2462 	  fftw_real tmp600;
2463 	  fftw_real tmp610;
2464 	  fftw_real tmp620;
2465 	  ASSERT_ALIGNED_DOUBLE;
2466 	  {
2467 	       fftw_real tmp565;
2468 	       fftw_real tmp566;
2469 	       fftw_real tmp591;
2470 	       fftw_real tmp592;
2471 	       ASSERT_ALIGNED_DOUBLE;
2472 	       tmp565 = tmp461 - tmp462;
2473 	       tmp566 = tmp534 - tmp533;
2474 	       tmp567 = tmp565 - tmp566;
2475 	       tmp605 = tmp565 + tmp566;
2476 	       {
2477 		    fftw_real tmp570;
2478 		    fftw_real tmp573;
2479 		    fftw_real tmp594;
2480 		    fftw_real tmp595;
2481 		    ASSERT_ALIGNED_DOUBLE;
2482 		    tmp570 = (K471396736 * tmp568) + (K881921264 * tmp569);
2483 		    tmp573 = (K881921264 * tmp571) - (K471396736 * tmp572);
2484 		    tmp574 = tmp570 - tmp573;
2485 		    tmp615 = tmp573 + tmp570;
2486 		    tmp594 = tmp469 - tmp466;
2487 		    tmp595 = tmp531 - tmp530;
2488 		    tmp596 = tmp594 - tmp595;
2489 		    tmp616 = tmp595 + tmp594;
2490 	       }
2491 	       tmp591 = (K881921264 * tmp568) - (K471396736 * tmp569);
2492 	       tmp592 = (K881921264 * tmp572) + (K471396736 * tmp571);
2493 	       tmp593 = tmp591 - tmp592;
2494 	       tmp606 = tmp592 + tmp591;
2495 	       {
2496 		    fftw_real tmp585;
2497 		    fftw_real tmp611;
2498 		    fftw_real tmp588;
2499 		    fftw_real tmp612;
2500 		    fftw_real tmp584;
2501 		    fftw_real tmp586;
2502 		    ASSERT_ALIGNED_DOUBLE;
2503 		    tmp584 = tmp522 - tmp521;
2504 		    tmp585 = tmp583 - tmp584;
2505 		    tmp611 = tmp583 + tmp584;
2506 		    tmp586 = tmp515 - tmp512;
2507 		    tmp588 = tmp586 - tmp587;
2508 		    tmp612 = tmp587 + tmp586;
2509 		    tmp589 = (K857728610 * tmp585) - (K514102744 * tmp588);
2510 		    tmp601 = (K857728610 * tmp588) + (K514102744 * tmp585);
2511 		    tmp613 = (K970031253 * tmp611) - (K242980179 * tmp612);
2512 		    tmp621 = (K970031253 * tmp612) + (K242980179 * tmp611);
2513 	       }
2514 	       {
2515 		    fftw_real tmp578;
2516 		    fftw_real tmp608;
2517 		    fftw_real tmp581;
2518 		    fftw_real tmp609;
2519 		    fftw_real tmp576;
2520 		    fftw_real tmp580;
2521 		    ASSERT_ALIGNED_DOUBLE;
2522 		    tmp576 = tmp496 - tmp493;
2523 		    tmp578 = tmp576 - tmp577;
2524 		    tmp608 = tmp577 + tmp576;
2525 		    tmp580 = tmp503 - tmp502;
2526 		    tmp581 = tmp579 - tmp580;
2527 		    tmp609 = tmp579 + tmp580;
2528 		    tmp582 = (K514102744 * tmp578) + (K857728610 * tmp581);
2529 		    tmp600 = (K857728610 * tmp578) - (K514102744 * tmp581);
2530 		    tmp610 = (K242980179 * tmp608) + (K970031253 * tmp609);
2531 		    tmp620 = (K970031253 * tmp608) - (K242980179 * tmp609);
2532 	       }
2533 	  }
2534 	  {
2535 	       fftw_real tmp575;
2536 	       fftw_real tmp590;
2537 	       fftw_real tmp597;
2538 	       fftw_real tmp598;
2539 	       ASSERT_ALIGNED_DOUBLE;
2540 	       tmp575 = tmp567 + tmp574;
2541 	       tmp590 = tmp582 + tmp589;
2542 	       real_output[53 * real_ostride] = tmp575 - tmp590;
2543 	       real_output[11 * real_ostride] = tmp575 + tmp590;
2544 	       tmp597 = tmp593 - tmp596;
2545 	       tmp598 = tmp589 - tmp582;
2546 	       imag_output[21 * imag_ostride] = tmp597 + tmp598;
2547 	       imag_output[43 * imag_ostride] = tmp598 - tmp597;
2548 	  }
2549 	  {
2550 	       fftw_real tmp599;
2551 	       fftw_real tmp602;
2552 	       fftw_real tmp603;
2553 	       fftw_real tmp604;
2554 	       ASSERT_ALIGNED_DOUBLE;
2555 	       tmp599 = tmp596 + tmp593;
2556 	       tmp602 = tmp600 + tmp601;
2557 	       imag_output[11 * imag_ostride] = tmp599 + tmp602;
2558 	       imag_output[53 * imag_ostride] = tmp602 - tmp599;
2559 	       tmp603 = tmp567 - tmp574;
2560 	       tmp604 = tmp601 - tmp600;
2561 	       real_output[43 * real_ostride] = tmp603 - tmp604;
2562 	       real_output[21 * real_ostride] = tmp603 + tmp604;
2563 	  }
2564 	  {
2565 	       fftw_real tmp607;
2566 	       fftw_real tmp614;
2567 	       fftw_real tmp617;
2568 	       fftw_real tmp618;
2569 	       ASSERT_ALIGNED_DOUBLE;
2570 	       tmp607 = tmp605 + tmp606;
2571 	       tmp614 = tmp610 + tmp613;
2572 	       real_output[59 * real_ostride] = tmp607 - tmp614;
2573 	       real_output[5 * real_ostride] = tmp607 + tmp614;
2574 	       tmp617 = tmp615 - tmp616;
2575 	       tmp618 = tmp613 - tmp610;
2576 	       imag_output[27 * imag_ostride] = tmp617 + tmp618;
2577 	       imag_output[37 * imag_ostride] = tmp618 - tmp617;
2578 	  }
2579 	  {
2580 	       fftw_real tmp619;
2581 	       fftw_real tmp622;
2582 	       fftw_real tmp623;
2583 	       fftw_real tmp624;
2584 	       ASSERT_ALIGNED_DOUBLE;
2585 	       tmp619 = tmp616 + tmp615;
2586 	       tmp622 = tmp620 + tmp621;
2587 	       imag_output[5 * imag_ostride] = tmp619 + tmp622;
2588 	       imag_output[59 * imag_ostride] = tmp622 - tmp619;
2589 	       tmp623 = tmp605 - tmp606;
2590 	       tmp624 = tmp621 - tmp620;
2591 	       real_output[37 * real_ostride] = tmp623 - tmp624;
2592 	       real_output[27 * real_ostride] = tmp623 + tmp624;
2593 	  }
2594      }
2595 }
2596 
2597 fftw_codelet_desc fftw_real2hc_128_desc = { /* descriptor object for the fftw_real2hc_128 routine; the initializer is positional, so entry order must match the member order of fftw_codelet_desc (declared outside this file) -- per-entry meanings below are inferred from the values, TODO confirm against that declaration */
2598      "fftw_real2hc_128", /* string spelling of the routine's identifier; presumably the codelet's printable name */
2599      (void (*)()) fftw_real2hc_128, /* the routine itself, cast to an unprototyped function-pointer type, so its real signature is not carried by this entry */
2600      128, /* presumably the transform length; matches the "-real2hc 128" generator option recorded at the top of the file */
2601      FFTW_FORWARD, /* presumably the transform direction -- confirm */
2602      FFTW_REAL2HC, /* presumably the codelet kind (real input to halfcomplex output, going by the name) -- confirm */
2603      2818, /* NOTE(review): meaning not visible from this file; presumably a generator-assigned identifier for this codelet -- confirm */
2604      0, /* presumably the number of twiddle factors this codelet takes -- confirm */
2605      (const int *) 0, /* null pointer: no const int table is attached; presumably the twiddle-order table -- confirm */
2606 };
2607