1 /*
2  * Copyright (c) 1997-1999, 2003 Massachusetts Institute of Technology
3  *
4  * This program is free software; you can redistribute it and/or modify
5  * it under the terms of the GNU General Public License as published by
6  * the Free Software Foundation; either version 2 of the License, or
7  * (at your option) any later version.
8  *
9  * This program is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12  * GNU General Public License for more details.
13  *
14  * You should have received a copy of the GNU General Public License
15  * along with this program; if not, write to the Free Software
16  * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
17  *
18  */
19 
20 /* This file was automatically generated --- DO NOT EDIT */
21 /* Generated on Mon Mar 24 02:08:53 EST 2003 */
22 
23 #include "fftw-int.h"
24 #include "fftw.h"
25 
26 /* Generated by: /homee/stevenj/cvs/fftw/gensrc/genfft -magic-alignment-check -magic-twiddle-load-all -magic-variables 4 -magic-loopi -hc2hc-backward 5 */
27 
28 /*
29  * This function contains 64 FP additions, 42 FP multiplications,
30  * (or, 42 additions, 20 multiplications, 22 fused multiply/add),
31  * 25 stack variables, and 40 memory accesses
32  */
33 static const fftw_real K250000000 =
34 FFTW_KONST(+0.250000000000000000000000000000000000000000000);
35 static const fftw_real K559016994 =
36 FFTW_KONST(+0.559016994374947424102293417182819058860154590);
37 static const fftw_real K951056516 =
38 FFTW_KONST(+0.951056516295153572116439333379382143405698634);
39 static const fftw_real K587785252 =
40 FFTW_KONST(+0.587785252292473129168705954639072768597652438);
41 static const fftw_real K2_000000000 =
42 FFTW_KONST(+2.000000000000000000000000000000000000000000000);
43 static const fftw_real K500000000 =
44 FFTW_KONST(+0.500000000000000000000000000000000000000000000);
45 static const fftw_real K1_118033988 =
46 FFTW_KONST(+1.118033988749894848204586834365638117720309180);
47 static const fftw_real K1_175570504 =
48 FFTW_KONST(+1.175570504584946258337411909278145537195304875);
49 static const fftw_real K1_902113032 =
50 FFTW_KONST(+1.902113032590307144232878666758764286811397268);
51 
52 /*
53  * Generator Id's :
54  * $Id: exprdag.ml,v 1.43 2003/03/16 23:43:46 stevenj Exp $
55  * $Id: fft.ml,v 1.44 2003/03/16 23:43:46 stevenj Exp $
56  * $Id: to_c.ml,v 1.26 2003/03/16 23:43:46 stevenj Exp $
57  */
58 
fftw_hc2hc_backward_5(fftw_real * A,const fftw_complex * W,int iostride,int m,int dist)59 void fftw_hc2hc_backward_5(fftw_real *A, const fftw_complex *W,
60 			   int iostride, int m, int dist)
61 {
62      int i;
63      fftw_real *X;
64      fftw_real *Y;
65      X = A;
66      Y = A + (5 * iostride);
67      {
68 	  fftw_real tmp70;
69 	  fftw_real tmp72;
70 	  fftw_real tmp61;
71 	  fftw_real tmp64;
72 	  fftw_real tmp65;
73 	  fftw_real tmp66;
74 	  fftw_real tmp71;
75 	  fftw_real tmp67;
76 	  ASSERT_ALIGNED_DOUBLE;
77 	  {
78 	       fftw_real tmp68;
79 	       fftw_real tmp69;
80 	       fftw_real tmp62;
81 	       fftw_real tmp63;
82 	       ASSERT_ALIGNED_DOUBLE;
83 	       tmp68 = Y[-iostride];
84 	       tmp69 = Y[-2 * iostride];
85 	       tmp70 = (K1_902113032 * tmp68) + (K1_175570504 * tmp69);
86 	       tmp72 = (K1_902113032 * tmp69) - (K1_175570504 * tmp68);
87 	       tmp61 = X[0];
88 	       tmp62 = X[iostride];
89 	       tmp63 = X[2 * iostride];
90 	       tmp64 = tmp62 + tmp63;
91 	       tmp65 = K1_118033988 * (tmp62 - tmp63);
92 	       tmp66 = tmp61 - (K500000000 * tmp64);
93 	  }
94 	  X[0] = tmp61 + (K2_000000000 * tmp64);
95 	  tmp71 = tmp66 - tmp65;
96 	  X[3 * iostride] = tmp71 - tmp72;
97 	  X[2 * iostride] = tmp71 + tmp72;
98 	  tmp67 = tmp65 + tmp66;
99 	  X[4 * iostride] = tmp67 + tmp70;
100 	  X[iostride] = tmp67 - tmp70;
101      }
102      X = X + dist;
103      Y = Y - dist;
104      for (i = 2; i < m; i = i + 2, X = X + dist, Y = Y - dist, W = W + 4) {
105 	  fftw_real tmp13;
106 	  fftw_real tmp32;
107 	  fftw_real tmp50;
108 	  fftw_real tmp39;
109 	  fftw_real tmp20;
110 	  fftw_real tmp38;
111 	  fftw_real tmp21;
112 	  fftw_real tmp34;
113 	  fftw_real tmp28;
114 	  fftw_real tmp33;
115 	  fftw_real tmp43;
116 	  fftw_real tmp55;
117 	  ASSERT_ALIGNED_DOUBLE;
118 	  {
119 	       fftw_real tmp19;
120 	       fftw_real tmp31;
121 	       fftw_real tmp16;
122 	       fftw_real tmp30;
123 	       ASSERT_ALIGNED_DOUBLE;
124 	       tmp13 = X[0];
125 	       {
126 		    fftw_real tmp17;
127 		    fftw_real tmp18;
128 		    fftw_real tmp14;
129 		    fftw_real tmp15;
130 		    ASSERT_ALIGNED_DOUBLE;
131 		    tmp17 = X[2 * iostride];
132 		    tmp18 = Y[-3 * iostride];
133 		    tmp19 = tmp17 + tmp18;
134 		    tmp31 = tmp17 - tmp18;
135 		    tmp14 = X[iostride];
136 		    tmp15 = Y[-4 * iostride];
137 		    tmp16 = tmp14 + tmp15;
138 		    tmp30 = tmp14 - tmp15;
139 	       }
140 	       tmp32 = (K587785252 * tmp30) - (K951056516 * tmp31);
141 	       tmp50 = (K951056516 * tmp30) + (K587785252 * tmp31);
142 	       tmp39 = K559016994 * (tmp16 - tmp19);
143 	       tmp20 = tmp16 + tmp19;
144 	       tmp38 = tmp13 - (K250000000 * tmp20);
145 	  }
146 	  {
147 	       fftw_real tmp27;
148 	       fftw_real tmp42;
149 	       fftw_real tmp24;
150 	       fftw_real tmp41;
151 	       ASSERT_ALIGNED_DOUBLE;
152 	       tmp21 = Y[0];
153 	       {
154 		    fftw_real tmp25;
155 		    fftw_real tmp26;
156 		    fftw_real tmp22;
157 		    fftw_real tmp23;
158 		    ASSERT_ALIGNED_DOUBLE;
159 		    tmp25 = Y[-2 * iostride];
160 		    tmp26 = X[3 * iostride];
161 		    tmp27 = tmp25 - tmp26;
162 		    tmp42 = tmp25 + tmp26;
163 		    tmp22 = Y[-iostride];
164 		    tmp23 = X[4 * iostride];
165 		    tmp24 = tmp22 - tmp23;
166 		    tmp41 = tmp22 + tmp23;
167 	       }
168 	       tmp34 = K559016994 * (tmp24 - tmp27);
169 	       tmp28 = tmp24 + tmp27;
170 	       tmp33 = tmp21 - (K250000000 * tmp28);
171 	       tmp43 = (K587785252 * tmp41) - (K951056516 * tmp42);
172 	       tmp55 = (K951056516 * tmp41) + (K587785252 * tmp42);
173 	  }
174 	  X[0] = tmp13 + tmp20;
175 	  {
176 	       fftw_real tmp52;
177 	       fftw_real tmp58;
178 	       fftw_real tmp56;
179 	       fftw_real tmp60;
180 	       fftw_real tmp51;
181 	       fftw_real tmp54;
182 	       ASSERT_ALIGNED_DOUBLE;
183 	       tmp51 = tmp34 + tmp33;
184 	       tmp52 = tmp50 + tmp51;
185 	       tmp58 = tmp51 - tmp50;
186 	       tmp54 = tmp39 + tmp38;
187 	       tmp56 = tmp54 - tmp55;
188 	       tmp60 = tmp54 + tmp55;
189 	       {
190 		    fftw_real tmp49;
191 		    fftw_real tmp53;
192 		    fftw_real tmp57;
193 		    fftw_real tmp59;
194 		    ASSERT_ALIGNED_DOUBLE;
195 		    tmp49 = c_re(W[0]);
196 		    tmp53 = c_im(W[0]);
197 		    Y[-3 * iostride] = (tmp49 * tmp52) - (tmp53 * tmp56);
198 		    X[iostride] = (tmp53 * tmp52) + (tmp49 * tmp56);
199 		    tmp57 = c_re(W[3]);
200 		    tmp59 = c_im(W[3]);
201 		    Y[0] = (tmp57 * tmp58) - (tmp59 * tmp60);
202 		    X[4 * iostride] = (tmp59 * tmp58) + (tmp57 * tmp60);
203 	       }
204 	  }
205 	  Y[-4 * iostride] = tmp21 + tmp28;
206 	  {
207 	       fftw_real tmp36;
208 	       fftw_real tmp46;
209 	       fftw_real tmp44;
210 	       fftw_real tmp48;
211 	       fftw_real tmp35;
212 	       fftw_real tmp40;
213 	       ASSERT_ALIGNED_DOUBLE;
214 	       tmp35 = tmp33 - tmp34;
215 	       tmp36 = tmp32 + tmp35;
216 	       tmp46 = tmp35 - tmp32;
217 	       tmp40 = tmp38 - tmp39;
218 	       tmp44 = tmp40 - tmp43;
219 	       tmp48 = tmp40 + tmp43;
220 	       {
221 		    fftw_real tmp29;
222 		    fftw_real tmp37;
223 		    fftw_real tmp45;
224 		    fftw_real tmp47;
225 		    ASSERT_ALIGNED_DOUBLE;
226 		    tmp29 = c_re(W[1]);
227 		    tmp37 = c_im(W[1]);
228 		    Y[-2 * iostride] = (tmp29 * tmp36) - (tmp37 * tmp44);
229 		    X[2 * iostride] = (tmp37 * tmp36) + (tmp29 * tmp44);
230 		    tmp45 = c_re(W[2]);
231 		    tmp47 = c_im(W[2]);
232 		    Y[-iostride] = (tmp45 * tmp46) - (tmp47 * tmp48);
233 		    X[3 * iostride] = (tmp47 * tmp46) + (tmp45 * tmp48);
234 	       }
235 	  }
236      }
237      if (i == m) {
238 	  fftw_real tmp10;
239 	  fftw_real tmp12;
240 	  fftw_real tmp1;
241 	  fftw_real tmp4;
242 	  fftw_real tmp5;
243 	  fftw_real tmp6;
244 	  fftw_real tmp11;
245 	  fftw_real tmp7;
246 	  ASSERT_ALIGNED_DOUBLE;
247 	  {
248 	       fftw_real tmp8;
249 	       fftw_real tmp9;
250 	       fftw_real tmp2;
251 	       fftw_real tmp3;
252 	       ASSERT_ALIGNED_DOUBLE;
253 	       tmp8 = Y[-iostride];
254 	       tmp9 = Y[0];
255 	       tmp10 = (K1_902113032 * tmp8) + (K1_175570504 * tmp9);
256 	       tmp12 = (K1_175570504 * tmp8) - (K1_902113032 * tmp9);
257 	       tmp1 = X[2 * iostride];
258 	       tmp2 = X[iostride];
259 	       tmp3 = X[0];
260 	       tmp4 = tmp2 + tmp3;
261 	       tmp5 = (K500000000 * tmp4) - tmp1;
262 	       tmp6 = K1_118033988 * (tmp3 - tmp2);
263 	  }
264 	  X[0] = tmp1 + (K2_000000000 * tmp4);
265 	  tmp11 = tmp6 - tmp5;
266 	  X[2 * iostride] = tmp11 + tmp12;
267 	  X[3 * iostride] = tmp12 - tmp11;
268 	  tmp7 = tmp5 + tmp6;
269 	  X[iostride] = tmp7 - tmp10;
270 	  X[4 * iostride] = -(tmp7 + tmp10);
271      }
272 }
273 
274 static const int twiddle_order[] = { 1, 2, 3, 4 };
275 fftw_codelet_desc fftw_hc2hc_backward_5_desc = {
276      "fftw_hc2hc_backward_5",
277      (void (*)()) fftw_hc2hc_backward_5,
278      5,
279      FFTW_BACKWARD,
280      FFTW_HC2HC,
281      124,
282      4,
283      twiddle_order,
284 };
285