Details | Last modification | View Log | RSS feed
Rev | Author | Line No. | Line |
---|---|---|---|
2 | pj | 1 | /* |
2 | * Copyright (c) 1997-1999 Massachusetts Institute of Technology |
||
3 | * |
||
4 | * This program is free software; you can redistribute it and/or modify |
||
5 | * it under the terms of the GNU General Public License as published by |
||
6 | * the Free Software Foundation; either version 2 of the License, or |
||
7 | * (at your option) any later version. |
||
8 | * |
||
9 | * This program is distributed in the hope that it will be useful, |
||
10 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
||
11 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
||
12 | * GNU General Public License for more details. |
||
13 | * |
||
14 | * You should have received a copy of the GNU General Public License |
||
15 | * along with this program; if not, write to the Free Software |
||
16 | * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
||
17 | * |
||
18 | */ |
||
19 | |||
20 | /* This file was automatically generated --- DO NOT EDIT */ |
||
21 | /* Generated on Tue May 18 13:56:10 EDT 1999 */ |
||
22 | |||
23 | #include <ports/fftw-int.h> |
||
24 | #include <ports/fftw.h> |
||
25 | |||
26 | /* Generated by: ./genfft -magic-alignment-check -magic-twiddle-load-all -magic-variables 4 -magic-loopi -hc2hc-backward 32 */ |
||
27 | |||
28 | /* |
||
29 | * This function contains 764 FP additions, 346 FP multiplications, |
||
30 | * (or, 618 additions, 200 multiplications, 146 fused multiply/add), |
||
31 | * 93 stack variables, and 256 memory accesses |
||
32 | */ |
||
33 | static const fftw_real K1_662939224 = FFTW_KONST(+1.662939224605090474157576755235811513477121624); |
||
34 | static const fftw_real K1_111140466 = FFTW_KONST(+1.111140466039204449485661627897065748749874382); |
||
35 | static const fftw_real K390180644 = FFTW_KONST(+0.390180644032256535696569736954044481855383236); |
||
36 | static const fftw_real K1_961570560 = FFTW_KONST(+1.961570560806460898252364472268478073947867462); |
||
37 | static const fftw_real K1_913880671 = FFTW_KONST(+1.913880671464417729871595773960539938965698411); |
||
38 | static const fftw_real K580569354 = FFTW_KONST(+0.580569354508924735272384751634790549382952557); |
||
39 | static const fftw_real K942793473 = FFTW_KONST(+0.942793473651995297112775251810508755314920638); |
||
40 | static const fftw_real K1_763842528 = FFTW_KONST(+1.763842528696710059425513727320776699016885241); |
||
41 | static const fftw_real K1_546020906 = FFTW_KONST(+1.546020906725473921621813219516939601942082586); |
||
42 | static const fftw_real K1_268786568 = FFTW_KONST(+1.268786568327290996430343226450986741351374190); |
||
43 | static const fftw_real K196034280 = FFTW_KONST(+0.196034280659121203988391127777283691722273346); |
||
44 | static const fftw_real K1_990369453 = FFTW_KONST(+1.990369453344393772489673906218959843150949737); |
||
45 | static const fftw_real K382683432 = FFTW_KONST(+0.382683432365089771728459984030398866761344562); |
||
46 | static const fftw_real K923879532 = FFTW_KONST(+0.923879532511286756128183189396788286822416626); |
||
47 | static const fftw_real K707106781 = FFTW_KONST(+0.707106781186547524400844362104849039284835938); |
||
48 | static const fftw_real K765366864 = FFTW_KONST(+0.765366864730179543456919968060797733522689125); |
||
49 | static const fftw_real K1_847759065 = FFTW_KONST(+1.847759065022573512256366378793576573644833252); |
||
50 | static const fftw_real K555570233 = FFTW_KONST(+0.555570233019602224742830813948532874374937191); |
||
51 | static const fftw_real K831469612 = FFTW_KONST(+0.831469612302545237078788377617905756738560812); |
||
52 | static const fftw_real K195090322 = FFTW_KONST(+0.195090322016128267848284868477022240927691618); |
||
53 | static const fftw_real K980785280 = FFTW_KONST(+0.980785280403230449126182236134239036973933731); |
||
54 | static const fftw_real K1_414213562 = FFTW_KONST(+1.414213562373095048801688724209698078569671875); |
||
55 | static const fftw_real K2_000000000 = FFTW_KONST(+2.000000000000000000000000000000000000000000000); |
||
56 | |||
57 | /* |
||
58 | * Generator IDs: |
||
59 | * $Id: fhb_32.c,v 1.1.1.1 2002-03-29 14:12:57 pj Exp $ |
||
60 | * $Id: fhb_32.c,v 1.1.1.1 2002-03-29 14:12:57 pj Exp $ |
||
61 | * $Id: fhb_32.c,v 1.1.1.1 2002-03-29 14:12:57 pj Exp $ |
||
62 | */ |
||
63 | |||
64 | void fftw_hc2hc_backward_32(fftw_real *A, const fftw_complex *W, int iostride, int m, int dist) |
||
65 | { |
||
66 | int i; |
||
67 | fftw_real *X; |
||
68 | fftw_real *Y; |
||
69 | X = A; |
||
70 | Y = A + (32 * iostride); |
||
71 | { |
||
72 | fftw_real tmp679; |
||
73 | fftw_real tmp804; |
||
74 | fftw_real tmp766; |
||
75 | fftw_real tmp707; |
||
76 | fftw_real tmp702; |
||
77 | fftw_real tmp728; |
||
78 | fftw_real tmp726; |
||
79 | fftw_real tmp753; |
||
80 | fftw_real tmp815; |
||
81 | fftw_real tmp819; |
||
82 | fftw_real tmp789; |
||
83 | fftw_real tmp793; |
||
84 | fftw_real tmp676; |
||
85 | fftw_real tmp704; |
||
86 | fftw_real tmp763; |
||
87 | fftw_real tmp803; |
||
88 | fftw_real tmp687; |
||
89 | fftw_real tmp709; |
||
90 | fftw_real tmp716; |
||
91 | fftw_real tmp749; |
||
92 | fftw_real tmp770; |
||
93 | fftw_real tmp806; |
||
94 | fftw_real tmp773; |
||
95 | fftw_real tmp807; |
||
96 | fftw_real tmp695; |
||
97 | fftw_real tmp719; |
||
98 | fftw_real tmp735; |
||
99 | fftw_real tmp752; |
||
100 | fftw_real tmp812; |
||
101 | fftw_real tmp818; |
||
102 | fftw_real tmp782; |
||
103 | fftw_real tmp792; |
||
104 | ASSERT_ALIGNED_DOUBLE(); |
||
105 | { |
||
106 | fftw_real tmp677; |
||
107 | fftw_real tmp678; |
||
108 | fftw_real tmp764; |
||
109 | fftw_real tmp705; |
||
110 | fftw_real tmp706; |
||
111 | fftw_real tmp765; |
||
112 | ASSERT_ALIGNED_DOUBLE(); |
||
113 | tmp677 = X[4 * iostride]; |
||
114 | tmp678 = X[12 * iostride]; |
||
115 | tmp764 = tmp677 - tmp678; |
||
116 | tmp705 = Y[-4 * iostride]; |
||
117 | tmp706 = Y[-12 * iostride]; |
||
118 | tmp765 = tmp706 + tmp705; |
||
119 | tmp679 = K2_000000000 * (tmp677 + tmp678); |
||
120 | tmp804 = K1_414213562 * (tmp764 + tmp765); |
||
121 | tmp766 = K1_414213562 * (tmp764 - tmp765); |
||
122 | tmp707 = K2_000000000 * (tmp705 - tmp706); |
||
123 | } |
||
124 | { |
||
125 | fftw_real tmp698; |
||
126 | fftw_real tmp783; |
||
127 | fftw_real tmp725; |
||
128 | fftw_real tmp787; |
||
129 | fftw_real tmp701; |
||
130 | fftw_real tmp786; |
||
131 | fftw_real tmp722; |
||
132 | fftw_real tmp784; |
||
133 | ASSERT_ALIGNED_DOUBLE(); |
||
134 | { |
||
135 | fftw_real tmp696; |
||
136 | fftw_real tmp697; |
||
137 | fftw_real tmp723; |
||
138 | fftw_real tmp724; |
||
139 | ASSERT_ALIGNED_DOUBLE(); |
||
140 | tmp696 = X[3 * iostride]; |
||
141 | tmp697 = X[13 * iostride]; |
||
142 | tmp698 = tmp696 + tmp697; |
||
143 | tmp783 = tmp696 - tmp697; |
||
144 | tmp723 = Y[-3 * iostride]; |
||
145 | tmp724 = Y[-13 * iostride]; |
||
146 | tmp725 = tmp723 - tmp724; |
||
147 | tmp787 = tmp723 + tmp724; |
||
148 | } |
||
149 | { |
||
150 | fftw_real tmp699; |
||
151 | fftw_real tmp700; |
||
152 | fftw_real tmp720; |
||
153 | fftw_real tmp721; |
||
154 | ASSERT_ALIGNED_DOUBLE(); |
||
155 | tmp699 = X[5 * iostride]; |
||
156 | tmp700 = X[11 * iostride]; |
||
157 | tmp701 = tmp699 + tmp700; |
||
158 | tmp786 = tmp700 - tmp699; |
||
159 | tmp720 = Y[-5 * iostride]; |
||
160 | tmp721 = Y[-11 * iostride]; |
||
161 | tmp722 = tmp720 - tmp721; |
||
162 | tmp784 = tmp721 + tmp720; |
||
163 | } |
||
164 | tmp702 = tmp698 + tmp701; |
||
165 | tmp728 = tmp701 - tmp698; |
||
166 | tmp726 = tmp722 + tmp725; |
||
167 | tmp753 = tmp725 - tmp722; |
||
168 | { |
||
169 | fftw_real tmp813; |
||
170 | fftw_real tmp814; |
||
171 | fftw_real tmp785; |
||
172 | fftw_real tmp788; |
||
173 | ASSERT_ALIGNED_DOUBLE(); |
||
174 | tmp813 = tmp783 + tmp784; |
||
175 | tmp814 = tmp787 - tmp786; |
||
176 | tmp815 = (K980785280 * tmp813) - (K195090322 * tmp814); |
||
177 | tmp819 = (K195090322 * tmp813) + (K980785280 * tmp814); |
||
178 | tmp785 = tmp783 - tmp784; |
||
179 | tmp788 = tmp786 + tmp787; |
||
180 | tmp789 = (K831469612 * tmp785) - (K555570233 * tmp788); |
||
181 | tmp793 = (K555570233 * tmp785) + (K831469612 * tmp788); |
||
182 | } |
||
183 | } |
||
184 | { |
||
185 | fftw_real tmp675; |
||
186 | fftw_real tmp762; |
||
187 | fftw_real tmp673; |
||
188 | fftw_real tmp760; |
||
189 | ASSERT_ALIGNED_DOUBLE(); |
||
190 | { |
||
191 | fftw_real tmp674; |
||
192 | fftw_real tmp761; |
||
193 | fftw_real tmp671; |
||
194 | fftw_real tmp672; |
||
195 | ASSERT_ALIGNED_DOUBLE(); |
||
196 | tmp674 = X[8 * iostride]; |
||
197 | tmp675 = K2_000000000 * tmp674; |
||
198 | tmp761 = Y[-8 * iostride]; |
||
199 | tmp762 = K2_000000000 * tmp761; |
||
200 | tmp671 = X[0]; |
||
201 | tmp672 = X[16 * iostride]; |
||
202 | tmp673 = tmp671 + tmp672; |
||
203 | tmp760 = tmp671 - tmp672; |
||
204 | } |
||
205 | tmp676 = tmp673 + tmp675; |
||
206 | tmp704 = tmp673 - tmp675; |
||
207 | tmp763 = tmp760 - tmp762; |
||
208 | tmp803 = tmp760 + tmp762; |
||
209 | } |
||
210 | { |
||
211 | fftw_real tmp683; |
||
212 | fftw_real tmp768; |
||
213 | fftw_real tmp715; |
||
214 | fftw_real tmp772; |
||
215 | fftw_real tmp686; |
||
216 | fftw_real tmp771; |
||
217 | fftw_real tmp712; |
||
218 | fftw_real tmp769; |
||
219 | ASSERT_ALIGNED_DOUBLE(); |
||
220 | { |
||
221 | fftw_real tmp681; |
||
222 | fftw_real tmp682; |
||
223 | fftw_real tmp713; |
||
224 | fftw_real tmp714; |
||
225 | ASSERT_ALIGNED_DOUBLE(); |
||
226 | tmp681 = X[2 * iostride]; |
||
227 | tmp682 = X[14 * iostride]; |
||
228 | tmp683 = tmp681 + tmp682; |
||
229 | tmp768 = tmp681 - tmp682; |
||
230 | tmp713 = Y[-2 * iostride]; |
||
231 | tmp714 = Y[-14 * iostride]; |
||
232 | tmp715 = tmp713 - tmp714; |
||
233 | tmp772 = tmp713 + tmp714; |
||
234 | } |
||
235 | { |
||
236 | fftw_real tmp684; |
||
237 | fftw_real tmp685; |
||
238 | fftw_real tmp710; |
||
239 | fftw_real tmp711; |
||
240 | ASSERT_ALIGNED_DOUBLE(); |
||
241 | tmp684 = X[6 * iostride]; |
||
242 | tmp685 = X[10 * iostride]; |
||
243 | tmp686 = tmp684 + tmp685; |
||
244 | tmp771 = tmp685 - tmp684; |
||
245 | tmp710 = Y[-6 * iostride]; |
||
246 | tmp711 = Y[-10 * iostride]; |
||
247 | tmp712 = tmp710 - tmp711; |
||
248 | tmp769 = tmp711 + tmp710; |
||
249 | } |
||
250 | tmp687 = K2_000000000 * (tmp683 + tmp686); |
||
251 | tmp709 = tmp683 - tmp686; |
||
252 | tmp716 = tmp712 + tmp715; |
||
253 | tmp749 = K2_000000000 * (tmp715 - tmp712); |
||
254 | tmp770 = tmp768 - tmp769; |
||
255 | tmp806 = tmp768 + tmp769; |
||
256 | tmp773 = tmp771 + tmp772; |
||
257 | tmp807 = tmp772 - tmp771; |
||
258 | } |
||
259 | { |
||
260 | fftw_real tmp691; |
||
261 | fftw_real tmp776; |
||
262 | fftw_real tmp734; |
||
263 | fftw_real tmp780; |
||
264 | fftw_real tmp694; |
||
265 | fftw_real tmp779; |
||
266 | fftw_real tmp731; |
||
267 | fftw_real tmp777; |
||
268 | ASSERT_ALIGNED_DOUBLE(); |
||
269 | { |
||
270 | fftw_real tmp689; |
||
271 | fftw_real tmp690; |
||
272 | fftw_real tmp732; |
||
273 | fftw_real tmp733; |
||
274 | ASSERT_ALIGNED_DOUBLE(); |
||
275 | tmp689 = X[iostride]; |
||
276 | tmp690 = X[15 * iostride]; |
||
277 | tmp691 = tmp689 + tmp690; |
||
278 | tmp776 = tmp689 - tmp690; |
||
279 | tmp732 = Y[-iostride]; |
||
280 | tmp733 = Y[-15 * iostride]; |
||
281 | tmp734 = tmp732 - tmp733; |
||
282 | tmp780 = tmp732 + tmp733; |
||
283 | } |
||
284 | { |
||
285 | fftw_real tmp692; |
||
286 | fftw_real tmp693; |
||
287 | fftw_real tmp729; |
||
288 | fftw_real tmp730; |
||
289 | ASSERT_ALIGNED_DOUBLE(); |
||
290 | tmp692 = X[7 * iostride]; |
||
291 | tmp693 = X[9 * iostride]; |
||
292 | tmp694 = tmp692 + tmp693; |
||
293 | tmp779 = tmp693 - tmp692; |
||
294 | tmp729 = Y[-7 * iostride]; |
||
295 | tmp730 = Y[-9 * iostride]; |
||
296 | tmp731 = tmp729 - tmp730; |
||
297 | tmp777 = tmp730 + tmp729; |
||
298 | } |
||
299 | tmp695 = tmp691 + tmp694; |
||
300 | tmp719 = tmp691 - tmp694; |
||
301 | tmp735 = tmp731 + tmp734; |
||
302 | tmp752 = tmp734 - tmp731; |
||
303 | { |
||
304 | fftw_real tmp810; |
||
305 | fftw_real tmp811; |
||
306 | fftw_real tmp778; |
||
307 | fftw_real tmp781; |
||
308 | ASSERT_ALIGNED_DOUBLE(); |
||
309 | tmp810 = tmp776 + tmp777; |
||
310 | tmp811 = tmp780 - tmp779; |
||
311 | tmp812 = (K555570233 * tmp810) + (K831469612 * tmp811); |
||
312 | tmp818 = (K831469612 * tmp810) - (K555570233 * tmp811); |
||
313 | tmp778 = tmp776 - tmp777; |
||
314 | tmp781 = tmp779 + tmp780; |
||
315 | tmp782 = (K980785280 * tmp778) - (K195090322 * tmp781); |
||
316 | tmp792 = (K195090322 * tmp778) + (K980785280 * tmp781); |
||
317 | } |
||
318 | } |
||
319 | { |
||
320 | fftw_real tmp703; |
||
321 | fftw_real tmp759; |
||
322 | fftw_real tmp688; |
||
323 | fftw_real tmp758; |
||
324 | fftw_real tmp680; |
||
325 | ASSERT_ALIGNED_DOUBLE(); |
||
326 | tmp703 = K2_000000000 * (tmp695 + tmp702); |
||
327 | tmp759 = K2_000000000 * (tmp752 - tmp753); |
||
328 | tmp680 = tmp676 + tmp679; |
||
329 | tmp688 = tmp680 + tmp687; |
||
330 | tmp758 = tmp680 - tmp687; |
||
331 | X[16 * iostride] = tmp688 - tmp703; |
||
332 | X[0] = tmp688 + tmp703; |
||
333 | X[24 * iostride] = tmp758 + tmp759; |
||
334 | X[8 * iostride] = tmp758 - tmp759; |
||
335 | } |
||
336 | { |
||
337 | fftw_real tmp750; |
||
338 | fftw_real tmp756; |
||
339 | fftw_real tmp755; |
||
340 | fftw_real tmp757; |
||
341 | fftw_real tmp748; |
||
342 | fftw_real tmp751; |
||
343 | fftw_real tmp754; |
||
344 | ASSERT_ALIGNED_DOUBLE(); |
||
345 | tmp748 = tmp676 - tmp679; |
||
346 | tmp750 = tmp748 - tmp749; |
||
347 | tmp756 = tmp748 + tmp749; |
||
348 | tmp751 = tmp695 - tmp702; |
||
349 | tmp754 = tmp752 + tmp753; |
||
350 | tmp755 = K1_414213562 * (tmp751 - tmp754); |
||
351 | tmp757 = K1_414213562 * (tmp751 + tmp754); |
||
352 | X[20 * iostride] = tmp750 - tmp755; |
||
353 | X[4 * iostride] = tmp750 + tmp755; |
||
354 | X[12 * iostride] = tmp756 - tmp757; |
||
355 | X[28 * iostride] = tmp756 + tmp757; |
||
356 | } |
||
357 | { |
||
358 | fftw_real tmp718; |
||
359 | fftw_real tmp738; |
||
360 | fftw_real tmp737; |
||
361 | fftw_real tmp739; |
||
362 | ASSERT_ALIGNED_DOUBLE(); |
||
363 | { |
||
364 | fftw_real tmp708; |
||
365 | fftw_real tmp717; |
||
366 | fftw_real tmp727; |
||
367 | fftw_real tmp736; |
||
368 | ASSERT_ALIGNED_DOUBLE(); |
||
369 | tmp708 = tmp704 - tmp707; |
||
370 | tmp717 = K1_414213562 * (tmp709 - tmp716); |
||
371 | tmp718 = tmp708 + tmp717; |
||
372 | tmp738 = tmp708 - tmp717; |
||
373 | tmp727 = tmp719 - tmp726; |
||
374 | tmp736 = tmp728 + tmp735; |
||
375 | tmp737 = (K1_847759065 * tmp727) - (K765366864 * tmp736); |
||
376 | tmp739 = (K1_847759065 * tmp736) + (K765366864 * tmp727); |
||
377 | } |
||
378 | X[18 * iostride] = tmp718 - tmp737; |
||
379 | X[2 * iostride] = tmp718 + tmp737; |
||
380 | X[10 * iostride] = tmp738 - tmp739; |
||
381 | X[26 * iostride] = tmp738 + tmp739; |
||
382 | } |
||
383 | { |
||
384 | fftw_real tmp742; |
||
385 | fftw_real tmp746; |
||
386 | fftw_real tmp745; |
||
387 | fftw_real tmp747; |
||
388 | ASSERT_ALIGNED_DOUBLE(); |
||
389 | { |
||
390 | fftw_real tmp740; |
||
391 | fftw_real tmp741; |
||
392 | fftw_real tmp743; |
||
393 | fftw_real tmp744; |
||
394 | ASSERT_ALIGNED_DOUBLE(); |
||
395 | tmp740 = tmp704 + tmp707; |
||
396 | tmp741 = K1_414213562 * (tmp709 + tmp716); |
||
397 | tmp742 = tmp740 - tmp741; |
||
398 | tmp746 = tmp740 + tmp741; |
||
399 | tmp743 = tmp719 + tmp726; |
||
400 | tmp744 = tmp735 - tmp728; |
||
401 | tmp745 = (K765366864 * tmp743) - (K1_847759065 * tmp744); |
||
402 | tmp747 = (K765366864 * tmp744) + (K1_847759065 * tmp743); |
||
403 | } |
||
404 | X[22 * iostride] = tmp742 - tmp745; |
||
405 | X[6 * iostride] = tmp742 + tmp745; |
||
406 | X[14 * iostride] = tmp746 - tmp747; |
||
407 | X[30 * iostride] = tmp746 + tmp747; |
||
408 | } |
||
409 | { |
||
410 | fftw_real tmp790; |
||
411 | fftw_real tmp794; |
||
412 | fftw_real tmp775; |
||
413 | fftw_real tmp791; |
||
414 | fftw_real tmp767; |
||
415 | fftw_real tmp774; |
||
416 | ASSERT_ALIGNED_DOUBLE(); |
||
417 | tmp790 = K2_000000000 * (tmp782 + tmp789); |
||
418 | tmp794 = K2_000000000 * (tmp792 - tmp793); |
||
419 | tmp767 = tmp763 + tmp766; |
||
420 | tmp774 = (K1_847759065 * tmp770) - (K765366864 * tmp773); |
||
421 | tmp775 = tmp767 + tmp774; |
||
422 | tmp791 = tmp767 - tmp774; |
||
423 | X[17 * iostride] = tmp775 - tmp790; |
||
424 | X[iostride] = tmp775 + tmp790; |
||
425 | X[9 * iostride] = tmp791 - tmp794; |
||
426 | X[25 * iostride] = tmp791 + tmp794; |
||
427 | } |
||
428 | { |
||
429 | fftw_real tmp797; |
||
430 | fftw_real tmp801; |
||
431 | fftw_real tmp800; |
||
432 | fftw_real tmp802; |
||
433 | ASSERT_ALIGNED_DOUBLE(); |
||
434 | { |
||
435 | fftw_real tmp795; |
||
436 | fftw_real tmp796; |
||
437 | fftw_real tmp798; |
||
438 | fftw_real tmp799; |
||
439 | ASSERT_ALIGNED_DOUBLE(); |
||
440 | tmp795 = tmp763 - tmp766; |
||
441 | tmp796 = (K765366864 * tmp770) + (K1_847759065 * tmp773); |
||
442 | tmp797 = tmp795 - tmp796; |
||
443 | tmp801 = tmp795 + tmp796; |
||
444 | tmp798 = tmp782 - tmp789; |
||
445 | tmp799 = tmp792 + tmp793; |
||
446 | tmp800 = K1_414213562 * (tmp798 - tmp799); |
||
447 | tmp802 = K1_414213562 * (tmp798 + tmp799); |
||
448 | } |
||
449 | X[21 * iostride] = tmp797 - tmp800; |
||
450 | X[5 * iostride] = tmp797 + tmp800; |
||
451 | X[13 * iostride] = tmp801 - tmp802; |
||
452 | X[29 * iostride] = tmp801 + tmp802; |
||
453 | } |
||
454 | { |
||
455 | fftw_real tmp816; |
||
456 | fftw_real tmp820; |
||
457 | fftw_real tmp809; |
||
458 | fftw_real tmp817; |
||
459 | fftw_real tmp805; |
||
460 | fftw_real tmp808; |
||
461 | ASSERT_ALIGNED_DOUBLE(); |
||
462 | tmp816 = K2_000000000 * (tmp812 - tmp815); |
||
463 | tmp820 = K2_000000000 * (tmp818 - tmp819); |
||
464 | tmp805 = tmp803 - tmp804; |
||
465 | tmp808 = (K765366864 * tmp806) - (K1_847759065 * tmp807); |
||
466 | tmp809 = tmp805 - tmp808; |
||
467 | tmp817 = tmp805 + tmp808; |
||
468 | X[11 * iostride] = tmp809 - tmp816; |
||
469 | X[27 * iostride] = tmp809 + tmp816; |
||
470 | X[19 * iostride] = tmp817 - tmp820; |
||
471 | X[3 * iostride] = tmp817 + tmp820; |
||
472 | } |
||
473 | { |
||
474 | fftw_real tmp823; |
||
475 | fftw_real tmp827; |
||
476 | fftw_real tmp826; |
||
477 | fftw_real tmp828; |
||
478 | ASSERT_ALIGNED_DOUBLE(); |
||
479 | { |
||
480 | fftw_real tmp821; |
||
481 | fftw_real tmp822; |
||
482 | fftw_real tmp824; |
||
483 | fftw_real tmp825; |
||
484 | ASSERT_ALIGNED_DOUBLE(); |
||
485 | tmp821 = tmp803 + tmp804; |
||
486 | tmp822 = (K1_847759065 * tmp806) + (K765366864 * tmp807); |
||
487 | tmp823 = tmp821 - tmp822; |
||
488 | tmp827 = tmp821 + tmp822; |
||
489 | tmp824 = tmp818 + tmp819; |
||
490 | tmp825 = tmp812 + tmp815; |
||
491 | tmp826 = K1_414213562 * (tmp824 - tmp825); |
||
492 | tmp828 = K1_414213562 * (tmp825 + tmp824); |
||
493 | } |
||
494 | X[23 * iostride] = tmp823 - tmp826; |
||
495 | X[7 * iostride] = tmp823 + tmp826; |
||
496 | X[15 * iostride] = tmp827 - tmp828; |
||
497 | X[31 * iostride] = tmp827 + tmp828; |
||
498 | } |
||
499 | } |
||
500 | X = X + dist; |
||
501 | Y = Y - dist; |
||
502 | for (i = 2; i < m; i = i + 2, X = X + dist, Y = Y - dist, W = W + 31) { |
||
503 | fftw_real tmp446; |
||
504 | fftw_real tmp580; |
||
505 | fftw_real tmp189; |
||
506 | fftw_real tmp238; |
||
507 | fftw_real tmp382; |
||
508 | fftw_real tmp420; |
||
509 | fftw_real tmp307; |
||
510 | fftw_real tmp332; |
||
511 | fftw_real tmp514; |
||
512 | fftw_real tmp608; |
||
513 | fftw_real tmp354; |
||
514 | fftw_real tmp408; |
||
515 | fftw_real tmp453; |
||
516 | fftw_real tmp609; |
||
517 | fftw_real tmp517; |
||
518 | fftw_real tmp581; |
||
519 | fftw_real tmp235; |
||
520 | fftw_real tmp272; |
||
521 | fftw_real tmp365; |
||
522 | fftw_real tmp411; |
||
523 | fftw_real tmp287; |
||
524 | fftw_real tmp336; |
||
525 | fftw_real tmp368; |
||
526 | fftw_real tmp412; |
||
527 | fftw_real tmp500; |
||
528 | fftw_real tmp550; |
||
529 | fftw_real tmp593; |
||
530 | fftw_real tmp643; |
||
531 | fftw_real tmp507; |
||
532 | fftw_real tmp551; |
||
533 | fftw_real tmp596; |
||
534 | fftw_real tmp642; |
||
535 | fftw_real tmp204; |
||
536 | fftw_real tmp292; |
||
537 | fftw_real tmp357; |
||
538 | fftw_real tmp384; |
||
539 | fftw_real tmp253; |
||
540 | fftw_real tmp333; |
||
541 | fftw_real tmp360; |
||
542 | fftw_real tmp383; |
||
543 | fftw_real tmp461; |
||
544 | fftw_real tmp520; |
||
545 | fftw_real tmp588; |
||
546 | fftw_real tmp612; |
||
547 | fftw_real tmp468; |
||
548 | fftw_real tmp519; |
||
549 | fftw_real tmp585; |
||
550 | fftw_real tmp611; |
||
551 | fftw_real tmp220; |
||
552 | fftw_real tmp255; |
||
553 | fftw_real tmp372; |
||
554 | fftw_real tmp414; |
||
555 | fftw_real tmp270; |
||
556 | fftw_real tmp335; |
||
557 | fftw_real tmp375; |
||
558 | fftw_real tmp415; |
||
559 | fftw_real tmp481; |
||
560 | fftw_real tmp547; |
||
561 | fftw_real tmp600; |
||
562 | fftw_real tmp640; |
||
563 | fftw_real tmp488; |
||
564 | fftw_real tmp548; |
||
565 | fftw_real tmp603; |
||
566 | fftw_real tmp639; |
||
567 | ASSERT_ALIGNED_DOUBLE(); |
||
568 | { |
||
569 | fftw_real tmp177; |
||
570 | fftw_real tmp444; |
||
571 | fftw_real tmp295; |
||
572 | fftw_real tmp513; |
||
573 | fftw_real tmp180; |
||
574 | fftw_real tmp512; |
||
575 | fftw_real tmp298; |
||
576 | fftw_real tmp445; |
||
577 | fftw_real tmp184; |
||
578 | fftw_real tmp447; |
||
579 | fftw_real tmp302; |
||
580 | fftw_real tmp448; |
||
581 | fftw_real tmp187; |
||
582 | fftw_real tmp450; |
||
583 | fftw_real tmp305; |
||
584 | fftw_real tmp451; |
||
585 | ASSERT_ALIGNED_DOUBLE(); |
||
586 | { |
||
587 | fftw_real tmp175; |
||
588 | fftw_real tmp176; |
||
589 | fftw_real tmp293; |
||
590 | fftw_real tmp294; |
||
591 | ASSERT_ALIGNED_DOUBLE(); |
||
592 | tmp175 = X[0]; |
||
593 | tmp176 = Y[-16 * iostride]; |
||
594 | tmp177 = tmp175 + tmp176; |
||
595 | tmp444 = tmp175 - tmp176; |
||
596 | tmp293 = Y[0]; |
||
597 | tmp294 = X[16 * iostride]; |
||
598 | tmp295 = tmp293 - tmp294; |
||
599 | tmp513 = tmp293 + tmp294; |
||
600 | } |
||
601 | { |
||
602 | fftw_real tmp178; |
||
603 | fftw_real tmp179; |
||
604 | fftw_real tmp296; |
||
605 | fftw_real tmp297; |
||
606 | ASSERT_ALIGNED_DOUBLE(); |
||
607 | tmp178 = X[8 * iostride]; |
||
608 | tmp179 = Y[-24 * iostride]; |
||
609 | tmp180 = tmp178 + tmp179; |
||
610 | tmp512 = tmp178 - tmp179; |
||
611 | tmp296 = Y[-8 * iostride]; |
||
612 | tmp297 = X[24 * iostride]; |
||
613 | tmp298 = tmp296 - tmp297; |
||
614 | tmp445 = tmp296 + tmp297; |
||
615 | } |
||
616 | { |
||
617 | fftw_real tmp182; |
||
618 | fftw_real tmp183; |
||
619 | fftw_real tmp300; |
||
620 | fftw_real tmp301; |
||
621 | ASSERT_ALIGNED_DOUBLE(); |
||
622 | tmp182 = X[4 * iostride]; |
||
623 | tmp183 = Y[-20 * iostride]; |
||
624 | tmp184 = tmp182 + tmp183; |
||
625 | tmp447 = tmp182 - tmp183; |
||
626 | tmp300 = Y[-4 * iostride]; |
||
627 | tmp301 = X[20 * iostride]; |
||
628 | tmp302 = tmp300 - tmp301; |
||
629 | tmp448 = tmp300 + tmp301; |
||
630 | } |
||
631 | { |
||
632 | fftw_real tmp185; |
||
633 | fftw_real tmp186; |
||
634 | fftw_real tmp303; |
||
635 | fftw_real tmp304; |
||
636 | ASSERT_ALIGNED_DOUBLE(); |
||
637 | tmp185 = Y[-28 * iostride]; |
||
638 | tmp186 = X[12 * iostride]; |
||
639 | tmp187 = tmp185 + tmp186; |
||
640 | tmp450 = tmp185 - tmp186; |
||
641 | tmp303 = Y[-12 * iostride]; |
||
642 | tmp304 = X[28 * iostride]; |
||
643 | tmp305 = tmp303 - tmp304; |
||
644 | tmp451 = tmp303 + tmp304; |
||
645 | } |
||
646 | { |
||
647 | fftw_real tmp181; |
||
648 | fftw_real tmp188; |
||
649 | fftw_real tmp352; |
||
650 | fftw_real tmp353; |
||
651 | ASSERT_ALIGNED_DOUBLE(); |
||
652 | tmp446 = tmp444 - tmp445; |
||
653 | tmp580 = tmp444 + tmp445; |
||
654 | tmp181 = tmp177 + tmp180; |
||
655 | tmp188 = tmp184 + tmp187; |
||
656 | tmp189 = tmp181 + tmp188; |
||
657 | tmp238 = tmp181 - tmp188; |
||
658 | { |
||
659 | fftw_real tmp380; |
||
660 | fftw_real tmp381; |
||
661 | fftw_real tmp299; |
||
662 | fftw_real tmp306; |
||
663 | ASSERT_ALIGNED_DOUBLE(); |
||
664 | tmp380 = tmp295 - tmp298; |
||
665 | tmp381 = tmp184 - tmp187; |
||
666 | tmp382 = tmp380 - tmp381; |
||
667 | tmp420 = tmp381 + tmp380; |
||
668 | tmp299 = tmp295 + tmp298; |
||
669 | tmp306 = tmp302 + tmp305; |
||
670 | tmp307 = tmp299 - tmp306; |
||
671 | tmp332 = tmp299 + tmp306; |
||
672 | } |
||
673 | tmp514 = tmp512 + tmp513; |
||
674 | tmp608 = tmp513 - tmp512; |
||
675 | tmp352 = tmp177 - tmp180; |
||
676 | tmp353 = tmp305 - tmp302; |
||
677 | tmp354 = tmp352 - tmp353; |
||
678 | tmp408 = tmp352 + tmp353; |
||
679 | { |
||
680 | fftw_real tmp449; |
||
681 | fftw_real tmp452; |
||
682 | fftw_real tmp515; |
||
683 | fftw_real tmp516; |
||
684 | ASSERT_ALIGNED_DOUBLE(); |
||
685 | tmp449 = tmp447 - tmp448; |
||
686 | tmp452 = tmp450 - tmp451; |
||
687 | tmp453 = K707106781 * (tmp449 + tmp452); |
||
688 | tmp609 = K707106781 * (tmp449 - tmp452); |
||
689 | tmp515 = tmp447 + tmp448; |
||
690 | tmp516 = tmp450 + tmp451; |
||
691 | tmp517 = K707106781 * (tmp515 - tmp516); |
||
692 | tmp581 = K707106781 * (tmp515 + tmp516); |
||
693 | } |
||
694 | } |
||
695 | } |
||
696 | { |
||
697 | fftw_real tmp223; |
||
698 | fftw_real tmp490; |
||
699 | fftw_real tmp275; |
||
700 | fftw_real tmp502; |
||
701 | fftw_real tmp226; |
||
702 | fftw_real tmp501; |
||
703 | fftw_real tmp278; |
||
704 | fftw_real tmp491; |
||
705 | fftw_real tmp233; |
||
706 | fftw_real tmp505; |
||
707 | fftw_real tmp498; |
||
708 | fftw_real tmp285; |
||
709 | fftw_real tmp230; |
||
710 | fftw_real tmp504; |
||
711 | fftw_real tmp495; |
||
712 | fftw_real tmp282; |
||
713 | ASSERT_ALIGNED_DOUBLE(); |
||
714 | { |
||
715 | fftw_real tmp221; |
||
716 | fftw_real tmp222; |
||
717 | fftw_real tmp276; |
||
718 | fftw_real tmp277; |
||
719 | ASSERT_ALIGNED_DOUBLE(); |
||
720 | tmp221 = Y[-31 * iostride]; |
||
721 | tmp222 = X[15 * iostride]; |
||
722 | tmp223 = tmp221 + tmp222; |
||
723 | tmp490 = tmp221 - tmp222; |
||
724 | { |
||
725 | fftw_real tmp273; |
||
726 | fftw_real tmp274; |
||
727 | fftw_real tmp224; |
||
728 | fftw_real tmp225; |
||
729 | ASSERT_ALIGNED_DOUBLE(); |
||
730 | tmp273 = Y[-15 * iostride]; |
||
731 | tmp274 = X[31 * iostride]; |
||
732 | tmp275 = tmp273 - tmp274; |
||
733 | tmp502 = tmp273 + tmp274; |
||
734 | tmp224 = X[7 * iostride]; |
||
735 | tmp225 = Y[-23 * iostride]; |
||
736 | tmp226 = tmp224 + tmp225; |
||
737 | tmp501 = tmp224 - tmp225; |
||
738 | } |
||
739 | tmp276 = Y[-7 * iostride]; |
||
740 | tmp277 = X[23 * iostride]; |
||
741 | tmp278 = tmp276 - tmp277; |
||
742 | tmp491 = tmp276 + tmp277; |
||
743 | { |
||
744 | fftw_real tmp231; |
||
745 | fftw_real tmp232; |
||
746 | fftw_real tmp496; |
||
747 | fftw_real tmp283; |
||
748 | fftw_real tmp284; |
||
749 | fftw_real tmp497; |
||
750 | ASSERT_ALIGNED_DOUBLE(); |
||
751 | tmp231 = Y[-27 * iostride]; |
||
752 | tmp232 = X[11 * iostride]; |
||
753 | tmp496 = tmp231 - tmp232; |
||
754 | tmp283 = Y[-11 * iostride]; |
||
755 | tmp284 = X[27 * iostride]; |
||
756 | tmp497 = tmp283 + tmp284; |
||
757 | tmp233 = tmp231 + tmp232; |
||
758 | tmp505 = tmp496 + tmp497; |
||
759 | tmp498 = tmp496 - tmp497; |
||
760 | tmp285 = tmp283 - tmp284; |
||
761 | } |
||
762 | { |
||
763 | fftw_real tmp228; |
||
764 | fftw_real tmp229; |
||
765 | fftw_real tmp493; |
||
766 | fftw_real tmp280; |
||
767 | fftw_real tmp281; |
||
768 | fftw_real tmp494; |
||
769 | ASSERT_ALIGNED_DOUBLE(); |
||
770 | tmp228 = X[3 * iostride]; |
||
771 | tmp229 = Y[-19 * iostride]; |
||
772 | tmp493 = tmp228 - tmp229; |
||
773 | tmp280 = Y[-3 * iostride]; |
||
774 | tmp281 = X[19 * iostride]; |
||
775 | tmp494 = tmp280 + tmp281; |
||
776 | tmp230 = tmp228 + tmp229; |
||
777 | tmp504 = tmp493 + tmp494; |
||
778 | tmp495 = tmp493 - tmp494; |
||
779 | tmp282 = tmp280 - tmp281; |
||
780 | } |
||
781 | } |
||
782 | { |
||
783 | fftw_real tmp227; |
||
784 | fftw_real tmp234; |
||
785 | fftw_real tmp363; |
||
786 | fftw_real tmp364; |
||
787 | ASSERT_ALIGNED_DOUBLE(); |
||
788 | tmp227 = tmp223 + tmp226; |
||
789 | tmp234 = tmp230 + tmp233; |
||
790 | tmp235 = tmp227 + tmp234; |
||
791 | tmp272 = tmp227 - tmp234; |
||
792 | tmp363 = tmp275 - tmp278; |
||
793 | tmp364 = tmp230 - tmp233; |
||
794 | tmp365 = tmp363 - tmp364; |
||
795 | tmp411 = tmp364 + tmp363; |
||
796 | } |
||
797 | { |
||
798 | fftw_real tmp279; |
||
799 | fftw_real tmp286; |
||
800 | fftw_real tmp366; |
||
801 | fftw_real tmp367; |
||
802 | ASSERT_ALIGNED_DOUBLE(); |
||
803 | tmp279 = tmp275 + tmp278; |
||
804 | tmp286 = tmp282 + tmp285; |
||
805 | tmp287 = tmp279 - tmp286; |
||
806 | tmp336 = tmp279 + tmp286; |
||
807 | tmp366 = tmp223 - tmp226; |
||
808 | tmp367 = tmp285 - tmp282; |
||
809 | tmp368 = tmp366 - tmp367; |
||
810 | tmp412 = tmp366 + tmp367; |
||
811 | } |
||
812 | { |
||
813 | fftw_real tmp492; |
||
814 | fftw_real tmp499; |
||
815 | fftw_real tmp591; |
||
816 | fftw_real tmp592; |
||
817 | ASSERT_ALIGNED_DOUBLE(); |
||
818 | tmp492 = tmp490 - tmp491; |
||
819 | tmp499 = K707106781 * (tmp495 + tmp498); |
||
820 | tmp500 = tmp492 - tmp499; |
||
821 | tmp550 = tmp492 + tmp499; |
||
822 | tmp591 = K707106781 * (tmp495 - tmp498); |
||
823 | tmp592 = tmp501 + tmp502; |
||
824 | tmp593 = tmp591 - tmp592; |
||
825 | tmp643 = tmp592 + tmp591; |
||
826 | } |
||
827 | { |
||
828 | fftw_real tmp503; |
||
829 | fftw_real tmp506; |
||
830 | fftw_real tmp594; |
||
831 | fftw_real tmp595; |
||
832 | ASSERT_ALIGNED_DOUBLE(); |
||
833 | tmp503 = tmp501 - tmp502; |
||
834 | tmp506 = K707106781 * (tmp504 - tmp505); |
||
835 | tmp507 = tmp503 - tmp506; |
||
836 | tmp551 = tmp503 + tmp506; |
||
837 | tmp594 = tmp490 + tmp491; |
||
838 | tmp595 = K707106781 * (tmp504 + tmp505); |
||
839 | tmp596 = tmp594 - tmp595; |
||
840 | tmp642 = tmp594 + tmp595; |
||
841 | } |
||
842 | } |
||
843 | { |
||
844 | fftw_real tmp192; |
||
845 | fftw_real tmp465; |
||
846 | fftw_real tmp248; |
||
847 | fftw_real tmp463; |
||
848 | fftw_real tmp195; |
||
849 | fftw_real tmp462; |
||
850 | fftw_real tmp251; |
||
851 | fftw_real tmp466; |
||
852 | fftw_real tmp199; |
||
853 | fftw_real tmp458; |
||
854 | fftw_real tmp241; |
||
855 | fftw_real tmp456; |
||
856 | fftw_real tmp202; |
||
857 | fftw_real tmp455; |
||
858 | fftw_real tmp244; |
||
859 | fftw_real tmp459; |
||
860 | ASSERT_ALIGNED_DOUBLE(); |
||
861 | { |
||
862 | fftw_real tmp190; |
||
863 | fftw_real tmp191; |
||
864 | fftw_real tmp246; |
||
865 | fftw_real tmp247; |
||
866 | ASSERT_ALIGNED_DOUBLE(); |
||
867 | tmp190 = X[2 * iostride]; |
||
868 | tmp191 = Y[-18 * iostride]; |
||
869 | tmp192 = tmp190 + tmp191; |
||
870 | tmp465 = tmp190 - tmp191; |
||
871 | tmp246 = Y[-2 * iostride]; |
||
872 | tmp247 = X[18 * iostride]; |
||
873 | tmp248 = tmp246 - tmp247; |
||
874 | tmp463 = tmp246 + tmp247; |
||
875 | } |
||
876 | { |
||
877 | fftw_real tmp193; |
||
878 | fftw_real tmp194; |
||
879 | fftw_real tmp249; |
||
880 | fftw_real tmp250; |
||
881 | ASSERT_ALIGNED_DOUBLE(); |
||
882 | tmp193 = X[10 * iostride]; |
||
883 | tmp194 = Y[-26 * iostride]; |
||
884 | tmp195 = tmp193 + tmp194; |
||
885 | tmp462 = tmp193 - tmp194; |
||
886 | tmp249 = Y[-10 * iostride]; |
||
887 | tmp250 = X[26 * iostride]; |
||
888 | tmp251 = tmp249 - tmp250; |
||
889 | tmp466 = tmp249 + tmp250; |
||
890 | } |
||
891 | { |
||
892 | fftw_real tmp197; |
||
893 | fftw_real tmp198; |
||
894 | fftw_real tmp239; |
||
895 | fftw_real tmp240; |
||
896 | ASSERT_ALIGNED_DOUBLE(); |
||
897 | tmp197 = Y[-30 * iostride]; |
||
898 | tmp198 = X[14 * iostride]; |
||
899 | tmp199 = tmp197 + tmp198; |
||
900 | tmp458 = tmp197 - tmp198; |
||
901 | tmp239 = Y[-14 * iostride]; |
||
902 | tmp240 = X[30 * iostride]; |
||
903 | tmp241 = tmp239 - tmp240; |
||
904 | tmp456 = tmp239 + tmp240; |
||
905 | } |
||
906 | { |
||
907 | fftw_real tmp200; |
||
908 | fftw_real tmp201; |
||
909 | fftw_real tmp242; |
||
910 | fftw_real tmp243; |
||
911 | ASSERT_ALIGNED_DOUBLE(); |
||
912 | tmp200 = X[6 * iostride]; |
||
913 | tmp201 = Y[-22 * iostride]; |
||
914 | tmp202 = tmp200 + tmp201; |
||
915 | tmp455 = tmp200 - tmp201; |
||
916 | tmp242 = Y[-6 * iostride]; |
||
917 | tmp243 = X[22 * iostride]; |
||
918 | tmp244 = tmp242 - tmp243; |
||
919 | tmp459 = tmp242 + tmp243; |
||
920 | } |
||
921 | { |
||
922 | fftw_real tmp196; |
||
923 | fftw_real tmp203; |
||
924 | fftw_real tmp355; |
||
925 | fftw_real tmp356; |
||
926 | ASSERT_ALIGNED_DOUBLE(); |
||
927 | tmp196 = tmp192 + tmp195; |
||
928 | tmp203 = tmp199 + tmp202; |
||
929 | tmp204 = tmp196 + tmp203; |
||
930 | tmp292 = tmp196 - tmp203; |
||
931 | tmp355 = tmp241 - tmp244; |
||
932 | tmp356 = tmp199 - tmp202; |
||
933 | tmp357 = tmp355 - tmp356; |
||
934 | tmp384 = tmp356 + tmp355; |
||
935 | } |
||
936 | { |
||
937 | fftw_real tmp245; |
||
938 | fftw_real tmp252; |
||
939 | fftw_real tmp358; |
||
940 | fftw_real tmp359; |
||
941 | ASSERT_ALIGNED_DOUBLE(); |
||
942 | tmp245 = tmp241 + tmp244; |
||
943 | tmp252 = tmp248 + tmp251; |
||
944 | tmp253 = tmp245 - tmp252; |
||
945 | tmp333 = tmp252 + tmp245; |
||
946 | tmp358 = tmp192 - tmp195; |
||
947 | tmp359 = tmp248 - tmp251; |
||
948 | tmp360 = tmp358 + tmp359; |
||
949 | tmp383 = tmp358 - tmp359; |
||
950 | } |
||
951 | { |
||
952 | fftw_real tmp457; |
||
953 | fftw_real tmp460; |
||
954 | fftw_real tmp586; |
||
955 | fftw_real tmp587; |
||
956 | ASSERT_ALIGNED_DOUBLE(); |
||
957 | tmp457 = tmp455 - tmp456; |
||
958 | tmp460 = tmp458 - tmp459; |
||
959 | tmp461 = (K923879532 * tmp457) - (K382683432 * tmp460); |
||
960 | tmp520 = (K382683432 * tmp457) + (K923879532 * tmp460); |
||
961 | tmp586 = tmp458 + tmp459; |
||
962 | tmp587 = tmp455 + tmp456; |
||
963 | tmp588 = (K382683432 * tmp586) - (K923879532 * tmp587); |
||
964 | tmp612 = (K382683432 * tmp587) + (K923879532 * tmp586); |
||
965 | } |
||
966 | { |
||
967 | fftw_real tmp464; |
||
968 | fftw_real tmp467; |
||
969 | fftw_real tmp583; |
||
970 | fftw_real tmp584; |
||
971 | ASSERT_ALIGNED_DOUBLE(); |
||
972 | tmp464 = tmp462 + tmp463; |
||
973 | tmp467 = tmp465 - tmp466; |
||
974 | tmp468 = (K923879532 * tmp464) + (K382683432 * tmp467); |
||
975 | tmp519 = (K923879532 * tmp467) - (K382683432 * tmp464); |
||
976 | tmp583 = tmp465 + tmp466; |
||
977 | tmp584 = tmp463 - tmp462; |
||
978 | tmp585 = (K382683432 * tmp583) - (K923879532 * tmp584); |
||
979 | tmp611 = (K382683432 * tmp584) + (K923879532 * tmp583); |
||
980 | } |
||
981 | } |
||
982 | { |
||
983 | fftw_real tmp208; |
||
984 | fftw_real tmp471; |
||
985 | fftw_real tmp258; |
||
986 | fftw_real tmp483; |
||
987 | fftw_real tmp211; |
||
988 | fftw_real tmp482; |
||
989 | fftw_real tmp261; |
||
990 | fftw_real tmp472; |
||
991 | fftw_real tmp218; |
||
992 | fftw_real tmp486; |
||
993 | fftw_real tmp479; |
||
994 | fftw_real tmp268; |
||
995 | fftw_real tmp215; |
||
996 | fftw_real tmp485; |
||
997 | fftw_real tmp476; |
||
998 | fftw_real tmp265; |
||
999 | ASSERT_ALIGNED_DOUBLE(); |
||
1000 | { |
||
1001 | fftw_real tmp206; |
||
1002 | fftw_real tmp207; |
||
1003 | fftw_real tmp259; |
||
1004 | fftw_real tmp260; |
||
1005 | ASSERT_ALIGNED_DOUBLE(); |
||
1006 | tmp206 = X[iostride]; |
||
1007 | tmp207 = Y[-17 * iostride]; |
||
1008 | tmp208 = tmp206 + tmp207; |
||
1009 | tmp471 = tmp206 - tmp207; |
||
1010 | { |
||
1011 | fftw_real tmp256; |
||
1012 | fftw_real tmp257; |
||
1013 | fftw_real tmp209; |
||
1014 | fftw_real tmp210; |
||
1015 | ASSERT_ALIGNED_DOUBLE(); |
||
1016 | tmp256 = Y[-iostride]; |
||
1017 | tmp257 = X[17 * iostride]; |
||
1018 | tmp258 = tmp256 - tmp257; |
||
1019 | tmp483 = tmp256 + tmp257; |
||
1020 | tmp209 = X[9 * iostride]; |
||
1021 | tmp210 = Y[-25 * iostride]; |
||
1022 | tmp211 = tmp209 + tmp210; |
||
1023 | tmp482 = tmp209 - tmp210; |
||
1024 | } |
||
1025 | tmp259 = Y[-9 * iostride]; |
||
1026 | tmp260 = X[25 * iostride]; |
||
1027 | tmp261 = tmp259 - tmp260; |
||
1028 | tmp472 = tmp259 + tmp260; |
||
1029 | { |
||
1030 | fftw_real tmp216; |
||
1031 | fftw_real tmp217; |
||
1032 | fftw_real tmp477; |
||
1033 | fftw_real tmp266; |
||
1034 | fftw_real tmp267; |
||
1035 | fftw_real tmp478; |
||
1036 | ASSERT_ALIGNED_DOUBLE(); |
||
1037 | tmp216 = Y[-29 * iostride]; |
||
1038 | tmp217 = X[13 * iostride]; |
||
1039 | tmp477 = tmp216 - tmp217; |
||
1040 | tmp266 = Y[-13 * iostride]; |
||
1041 | tmp267 = X[29 * iostride]; |
||
1042 | tmp478 = tmp266 + tmp267; |
||
1043 | tmp218 = tmp216 + tmp217; |
||
1044 | tmp486 = tmp477 + tmp478; |
||
1045 | tmp479 = tmp477 - tmp478; |
||
1046 | tmp268 = tmp266 - tmp267; |
||
1047 | } |
||
1048 | { |
||
1049 | fftw_real tmp213; |
||
1050 | fftw_real tmp214; |
||
1051 | fftw_real tmp474; |
||
1052 | fftw_real tmp263; |
||
1053 | fftw_real tmp264; |
||
1054 | fftw_real tmp475; |
||
1055 | ASSERT_ALIGNED_DOUBLE(); |
||
1056 | tmp213 = X[5 * iostride]; |
||
1057 | tmp214 = Y[-21 * iostride]; |
||
1058 | tmp474 = tmp213 - tmp214; |
||
1059 | tmp263 = Y[-5 * iostride]; |
||
1060 | tmp264 = X[21 * iostride]; |
||
1061 | tmp475 = tmp263 + tmp264; |
||
1062 | tmp215 = tmp213 + tmp214; |
||
1063 | tmp485 = tmp474 + tmp475; |
||
1064 | tmp476 = tmp474 - tmp475; |
||
1065 | tmp265 = tmp263 - tmp264; |
||
1066 | } |
||
1067 | } |
||
1068 | { |
||
1069 | fftw_real tmp212; |
||
1070 | fftw_real tmp219; |
||
1071 | fftw_real tmp370; |
||
1072 | fftw_real tmp371; |
||
1073 | ASSERT_ALIGNED_DOUBLE(); |
||
1074 | tmp212 = tmp208 + tmp211; |
||
1075 | tmp219 = tmp215 + tmp218; |
||
1076 | tmp220 = tmp212 + tmp219; |
||
1077 | tmp255 = tmp212 - tmp219; |
||
1078 | tmp370 = tmp258 - tmp261; |
||
1079 | tmp371 = tmp215 - tmp218; |
||
1080 | tmp372 = tmp370 - tmp371; |
||
1081 | tmp414 = tmp371 + tmp370; |
||
1082 | } |
||
1083 | { |
||
1084 | fftw_real tmp262; |
||
1085 | fftw_real tmp269; |
||
1086 | fftw_real tmp373; |
||
1087 | fftw_real tmp374; |
||
1088 | ASSERT_ALIGNED_DOUBLE(); |
||
1089 | tmp262 = tmp258 + tmp261; |
||
1090 | tmp269 = tmp265 + tmp268; |
||
1091 | tmp270 = tmp262 - tmp269; |
||
1092 | tmp335 = tmp262 + tmp269; |
||
1093 | tmp373 = tmp208 - tmp211; |
||
1094 | tmp374 = tmp268 - tmp265; |
||
1095 | tmp375 = tmp373 - tmp374; |
||
1096 | tmp415 = tmp373 + tmp374; |
||
1097 | } |
||
1098 | { |
||
1099 | fftw_real tmp473; |
||
1100 | fftw_real tmp480; |
||
1101 | fftw_real tmp598; |
||
1102 | fftw_real tmp599; |
||
1103 | ASSERT_ALIGNED_DOUBLE(); |
||
1104 | tmp473 = tmp471 - tmp472; |
||
1105 | tmp480 = K707106781 * (tmp476 + tmp479); |
||
1106 | tmp481 = tmp473 - tmp480; |
||
1107 | tmp547 = tmp473 + tmp480; |
||
1108 | tmp598 = tmp483 - tmp482; |
||
1109 | tmp599 = K707106781 * (tmp476 - tmp479); |
||
1110 | tmp600 = tmp598 + tmp599; |
||
1111 | tmp640 = tmp598 - tmp599; |
||
1112 | } |
||
1113 | { |
||
1114 | fftw_real tmp484; |
||
1115 | fftw_real tmp487; |
||
1116 | fftw_real tmp601; |
||
1117 | fftw_real tmp602; |
||
1118 | ASSERT_ALIGNED_DOUBLE(); |
||
1119 | tmp484 = tmp482 + tmp483; |
||
1120 | tmp487 = K707106781 * (tmp485 - tmp486); |
||
1121 | tmp488 = tmp484 - tmp487; |
||
1122 | tmp548 = tmp484 + tmp487; |
||
1123 | tmp601 = tmp471 + tmp472; |
||
1124 | tmp602 = K707106781 * (tmp485 + tmp486); |
||
1125 | tmp603 = tmp601 - tmp602; |
||
1126 | tmp639 = tmp601 + tmp602; |
||
1127 | } |
||
1128 | } |
||
1129 | { |
||
1130 | fftw_real tmp205; |
||
1131 | fftw_real tmp236; |
||
1132 | fftw_real tmp330; |
||
1133 | fftw_real tmp334; |
||
1134 | fftw_real tmp337; |
||
1135 | fftw_real tmp338; |
||
1136 | fftw_real tmp329; |
||
1137 | fftw_real tmp331; |
||
1138 | ASSERT_ALIGNED_DOUBLE(); |
||
1139 | tmp205 = tmp189 + tmp204; |
||
1140 | tmp236 = tmp220 + tmp235; |
||
1141 | tmp330 = tmp205 - tmp236; |
||
1142 | tmp334 = tmp332 + tmp333; |
||
1143 | tmp337 = tmp335 + tmp336; |
||
1144 | tmp338 = tmp334 - tmp337; |
||
1145 | X[0] = tmp205 + tmp236; |
||
1146 | Y[-31 * iostride] = tmp334 + tmp337; |
||
1147 | tmp329 = c_re(W[15]); |
||
1148 | tmp331 = c_im(W[15]); |
||
1149 | X[16 * iostride] = (tmp329 * tmp330) + (tmp331 * tmp338); |
||
1150 | Y[-15 * iostride] = (tmp329 * tmp338) - (tmp331 * tmp330); |
||
1151 | } |
||
1152 | { |
||
1153 | fftw_real tmp342; |
||
1154 | fftw_real tmp348; |
||
1155 | fftw_real tmp346; |
||
1156 | fftw_real tmp350; |
||
1157 | ASSERT_ALIGNED_DOUBLE(); |
||
1158 | { |
||
1159 | fftw_real tmp340; |
||
1160 | fftw_real tmp341; |
||
1161 | fftw_real tmp344; |
||
1162 | fftw_real tmp345; |
||
1163 | ASSERT_ALIGNED_DOUBLE(); |
||
1164 | tmp340 = tmp332 - tmp333; |
||
1165 | tmp341 = tmp220 - tmp235; |
||
1166 | tmp342 = tmp340 - tmp341; |
||
1167 | tmp348 = tmp341 + tmp340; |
||
1168 | tmp344 = tmp189 - tmp204; |
||
1169 | tmp345 = tmp336 - tmp335; |
||
1170 | tmp346 = tmp344 - tmp345; |
||
1171 | tmp350 = tmp344 + tmp345; |
||
1172 | } |
||
1173 | { |
||
1174 | fftw_real tmp339; |
||
1175 | fftw_real tmp343; |
||
1176 | fftw_real tmp347; |
||
1177 | fftw_real tmp349; |
||
1178 | ASSERT_ALIGNED_DOUBLE(); |
||
1179 | tmp339 = c_re(W[23]); |
||
1180 | tmp343 = c_im(W[23]); |
||
1181 | Y[-7 * iostride] = (tmp339 * tmp342) - (tmp343 * tmp346); |
||
1182 | X[24 * iostride] = (tmp343 * tmp342) + (tmp339 * tmp346); |
||
1183 | tmp347 = c_re(W[7]); |
||
1184 | tmp349 = c_im(W[7]); |
||
1185 | Y[-23 * iostride] = (tmp347 * tmp348) - (tmp349 * tmp350); |
||
1186 | X[8 * iostride] = (tmp349 * tmp348) + (tmp347 * tmp350); |
||
1187 | } |
||
1188 | } |
||
1189 | { |
||
1190 | fftw_real tmp254; |
||
1191 | fftw_real tmp322; |
||
1192 | fftw_real tmp289; |
||
1193 | fftw_real tmp319; |
||
1194 | fftw_real tmp308; |
||
1195 | fftw_real tmp318; |
||
1196 | fftw_real tmp311; |
||
1197 | fftw_real tmp323; |
||
1198 | ASSERT_ALIGNED_DOUBLE(); |
||
1199 | { |
||
1200 | fftw_real tmp271; |
||
1201 | fftw_real tmp288; |
||
1202 | fftw_real tmp309; |
||
1203 | fftw_real tmp310; |
||
1204 | ASSERT_ALIGNED_DOUBLE(); |
||
1205 | tmp254 = tmp238 + tmp253; |
||
1206 | tmp322 = tmp238 - tmp253; |
||
1207 | tmp271 = tmp255 - tmp270; |
||
1208 | tmp288 = tmp272 + tmp287; |
||
1209 | tmp289 = K707106781 * (tmp271 + tmp288); |
||
1210 | tmp319 = K707106781 * (tmp271 - tmp288); |
||
1211 | tmp308 = tmp292 + tmp307; |
||
1212 | tmp318 = tmp307 - tmp292; |
||
1213 | tmp309 = tmp255 + tmp270; |
||
1214 | tmp310 = tmp287 - tmp272; |
||
1215 | tmp311 = K707106781 * (tmp309 + tmp310); |
||
1216 | tmp323 = K707106781 * (tmp310 - tmp309); |
||
1217 | } |
||
1218 | { |
||
1219 | fftw_real tmp290; |
||
1220 | fftw_real tmp312; |
||
1221 | fftw_real tmp237; |
||
1222 | fftw_real tmp291; |
||
1223 | ASSERT_ALIGNED_DOUBLE(); |
||
1224 | tmp290 = tmp254 - tmp289; |
||
1225 | tmp312 = tmp308 - tmp311; |
||
1226 | tmp237 = c_re(W[19]); |
||
1227 | tmp291 = c_im(W[19]); |
||
1228 | X[20 * iostride] = (tmp237 * tmp290) + (tmp291 * tmp312); |
||
1229 | Y[-11 * iostride] = (tmp237 * tmp312) - (tmp291 * tmp290); |
||
1230 | } |
||
1231 | { |
||
1232 | fftw_real tmp314; |
||
1233 | fftw_real tmp316; |
||
1234 | fftw_real tmp313; |
||
1235 | fftw_real tmp315; |
||
1236 | ASSERT_ALIGNED_DOUBLE(); |
||
1237 | tmp314 = tmp254 + tmp289; |
||
1238 | tmp316 = tmp308 + tmp311; |
||
1239 | tmp313 = c_re(W[3]); |
||
1240 | tmp315 = c_im(W[3]); |
||
1241 | X[4 * iostride] = (tmp313 * tmp314) + (tmp315 * tmp316); |
||
1242 | Y[-27 * iostride] = (tmp313 * tmp316) - (tmp315 * tmp314); |
||
1243 | } |
||
1244 | { |
||
1245 | fftw_real tmp320; |
||
1246 | fftw_real tmp324; |
||
1247 | fftw_real tmp317; |
||
1248 | fftw_real tmp321; |
||
1249 | ASSERT_ALIGNED_DOUBLE(); |
||
1250 | tmp320 = tmp318 - tmp319; |
||
1251 | tmp324 = tmp322 - tmp323; |
||
1252 | tmp317 = c_re(W[27]); |
||
1253 | tmp321 = c_im(W[27]); |
||
1254 | Y[-3 * iostride] = (tmp317 * tmp320) - (tmp321 * tmp324); |
||
1255 | X[28 * iostride] = (tmp321 * tmp320) + (tmp317 * tmp324); |
||
1256 | } |
||
1257 | { |
||
1258 | fftw_real tmp326; |
||
1259 | fftw_real tmp328; |
||
1260 | fftw_real tmp325; |
||
1261 | fftw_real tmp327; |
||
1262 | ASSERT_ALIGNED_DOUBLE(); |
||
1263 | tmp326 = tmp318 + tmp319; |
||
1264 | tmp328 = tmp322 + tmp323; |
||
1265 | tmp325 = c_re(W[11]); |
||
1266 | tmp327 = c_im(W[11]); |
||
1267 | Y[-19 * iostride] = (tmp325 * tmp326) - (tmp327 * tmp328); |
||
1268 | X[12 * iostride] = (tmp327 * tmp326) + (tmp325 * tmp328); |
||
1269 | } |
||
1270 | } |
||
1271 | { |
||
1272 | fftw_real tmp638; |
||
1273 | fftw_real tmp664; |
||
1274 | fftw_real tmp653; |
||
1275 | fftw_real tmp665; |
||
1276 | fftw_real tmp645; |
||
1277 | fftw_real tmp661; |
||
1278 | fftw_real tmp650; |
||
1279 | fftw_real tmp660; |
||
1280 | ASSERT_ALIGNED_DOUBLE(); |
||
1281 | { |
||
1282 | fftw_real tmp636; |
||
1283 | fftw_real tmp637; |
||
1284 | fftw_real tmp651; |
||
1285 | fftw_real tmp652; |
||
1286 | ASSERT_ALIGNED_DOUBLE(); |
||
1287 | tmp636 = tmp580 + tmp581; |
||
1288 | tmp637 = tmp611 + tmp612; |
||
1289 | tmp638 = tmp636 - tmp637; |
||
1290 | tmp664 = tmp636 + tmp637; |
||
1291 | tmp651 = (K195090322 * tmp640) + (K980785280 * tmp639); |
||
1292 | tmp652 = (K195090322 * tmp643) + (K980785280 * tmp642); |
||
1293 | tmp653 = tmp651 - tmp652; |
||
1294 | tmp665 = tmp651 + tmp652; |
||
1295 | } |
||
1296 | { |
||
1297 | fftw_real tmp641; |
||
1298 | fftw_real tmp644; |
||
1299 | fftw_real tmp648; |
||
1300 | fftw_real tmp649; |
||
1301 | ASSERT_ALIGNED_DOUBLE(); |
||
1302 | tmp641 = (K195090322 * tmp639) - (K980785280 * tmp640); |
||
1303 | tmp644 = (K195090322 * tmp642) - (K980785280 * tmp643); |
||
1304 | tmp645 = tmp641 + tmp644; |
||
1305 | tmp661 = tmp641 - tmp644; |
||
1306 | tmp648 = tmp608 - tmp609; |
||
1307 | tmp649 = tmp585 - tmp588; |
||
1308 | tmp650 = tmp648 + tmp649; |
||
1309 | tmp660 = tmp648 - tmp649; |
||
1310 | } |
||
1311 | { |
||
1312 | fftw_real tmp646; |
||
1313 | fftw_real tmp654; |
||
1314 | fftw_real tmp635; |
||
1315 | fftw_real tmp647; |
||
1316 | ASSERT_ALIGNED_DOUBLE(); |
||
1317 | tmp646 = tmp638 - tmp645; |
||
1318 | tmp654 = tmp650 - tmp653; |
||
1319 | tmp635 = c_re(W[22]); |
||
1320 | tmp647 = c_im(W[22]); |
||
1321 | X[23 * iostride] = (tmp635 * tmp646) + (tmp647 * tmp654); |
||
1322 | Y[-8 * iostride] = (tmp635 * tmp654) - (tmp647 * tmp646); |
||
1323 | } |
||
1324 | { |
||
1325 | fftw_real tmp656; |
||
1326 | fftw_real tmp658; |
||
1327 | fftw_real tmp655; |
||
1328 | fftw_real tmp657; |
||
1329 | ASSERT_ALIGNED_DOUBLE(); |
||
1330 | tmp656 = tmp638 + tmp645; |
||
1331 | tmp658 = tmp650 + tmp653; |
||
1332 | tmp655 = c_re(W[6]); |
||
1333 | tmp657 = c_im(W[6]); |
||
1334 | X[7 * iostride] = (tmp655 * tmp656) + (tmp657 * tmp658); |
||
1335 | Y[-24 * iostride] = (tmp655 * tmp658) - (tmp657 * tmp656); |
||
1336 | } |
||
1337 | { |
||
1338 | fftw_real tmp662; |
||
1339 | fftw_real tmp666; |
||
1340 | fftw_real tmp659; |
||
1341 | fftw_real tmp663; |
||
1342 | ASSERT_ALIGNED_DOUBLE(); |
||
1343 | tmp662 = tmp660 + tmp661; |
||
1344 | tmp666 = tmp664 - tmp665; |
||
1345 | tmp659 = c_re(W[14]); |
||
1346 | tmp663 = c_im(W[14]); |
||
1347 | Y[-16 * iostride] = (tmp659 * tmp662) - (tmp663 * tmp666); |
||
1348 | X[15 * iostride] = (tmp663 * tmp662) + (tmp659 * tmp666); |
||
1349 | } |
||
1350 | { |
||
1351 | fftw_real tmp668; |
||
1352 | fftw_real tmp670; |
||
1353 | fftw_real tmp667; |
||
1354 | fftw_real tmp669; |
||
1355 | ASSERT_ALIGNED_DOUBLE(); |
||
1356 | tmp668 = tmp660 - tmp661; |
||
1357 | tmp670 = tmp664 + tmp665; |
||
1358 | tmp667 = c_re(W[30]); |
||
1359 | tmp669 = c_im(W[30]); |
||
1360 | Y[0] = (tmp667 * tmp668) - (tmp669 * tmp670); |
||
1361 | X[31 * iostride] = (tmp669 * tmp668) + (tmp667 * tmp670); |
||
1362 | } |
||
1363 | } |
||
1364 | { |
||
1365 | fftw_real tmp410; |
||
1366 | fftw_real tmp436; |
||
1367 | fftw_real tmp425; |
||
1368 | fftw_real tmp437; |
||
1369 | fftw_real tmp422; |
||
1370 | fftw_real tmp432; |
||
1371 | fftw_real tmp417; |
||
1372 | fftw_real tmp433; |
||
1373 | ASSERT_ALIGNED_DOUBLE(); |
||
1374 | { |
||
1375 | fftw_real tmp409; |
||
1376 | fftw_real tmp423; |
||
1377 | fftw_real tmp424; |
||
1378 | fftw_real tmp421; |
||
1379 | fftw_real tmp413; |
||
1380 | fftw_real tmp416; |
||
1381 | ASSERT_ALIGNED_DOUBLE(); |
||
1382 | tmp409 = K707106781 * (tmp383 + tmp384); |
||
1383 | tmp410 = tmp408 - tmp409; |
||
1384 | tmp436 = tmp408 + tmp409; |
||
1385 | tmp423 = (K923879532 * tmp415) - (K382683432 * tmp414); |
||
1386 | tmp424 = (K382683432 * tmp411) + (K923879532 * tmp412); |
||
1387 | tmp425 = tmp423 - tmp424; |
||
1388 | tmp437 = tmp423 + tmp424; |
||
1389 | tmp421 = K707106781 * (tmp360 + tmp357); |
||
1390 | tmp422 = tmp420 - tmp421; |
||
1391 | tmp432 = tmp420 + tmp421; |
||
1392 | tmp413 = (K923879532 * tmp411) - (K382683432 * tmp412); |
||
1393 | tmp416 = (K923879532 * tmp414) + (K382683432 * tmp415); |
||
1394 | tmp417 = tmp413 - tmp416; |
||
1395 | tmp433 = tmp416 + tmp413; |
||
1396 | } |
||
1397 | { |
||
1398 | fftw_real tmp418; |
||
1399 | fftw_real tmp426; |
||
1400 | fftw_real tmp407; |
||
1401 | fftw_real tmp419; |
||
1402 | ASSERT_ALIGNED_DOUBLE(); |
||
1403 | tmp418 = tmp410 - tmp417; |
||
1404 | tmp426 = tmp422 - tmp425; |
||
1405 | tmp407 = c_re(W[25]); |
||
1406 | tmp419 = c_im(W[25]); |
||
1407 | X[26 * iostride] = (tmp407 * tmp418) + (tmp419 * tmp426); |
||
1408 | Y[-5 * iostride] = (tmp407 * tmp426) - (tmp419 * tmp418); |
||
1409 | } |
||
1410 | { |
||
1411 | fftw_real tmp428; |
||
1412 | fftw_real tmp430; |
||
1413 | fftw_real tmp427; |
||
1414 | fftw_real tmp429; |
||
1415 | ASSERT_ALIGNED_DOUBLE(); |
||
1416 | tmp428 = tmp410 + tmp417; |
||
1417 | tmp430 = tmp422 + tmp425; |
||
1418 | tmp427 = c_re(W[9]); |
||
1419 | tmp429 = c_im(W[9]); |
||
1420 | X[10 * iostride] = (tmp427 * tmp428) + (tmp429 * tmp430); |
||
1421 | Y[-21 * iostride] = (tmp427 * tmp430) - (tmp429 * tmp428); |
||
1422 | } |
||
1423 | { |
||
1424 | fftw_real tmp434; |
||
1425 | fftw_real tmp438; |
||
1426 | fftw_real tmp431; |
||
1427 | fftw_real tmp435; |
||
1428 | ASSERT_ALIGNED_DOUBLE(); |
||
1429 | tmp434 = tmp432 - tmp433; |
||
1430 | tmp438 = tmp436 - tmp437; |
||
1431 | tmp431 = c_re(W[17]); |
||
1432 | tmp435 = c_im(W[17]); |
||
1433 | Y[-13 * iostride] = (tmp431 * tmp434) - (tmp435 * tmp438); |
||
1434 | X[18 * iostride] = (tmp435 * tmp434) + (tmp431 * tmp438); |
||
1435 | } |
||
1436 | { |
||
1437 | fftw_real tmp440; |
||
1438 | fftw_real tmp442; |
||
1439 | fftw_real tmp439; |
||
1440 | fftw_real tmp441; |
||
1441 | ASSERT_ALIGNED_DOUBLE(); |
||
1442 | tmp440 = tmp432 + tmp433; |
||
1443 | tmp442 = tmp436 + tmp437; |
||
1444 | tmp439 = c_re(W[1]); |
||
1445 | tmp441 = c_im(W[1]); |
||
1446 | Y[-29 * iostride] = (tmp439 * tmp440) - (tmp441 * tmp442); |
||
1447 | X[2 * iostride] = (tmp441 * tmp440) + (tmp439 * tmp442); |
||
1448 | } |
||
1449 | } |
||
1450 | { |
||
1451 | fftw_real tmp362; |
||
1452 | fftw_real tmp400; |
||
1453 | fftw_real tmp389; |
||
1454 | fftw_real tmp401; |
||
1455 | fftw_real tmp386; |
||
1456 | fftw_real tmp396; |
||
1457 | fftw_real tmp377; |
||
1458 | fftw_real tmp397; |
||
1459 | ASSERT_ALIGNED_DOUBLE(); |
||
1460 | { |
||
1461 | fftw_real tmp361; |
||
1462 | fftw_real tmp387; |
||
1463 | fftw_real tmp388; |
||
1464 | fftw_real tmp385; |
||
1465 | fftw_real tmp369; |
||
1466 | fftw_real tmp376; |
||
1467 | ASSERT_ALIGNED_DOUBLE(); |
||
1468 | tmp361 = K707106781 * (tmp357 - tmp360); |
||
1469 | tmp362 = tmp354 - tmp361; |
||
1470 | tmp400 = tmp354 + tmp361; |
||
1471 | tmp387 = (K382683432 * tmp375) - (K923879532 * tmp372); |
||
1472 | tmp388 = (K923879532 * tmp365) + (K382683432 * tmp368); |
||
1473 | tmp389 = tmp387 - tmp388; |
||
1474 | tmp401 = tmp387 + tmp388; |
||
1475 | tmp385 = K707106781 * (tmp383 - tmp384); |
||
1476 | tmp386 = tmp382 - tmp385; |
||
1477 | tmp396 = tmp382 + tmp385; |
||
1478 | tmp369 = (K382683432 * tmp365) - (K923879532 * tmp368); |
||
1479 | tmp376 = (K382683432 * tmp372) + (K923879532 * tmp375); |
||
1480 | tmp377 = tmp369 - tmp376; |
||
1481 | tmp397 = tmp376 + tmp369; |
||
1482 | } |
||
1483 | { |
||
1484 | fftw_real tmp378; |
||
1485 | fftw_real tmp390; |
||
1486 | fftw_real tmp351; |
||
1487 | fftw_real tmp379; |
||
1488 | ASSERT_ALIGNED_DOUBLE(); |
||
1489 | tmp378 = tmp362 - tmp377; |
||
1490 | tmp390 = tmp386 - tmp389; |
||
1491 | tmp351 = c_re(W[29]); |
||
1492 | tmp379 = c_im(W[29]); |
||
1493 | X[30 * iostride] = (tmp351 * tmp378) + (tmp379 * tmp390); |
||
1494 | Y[-iostride] = (tmp351 * tmp390) - (tmp379 * tmp378); |
||
1495 | } |
||
1496 | { |
||
1497 | fftw_real tmp392; |
||
1498 | fftw_real tmp394; |
||
1499 | fftw_real tmp391; |
||
1500 | fftw_real tmp393; |
||
1501 | ASSERT_ALIGNED_DOUBLE(); |
||
1502 | tmp392 = tmp362 + tmp377; |
||
1503 | tmp394 = tmp386 + tmp389; |
||
1504 | tmp391 = c_re(W[13]); |
||
1505 | tmp393 = c_im(W[13]); |
||
1506 | X[14 * iostride] = (tmp391 * tmp392) + (tmp393 * tmp394); |
||
1507 | Y[-17 * iostride] = (tmp391 * tmp394) - (tmp393 * tmp392); |
||
1508 | } |
||
1509 | { |
||
1510 | fftw_real tmp398; |
||
1511 | fftw_real tmp402; |
||
1512 | fftw_real tmp395; |
||
1513 | fftw_real tmp399; |
||
1514 | ASSERT_ALIGNED_DOUBLE(); |
||
1515 | tmp398 = tmp396 - tmp397; |
||
1516 | tmp402 = tmp400 - tmp401; |
||
1517 | tmp395 = c_re(W[21]); |
||
1518 | tmp399 = c_im(W[21]); |
||
1519 | Y[-9 * iostride] = (tmp395 * tmp398) - (tmp399 * tmp402); |
||
1520 | X[22 * iostride] = (tmp399 * tmp398) + (tmp395 * tmp402); |
||
1521 | } |
||
1522 | { |
||
1523 | fftw_real tmp404; |
||
1524 | fftw_real tmp406; |
||
1525 | fftw_real tmp403; |
||
1526 | fftw_real tmp405; |
||
1527 | ASSERT_ALIGNED_DOUBLE(); |
||
1528 | tmp404 = tmp396 + tmp397; |
||
1529 | tmp406 = tmp400 + tmp401; |
||
1530 | tmp403 = c_re(W[5]); |
||
1531 | tmp405 = c_im(W[5]); |
||
1532 | Y[-25 * iostride] = (tmp403 * tmp404) - (tmp405 * tmp406); |
||
1533 | X[6 * iostride] = (tmp405 * tmp404) + (tmp403 * tmp406); |
||
1534 | } |
||
1535 | } |
||
1536 | { |
||
1537 | fftw_real tmp590; |
||
1538 | fftw_real tmp628; |
||
1539 | fftw_real tmp617; |
||
1540 | fftw_real tmp629; |
||
1541 | fftw_real tmp605; |
||
1542 | fftw_real tmp625; |
||
1543 | fftw_real tmp614; |
||
1544 | fftw_real tmp624; |
||
1545 | ASSERT_ALIGNED_DOUBLE(); |
||
1546 | { |
||
1547 | fftw_real tmp582; |
||
1548 | fftw_real tmp589; |
||
1549 | fftw_real tmp615; |
||
1550 | fftw_real tmp616; |
||
1551 | ASSERT_ALIGNED_DOUBLE(); |
||
1552 | tmp582 = tmp580 - tmp581; |
||
1553 | tmp589 = tmp585 + tmp588; |
||
1554 | tmp590 = tmp582 - tmp589; |
||
1555 | tmp628 = tmp582 + tmp589; |
||
1556 | tmp615 = (K831469612 * tmp603) - (K555570233 * tmp600); |
||
1557 | tmp616 = (K555570233 * tmp593) + (K831469612 * tmp596); |
||
1558 | tmp617 = tmp615 - tmp616; |
||
1559 | tmp629 = tmp615 + tmp616; |
||
1560 | } |
||
1561 | { |
||
1562 | fftw_real tmp597; |
||
1563 | fftw_real tmp604; |
||
1564 | fftw_real tmp610; |
||
1565 | fftw_real tmp613; |
||
1566 | ASSERT_ALIGNED_DOUBLE(); |
||
1567 | tmp597 = (K831469612 * tmp593) - (K555570233 * tmp596); |
||
1568 | tmp604 = (K831469612 * tmp600) + (K555570233 * tmp603); |
||
1569 | tmp605 = tmp597 - tmp604; |
||
1570 | tmp625 = tmp604 + tmp597; |
||
1571 | tmp610 = tmp608 + tmp609; |
||
1572 | tmp613 = tmp611 - tmp612; |
||
1573 | tmp614 = tmp610 - tmp613; |
||
1574 | tmp624 = tmp610 + tmp613; |
||
1575 | } |
||
1576 | { |
||
1577 | fftw_real tmp606; |
||
1578 | fftw_real tmp618; |
||
1579 | fftw_real tmp579; |
||
1580 | fftw_real tmp607; |
||
1581 | ASSERT_ALIGNED_DOUBLE(); |
||
1582 | tmp606 = tmp590 - tmp605; |
||
1583 | tmp618 = tmp614 - tmp617; |
||
1584 | tmp579 = c_re(W[26]); |
||
1585 | tmp607 = c_im(W[26]); |
||
1586 | X[27 * iostride] = (tmp579 * tmp606) + (tmp607 * tmp618); |
||
1587 | Y[-4 * iostride] = (tmp579 * tmp618) - (tmp607 * tmp606); |
||
1588 | } |
||
1589 | { |
||
1590 | fftw_real tmp620; |
||
1591 | fftw_real tmp622; |
||
1592 | fftw_real tmp619; |
||
1593 | fftw_real tmp621; |
||
1594 | ASSERT_ALIGNED_DOUBLE(); |
||
1595 | tmp620 = tmp590 + tmp605; |
||
1596 | tmp622 = tmp614 + tmp617; |
||
1597 | tmp619 = c_re(W[10]); |
||
1598 | tmp621 = c_im(W[10]); |
||
1599 | X[11 * iostride] = (tmp619 * tmp620) + (tmp621 * tmp622); |
||
1600 | Y[-20 * iostride] = (tmp619 * tmp622) - (tmp621 * tmp620); |
||
1601 | } |
||
1602 | { |
||
1603 | fftw_real tmp626; |
||
1604 | fftw_real tmp630; |
||
1605 | fftw_real tmp623; |
||
1606 | fftw_real tmp627; |
||
1607 | ASSERT_ALIGNED_DOUBLE(); |
||
1608 | tmp626 = tmp624 - tmp625; |
||
1609 | tmp630 = tmp628 - tmp629; |
||
1610 | tmp623 = c_re(W[18]); |
||
1611 | tmp627 = c_im(W[18]); |
||
1612 | Y[-12 * iostride] = (tmp623 * tmp626) - (tmp627 * tmp630); |
||
1613 | X[19 * iostride] = (tmp627 * tmp626) + (tmp623 * tmp630); |
||
1614 | } |
||
1615 | { |
||
1616 | fftw_real tmp632; |
||
1617 | fftw_real tmp634; |
||
1618 | fftw_real tmp631; |
||
1619 | fftw_real tmp633; |
||
1620 | ASSERT_ALIGNED_DOUBLE(); |
||
1621 | tmp632 = tmp624 + tmp625; |
||
1622 | tmp634 = tmp628 + tmp629; |
||
1623 | tmp631 = c_re(W[2]); |
||
1624 | tmp633 = c_im(W[2]); |
||
1625 | Y[-28 * iostride] = (tmp631 * tmp632) - (tmp633 * tmp634); |
||
1626 | X[3 * iostride] = (tmp633 * tmp632) + (tmp631 * tmp634); |
||
1627 | } |
||
1628 | } |
||
1629 | { |
||
1630 | fftw_real tmp546; |
||
1631 | fftw_real tmp572; |
||
1632 | fftw_real tmp561; |
||
1633 | fftw_real tmp573; |
||
1634 | fftw_real tmp553; |
||
1635 | fftw_real tmp569; |
||
1636 | fftw_real tmp558; |
||
1637 | fftw_real tmp568; |
||
1638 | ASSERT_ALIGNED_DOUBLE(); |
||
1639 | { |
||
1640 | fftw_real tmp544; |
||
1641 | fftw_real tmp545; |
||
1642 | fftw_real tmp559; |
||
1643 | fftw_real tmp560; |
||
1644 | ASSERT_ALIGNED_DOUBLE(); |
||
1645 | tmp544 = tmp446 + tmp453; |
||
1646 | tmp545 = tmp519 + tmp520; |
||
1647 | tmp546 = tmp544 + tmp545; |
||
1648 | tmp572 = tmp544 - tmp545; |
||
1649 | tmp559 = (K195090322 * tmp547) + (K980785280 * tmp548); |
||
1650 | tmp560 = (K980785280 * tmp551) - (K195090322 * tmp550); |
||
1651 | tmp561 = tmp559 + tmp560; |
||
1652 | tmp573 = tmp560 - tmp559; |
||
1653 | } |
||
1654 | { |
||
1655 | fftw_real tmp549; |
||
1656 | fftw_real tmp552; |
||
1657 | fftw_real tmp556; |
||
1658 | fftw_real tmp557; |
||
1659 | ASSERT_ALIGNED_DOUBLE(); |
||
1660 | tmp549 = (K980785280 * tmp547) - (K195090322 * tmp548); |
||
1661 | tmp552 = (K980785280 * tmp550) + (K195090322 * tmp551); |
||
1662 | tmp553 = tmp549 + tmp552; |
||
1663 | tmp569 = tmp549 - tmp552; |
||
1664 | tmp556 = tmp514 + tmp517; |
||
1665 | tmp557 = tmp468 + tmp461; |
||
1666 | tmp558 = tmp556 + tmp557; |
||
1667 | tmp568 = tmp556 - tmp557; |
||
1668 | } |
||
1669 | { |
||
1670 | fftw_real tmp554; |
||
1671 | fftw_real tmp562; |
||
1672 | fftw_real tmp543; |
||
1673 | fftw_real tmp555; |
||
1674 | ASSERT_ALIGNED_DOUBLE(); |
||
1675 | tmp554 = tmp546 - tmp553; |
||
1676 | tmp562 = tmp558 - tmp561; |
||
1677 | tmp543 = c_re(W[16]); |
||
1678 | tmp555 = c_im(W[16]); |
||
1679 | X[17 * iostride] = (tmp543 * tmp554) + (tmp555 * tmp562); |
||
1680 | Y[-14 * iostride] = (tmp543 * tmp562) - (tmp555 * tmp554); |
||
1681 | } |
||
1682 | { |
||
1683 | fftw_real tmp564; |
||
1684 | fftw_real tmp566; |
||
1685 | fftw_real tmp563; |
||
1686 | fftw_real tmp565; |
||
1687 | ASSERT_ALIGNED_DOUBLE(); |
||
1688 | tmp564 = tmp546 + tmp553; |
||
1689 | tmp566 = tmp558 + tmp561; |
||
1690 | tmp563 = c_re(W[0]); |
||
1691 | tmp565 = c_im(W[0]); |
||
1692 | X[iostride] = (tmp563 * tmp564) + (tmp565 * tmp566); |
||
1693 | Y[-30 * iostride] = (tmp563 * tmp566) - (tmp565 * tmp564); |
||
1694 | } |
||
1695 | { |
||
1696 | fftw_real tmp570; |
||
1697 | fftw_real tmp574; |
||
1698 | fftw_real tmp567; |
||
1699 | fftw_real tmp571; |
||
1700 | ASSERT_ALIGNED_DOUBLE(); |
||
1701 | tmp570 = tmp568 - tmp569; |
||
1702 | tmp574 = tmp572 - tmp573; |
||
1703 | tmp567 = c_re(W[24]); |
||
1704 | tmp571 = c_im(W[24]); |
||
1705 | Y[-6 * iostride] = (tmp567 * tmp570) - (tmp571 * tmp574); |
||
1706 | X[25 * iostride] = (tmp571 * tmp570) + (tmp567 * tmp574); |
||
1707 | } |
||
1708 | { |
||
1709 | fftw_real tmp576; |
||
1710 | fftw_real tmp578; |
||
1711 | fftw_real tmp575; |
||
1712 | fftw_real tmp577; |
||
1713 | ASSERT_ALIGNED_DOUBLE(); |
||
1714 | tmp576 = tmp568 + tmp569; |
||
1715 | tmp578 = tmp572 + tmp573; |
||
1716 | tmp575 = c_re(W[8]); |
||
1717 | tmp577 = c_im(W[8]); |
||
1718 | Y[-22 * iostride] = (tmp575 * tmp576) - (tmp577 * tmp578); |
||
1719 | X[9 * iostride] = (tmp577 * tmp576) + (tmp575 * tmp578); |
||
1720 | } |
||
1721 | } |
||
1722 | { |
||
1723 | fftw_real tmp470; |
||
1724 | fftw_real tmp536; |
||
1725 | fftw_real tmp525; |
||
1726 | fftw_real tmp537; |
||
1727 | fftw_real tmp509; |
||
1728 | fftw_real tmp533; |
||
1729 | fftw_real tmp522; |
||
1730 | fftw_real tmp532; |
||
1731 | ASSERT_ALIGNED_DOUBLE(); |
||
1732 | { |
||
1733 | fftw_real tmp454; |
||
1734 | fftw_real tmp469; |
||
1735 | fftw_real tmp523; |
||
1736 | fftw_real tmp524; |
||
1737 | ASSERT_ALIGNED_DOUBLE(); |
||
1738 | tmp454 = tmp446 - tmp453; |
||
1739 | tmp469 = tmp461 - tmp468; |
||
1740 | tmp470 = tmp454 + tmp469; |
||
1741 | tmp536 = tmp454 - tmp469; |
||
1742 | tmp523 = (K831469612 * tmp481) + (K555570233 * tmp488); |
||
1743 | tmp524 = (K555570233 * tmp507) - (K831469612 * tmp500); |
||
1744 | tmp525 = tmp523 + tmp524; |
||
1745 | tmp537 = tmp524 - tmp523; |
||
1746 | } |
||
1747 | { |
||
1748 | fftw_real tmp489; |
||
1749 | fftw_real tmp508; |
||
1750 | fftw_real tmp518; |
||
1751 | fftw_real tmp521; |
||
1752 | ASSERT_ALIGNED_DOUBLE(); |
||
1753 | tmp489 = (K555570233 * tmp481) - (K831469612 * tmp488); |
||
1754 | tmp508 = (K555570233 * tmp500) + (K831469612 * tmp507); |
||
1755 | tmp509 = tmp489 + tmp508; |
||
1756 | tmp533 = tmp489 - tmp508; |
||
1757 | tmp518 = tmp514 - tmp517; |
||
1758 | tmp521 = tmp519 - tmp520; |
||
1759 | tmp522 = tmp518 + tmp521; |
||
1760 | tmp532 = tmp518 - tmp521; |
||
1761 | } |
||
1762 | { |
||
1763 | fftw_real tmp510; |
||
1764 | fftw_real tmp526; |
||
1765 | fftw_real tmp443; |
||
1766 | fftw_real tmp511; |
||
1767 | ASSERT_ALIGNED_DOUBLE(); |
||
1768 | tmp510 = tmp470 - tmp509; |
||
1769 | tmp526 = tmp522 - tmp525; |
||
1770 | tmp443 = c_re(W[20]); |
||
1771 | tmp511 = c_im(W[20]); |
||
1772 | X[21 * iostride] = (tmp443 * tmp510) + (tmp511 * tmp526); |
||
1773 | Y[-10 * iostride] = (tmp443 * tmp526) - (tmp511 * tmp510); |
||
1774 | } |
||
1775 | { |
||
1776 | fftw_real tmp528; |
||
1777 | fftw_real tmp530; |
||
1778 | fftw_real tmp527; |
||
1779 | fftw_real tmp529; |
||
1780 | ASSERT_ALIGNED_DOUBLE(); |
||
1781 | tmp528 = tmp470 + tmp509; |
||
1782 | tmp530 = tmp522 + tmp525; |
||
1783 | tmp527 = c_re(W[4]); |
||
1784 | tmp529 = c_im(W[4]); |
||
1785 | X[5 * iostride] = (tmp527 * tmp528) + (tmp529 * tmp530); |
||
1786 | Y[-26 * iostride] = (tmp527 * tmp530) - (tmp529 * tmp528); |
||
1787 | } |
||
1788 | { |
||
1789 | fftw_real tmp534; |
||
1790 | fftw_real tmp538; |
||
1791 | fftw_real tmp531; |
||
1792 | fftw_real tmp535; |
||
1793 | ASSERT_ALIGNED_DOUBLE(); |
||
1794 | tmp534 = tmp532 - tmp533; |
||
1795 | tmp538 = tmp536 - tmp537; |
||
1796 | tmp531 = c_re(W[28]); |
||
1797 | tmp535 = c_im(W[28]); |
||
1798 | Y[-2 * iostride] = (tmp531 * tmp534) - (tmp535 * tmp538); |
||
1799 | X[29 * iostride] = (tmp535 * tmp534) + (tmp531 * tmp538); |
||
1800 | } |
||
1801 | { |
||
1802 | fftw_real tmp540; |
||
1803 | fftw_real tmp542; |
||
1804 | fftw_real tmp539; |
||
1805 | fftw_real tmp541; |
||
1806 | ASSERT_ALIGNED_DOUBLE(); |
||
1807 | tmp540 = tmp532 + tmp533; |
||
1808 | tmp542 = tmp536 + tmp537; |
||
1809 | tmp539 = c_re(W[12]); |
||
1810 | tmp541 = c_im(W[12]); |
||
1811 | Y[-18 * iostride] = (tmp539 * tmp540) - (tmp541 * tmp542); |
||
1812 | X[13 * iostride] = (tmp541 * tmp540) + (tmp539 * tmp542); |
||
1813 | } |
||
1814 | } |
||
1815 | } |
||
1816 | if (i == m) { |
||
1817 | fftw_real tmp7; |
||
1818 | fftw_real tmp123; |
||
1819 | fftw_real tmp35; |
||
1820 | fftw_real tmp95; |
||
1821 | fftw_real tmp82; |
||
1822 | fftw_real tmp110; |
||
1823 | fftw_real tmp146; |
||
1824 | fftw_real tmp165; |
||
1825 | fftw_real tmp29; |
||
1826 | fftw_real tmp137; |
||
1827 | fftw_real tmp141; |
||
1828 | fftw_real tmp160; |
||
1829 | fftw_real tmp69; |
||
1830 | fftw_real tmp73; |
||
1831 | fftw_real tmp103; |
||
1832 | fftw_real tmp107; |
||
1833 | fftw_real tmp14; |
||
1834 | fftw_real tmp143; |
||
1835 | fftw_real tmp46; |
||
1836 | fftw_real tmp109; |
||
1837 | fftw_real tmp126; |
||
1838 | fftw_real tmp166; |
||
1839 | fftw_real tmp77; |
||
1840 | fftw_real tmp96; |
||
1841 | fftw_real tmp22; |
||
1842 | fftw_real tmp132; |
||
1843 | fftw_real tmp140; |
||
1844 | fftw_real tmp161; |
||
1845 | fftw_real tmp58; |
||
1846 | fftw_real tmp72; |
||
1847 | fftw_real tmp100; |
||
1848 | fftw_real tmp106; |
||
1849 | ASSERT_ALIGNED_DOUBLE(); |
||
1850 | { |
||
1851 | fftw_real tmp3; |
||
1852 | fftw_real tmp31; |
||
1853 | fftw_real tmp81; |
||
1854 | fftw_real tmp144; |
||
1855 | fftw_real tmp6; |
||
1856 | fftw_real tmp78; |
||
1857 | fftw_real tmp34; |
||
1858 | fftw_real tmp145; |
||
1859 | ASSERT_ALIGNED_DOUBLE(); |
||
1860 | { |
||
1861 | fftw_real tmp1; |
||
1862 | fftw_real tmp2; |
||
1863 | fftw_real tmp79; |
||
1864 | fftw_real tmp80; |
||
1865 | ASSERT_ALIGNED_DOUBLE(); |
||
1866 | tmp1 = X[0]; |
||
1867 | tmp2 = X[15 * iostride]; |
||
1868 | tmp3 = tmp1 + tmp2; |
||
1869 | tmp31 = tmp1 - tmp2; |
||
1870 | tmp79 = Y[0]; |
||
1871 | tmp80 = Y[-15 * iostride]; |
||
1872 | tmp81 = tmp79 + tmp80; |
||
1873 | tmp144 = tmp79 - tmp80; |
||
1874 | } |
||
1875 | { |
||
1876 | fftw_real tmp4; |
||
1877 | fftw_real tmp5; |
||
1878 | fftw_real tmp32; |
||
1879 | fftw_real tmp33; |
||
1880 | ASSERT_ALIGNED_DOUBLE(); |
||
1881 | tmp4 = X[8 * iostride]; |
||
1882 | tmp5 = X[7 * iostride]; |
||
1883 | tmp6 = tmp4 + tmp5; |
||
1884 | tmp78 = tmp4 - tmp5; |
||
1885 | tmp32 = Y[-8 * iostride]; |
||
1886 | tmp33 = Y[-7 * iostride]; |
||
1887 | tmp34 = tmp32 + tmp33; |
||
1888 | tmp145 = tmp32 - tmp33; |
||
1889 | } |
||
1890 | tmp7 = tmp3 + tmp6; |
||
1891 | tmp123 = tmp3 - tmp6; |
||
1892 | tmp35 = tmp31 - tmp34; |
||
1893 | tmp95 = tmp31 + tmp34; |
||
1894 | tmp82 = tmp78 + tmp81; |
||
1895 | tmp110 = tmp81 - tmp78; |
||
1896 | tmp146 = tmp144 - tmp145; |
||
1897 | tmp165 = tmp145 + tmp144; |
||
1898 | } |
||
1899 | { |
||
1900 | fftw_real tmp25; |
||
1901 | fftw_real tmp59; |
||
1902 | fftw_real tmp67; |
||
1903 | fftw_real tmp134; |
||
1904 | fftw_real tmp28; |
||
1905 | fftw_real tmp64; |
||
1906 | fftw_real tmp62; |
||
1907 | fftw_real tmp135; |
||
1908 | fftw_real tmp133; |
||
1909 | fftw_real tmp136; |
||
1910 | ASSERT_ALIGNED_DOUBLE(); |
||
1911 | { |
||
1912 | fftw_real tmp23; |
||
1913 | fftw_real tmp24; |
||
1914 | fftw_real tmp65; |
||
1915 | fftw_real tmp66; |
||
1916 | ASSERT_ALIGNED_DOUBLE(); |
||
1917 | tmp23 = X[iostride]; |
||
1918 | tmp24 = X[14 * iostride]; |
||
1919 | tmp25 = tmp23 + tmp24; |
||
1920 | tmp59 = tmp23 - tmp24; |
||
1921 | tmp65 = Y[-iostride]; |
||
1922 | tmp66 = Y[-14 * iostride]; |
||
1923 | tmp67 = tmp65 + tmp66; |
||
1924 | tmp134 = tmp66 - tmp65; |
||
1925 | } |
||
1926 | { |
||
1927 | fftw_real tmp26; |
||
1928 | fftw_real tmp27; |
||
1929 | fftw_real tmp60; |
||
1930 | fftw_real tmp61; |
||
1931 | ASSERT_ALIGNED_DOUBLE(); |
||
1932 | tmp26 = X[6 * iostride]; |
||
1933 | tmp27 = X[9 * iostride]; |
||
1934 | tmp28 = tmp26 + tmp27; |
||
1935 | tmp64 = tmp26 - tmp27; |
||
1936 | tmp60 = Y[-6 * iostride]; |
||
1937 | tmp61 = Y[-9 * iostride]; |
||
1938 | tmp62 = tmp60 + tmp61; |
||
1939 | tmp135 = tmp60 - tmp61; |
||
1940 | } |
||
1941 | tmp29 = tmp25 + tmp28; |
||
1942 | tmp133 = tmp25 - tmp28; |
||
1943 | tmp136 = tmp134 - tmp135; |
||
1944 | tmp137 = tmp133 + tmp136; |
||
1945 | tmp141 = tmp136 - tmp133; |
||
1946 | tmp160 = tmp135 + tmp134; |
||
1947 | { |
||
1948 | fftw_real tmp63; |
||
1949 | fftw_real tmp68; |
||
1950 | fftw_real tmp101; |
||
1951 | fftw_real tmp102; |
||
1952 | ASSERT_ALIGNED_DOUBLE(); |
||
1953 | tmp63 = tmp59 - tmp62; |
||
1954 | tmp68 = tmp64 - tmp67; |
||
1955 | tmp69 = (K923879532 * tmp63) + (K382683432 * tmp68); |
||
1956 | tmp73 = (K923879532 * tmp68) - (K382683432 * tmp63); |
||
1957 | tmp101 = tmp59 + tmp62; |
||
1958 | tmp102 = tmp64 + tmp67; |
||
1959 | tmp103 = (K382683432 * tmp101) - (K923879532 * tmp102); |
||
1960 | tmp107 = (K923879532 * tmp101) + (K382683432 * tmp102); |
||
1961 | } |
||
1962 | } |
||
1963 | { |
||
1964 | fftw_real tmp10; |
||
1965 | fftw_real tmp36; |
||
1966 | fftw_real tmp39; |
||
1967 | fftw_real tmp125; |
||
1968 | fftw_real tmp13; |
||
1969 | fftw_real tmp41; |
||
1970 | fftw_real tmp44; |
||
1971 | fftw_real tmp124; |
||
1972 | ASSERT_ALIGNED_DOUBLE(); |
||
1973 | { |
||
1974 | fftw_real tmp8; |
||
1975 | fftw_real tmp9; |
||
1976 | fftw_real tmp37; |
||
1977 | fftw_real tmp38; |
||
1978 | ASSERT_ALIGNED_DOUBLE(); |
||
1979 | tmp8 = X[4 * iostride]; |
||
1980 | tmp9 = X[11 * iostride]; |
||
1981 | tmp10 = tmp8 + tmp9; |
||
1982 | tmp36 = tmp8 - tmp9; |
||
1983 | tmp37 = Y[-4 * iostride]; |
||
1984 | tmp38 = Y[-11 * iostride]; |
||
1985 | tmp39 = tmp37 + tmp38; |
||
1986 | tmp125 = tmp37 - tmp38; |
||
1987 | } |
||
1988 | { |
||
1989 | fftw_real tmp11; |
||
1990 | fftw_real tmp12; |
||
1991 | fftw_real tmp42; |
||
1992 | fftw_real tmp43; |
||
1993 | ASSERT_ALIGNED_DOUBLE(); |
||
1994 | tmp11 = X[3 * iostride]; |
||
1995 | tmp12 = X[12 * iostride]; |
||
1996 | tmp13 = tmp11 + tmp12; |
||
1997 | tmp41 = tmp11 - tmp12; |
||
1998 | tmp42 = Y[-3 * iostride]; |
||
1999 | tmp43 = Y[-12 * iostride]; |
||
2000 | tmp44 = tmp42 + tmp43; |
||
2001 | tmp124 = tmp43 - tmp42; |
||
2002 | } |
||
2003 | { |
||
2004 | fftw_real tmp40; |
||
2005 | fftw_real tmp45; |
||
2006 | fftw_real tmp75; |
||
2007 | fftw_real tmp76; |
||
2008 | ASSERT_ALIGNED_DOUBLE(); |
||
2009 | tmp14 = tmp10 + tmp13; |
||
2010 | tmp143 = tmp10 - tmp13; |
||
2011 | tmp40 = tmp36 - tmp39; |
||
2012 | tmp45 = tmp41 - tmp44; |
||
2013 | tmp46 = K707106781 * (tmp40 + tmp45); |
||
2014 | tmp109 = K707106781 * (tmp40 - tmp45); |
||
2015 | tmp126 = tmp124 - tmp125; |
||
2016 | tmp166 = tmp125 + tmp124; |
||
2017 | tmp75 = tmp36 + tmp39; |
||
2018 | tmp76 = tmp41 + tmp44; |
||
2019 | tmp77 = K707106781 * (tmp75 - tmp76); |
||
2020 | tmp96 = K707106781 * (tmp75 + tmp76); |
||
2021 | } |
||
2022 | } |
||
2023 | { |
||
2024 | fftw_real tmp18; |
||
2025 | fftw_real tmp48; |
||
2026 | fftw_real tmp56; |
||
2027 | fftw_real tmp129; |
||
2028 | fftw_real tmp21; |
||
2029 | fftw_real tmp53; |
||
2030 | fftw_real tmp51; |
||
2031 | fftw_real tmp130; |
||
2032 | fftw_real tmp128; |
||
2033 | fftw_real tmp131; |
||
2034 | ASSERT_ALIGNED_DOUBLE(); |
||
2035 | { |
||
2036 | fftw_real tmp16; |
||
2037 | fftw_real tmp17; |
||
2038 | fftw_real tmp54; |
||
2039 | fftw_real tmp55; |
||
2040 | ASSERT_ALIGNED_DOUBLE(); |
||
2041 | tmp16 = X[2 * iostride]; |
||
2042 | tmp17 = X[13 * iostride]; |
||
2043 | tmp18 = tmp16 + tmp17; |
||
2044 | tmp48 = tmp16 - tmp17; |
||
2045 | tmp54 = Y[-2 * iostride]; |
||
2046 | tmp55 = Y[-13 * iostride]; |
||
2047 | tmp56 = tmp54 + tmp55; |
||
2048 | tmp129 = tmp54 - tmp55; |
||
2049 | } |
||
2050 | { |
||
2051 | fftw_real tmp19; |
||
2052 | fftw_real tmp20; |
||
2053 | fftw_real tmp49; |
||
2054 | fftw_real tmp50; |
||
2055 | ASSERT_ALIGNED_DOUBLE(); |
||
2056 | tmp19 = X[10 * iostride]; |
||
2057 | tmp20 = X[5 * iostride]; |
||
2058 | tmp21 = tmp19 + tmp20; |
||
2059 | tmp53 = tmp19 - tmp20; |
||
2060 | tmp49 = Y[-10 * iostride]; |
||
2061 | tmp50 = Y[-5 * iostride]; |
||
2062 | tmp51 = tmp49 + tmp50; |
||
2063 | tmp130 = tmp49 - tmp50; |
||
2064 | } |
||
2065 | tmp22 = tmp18 + tmp21; |
||
2066 | tmp128 = tmp18 - tmp21; |
||
2067 | tmp131 = tmp129 - tmp130; |
||
2068 | tmp132 = tmp128 - tmp131; |
||
2069 | tmp140 = tmp128 + tmp131; |
||
2070 | tmp161 = tmp130 + tmp129; |
||
2071 | { |
||
2072 | fftw_real tmp52; |
||
2073 | fftw_real tmp57; |
||
2074 | fftw_real tmp98; |
||
2075 | fftw_real tmp99; |
||
2076 | ASSERT_ALIGNED_DOUBLE(); |
||
2077 | tmp52 = tmp48 - tmp51; |
||
2078 | tmp57 = tmp53 + tmp56; |
||
2079 | tmp58 = (K923879532 * tmp52) - (K382683432 * tmp57); |
||
2080 | tmp72 = (K382683432 * tmp52) + (K923879532 * tmp57); |
||
2081 | tmp98 = tmp48 + tmp51; |
||
2082 | tmp99 = tmp56 - tmp53; |
||
2083 | tmp100 = (K382683432 * tmp98) - (K923879532 * tmp99); |
||
2084 | tmp106 = (K923879532 * tmp98) + (K382683432 * tmp99); |
||
2085 | } |
||
2086 | } |
||
2087 | { |
||
2088 | fftw_real tmp15; |
||
2089 | fftw_real tmp30; |
||
2090 | fftw_real tmp171; |
||
2091 | fftw_real tmp172; |
||
2092 | fftw_real tmp173; |
||
2093 | fftw_real tmp174; |
||
2094 | ASSERT_ALIGNED_DOUBLE(); |
||
2095 | tmp15 = tmp7 + tmp14; |
||
2096 | tmp30 = tmp22 + tmp29; |
||
2097 | tmp171 = tmp15 - tmp30; |
||
2098 | tmp172 = tmp166 + tmp165; |
||
2099 | tmp173 = tmp161 + tmp160; |
||
2100 | tmp174 = tmp172 - tmp173; |
||
2101 | X[0] = K2_000000000 * (tmp15 + tmp30); |
||
2102 | X[16 * iostride] = -(K2_000000000 * (tmp173 + tmp172)); |
||
2103 | X[8 * iostride] = K1_414213562 * (tmp171 - tmp174); |
||
2104 | X[24 * iostride] = -(K1_414213562 * (tmp171 + tmp174)); |
||
2105 | } |
||
2106 | { |
||
2107 | fftw_real tmp163; |
||
2108 | fftw_real tmp169; |
||
2109 | fftw_real tmp168; |
||
2110 | fftw_real tmp170; |
||
2111 | ASSERT_ALIGNED_DOUBLE(); |
||
2112 | { |
||
2113 | fftw_real tmp159; |
||
2114 | fftw_real tmp162; |
||
2115 | fftw_real tmp164; |
||
2116 | fftw_real tmp167; |
||
2117 | ASSERT_ALIGNED_DOUBLE(); |
||
2118 | tmp159 = tmp7 - tmp14; |
||
2119 | tmp162 = tmp160 - tmp161; |
||
2120 | tmp163 = tmp159 + tmp162; |
||
2121 | tmp169 = tmp159 - tmp162; |
||
2122 | tmp164 = tmp22 - tmp29; |
||
2123 | tmp167 = tmp165 - tmp166; |
||
2124 | tmp168 = tmp164 + tmp167; |
||
2125 | tmp170 = tmp167 - tmp164; |
||
2126 | } |
||
2127 | X[4 * iostride] = (K1_847759065 * tmp163) - (K765366864 * tmp168); |
||
2128 | X[20 * iostride] = -((K765366864 * tmp163) + (K1_847759065 * tmp168)); |
||
2129 | X[12 * iostride] = (K765366864 * tmp169) - (K1_847759065 * tmp170); |
||
2130 | X[28 * iostride] = -((K1_847759065 * tmp169) + (K765366864 * tmp170)); |
||
2131 | } |
||
2132 | { |
||
2133 | fftw_real tmp71; |
||
2134 | fftw_real tmp85; |
||
2135 | fftw_real tmp84; |
||
2136 | fftw_real tmp86; |
||
2137 | ASSERT_ALIGNED_DOUBLE(); |
||
2138 | { |
||
2139 | fftw_real tmp47; |
||
2140 | fftw_real tmp70; |
||
2141 | fftw_real tmp74; |
||
2142 | fftw_real tmp83; |
||
2143 | ASSERT_ALIGNED_DOUBLE(); |
||
2144 | tmp47 = tmp35 + tmp46; |
||
2145 | tmp70 = tmp58 + tmp69; |
||
2146 | tmp71 = tmp47 + tmp70; |
||
2147 | tmp85 = tmp47 - tmp70; |
||
2148 | tmp74 = tmp72 + tmp73; |
||
2149 | tmp83 = tmp77 + tmp82; |
||
2150 | tmp84 = tmp74 + tmp83; |
||
2151 | tmp86 = tmp83 - tmp74; |
||
2152 | } |
||
2153 | X[iostride] = (K1_990369453 * tmp71) - (K196034280 * tmp84); |
||
2154 | X[17 * iostride] = -((K196034280 * tmp71) + (K1_990369453 * tmp84)); |
||
2155 | X[9 * iostride] = (K1_268786568 * tmp85) - (K1_546020906 * tmp86); |
||
2156 | X[25 * iostride] = -((K1_546020906 * tmp85) + (K1_268786568 * tmp86)); |
||
2157 | } |
||
2158 | { |
||
2159 | fftw_real tmp89; |
||
2160 | fftw_real tmp93; |
||
2161 | fftw_real tmp92; |
||
2162 | fftw_real tmp94; |
||
2163 | ASSERT_ALIGNED_DOUBLE(); |
||
2164 | { |
||
2165 | fftw_real tmp87; |
||
2166 | fftw_real tmp88; |
||
2167 | fftw_real tmp90; |
||
2168 | fftw_real tmp91; |
||
2169 | ASSERT_ALIGNED_DOUBLE(); |
||
2170 | tmp87 = tmp35 - tmp46; |
||
2171 | tmp88 = tmp73 - tmp72; |
||
2172 | tmp89 = tmp87 + tmp88; |
||
2173 | tmp93 = tmp87 - tmp88; |
||
2174 | tmp90 = tmp58 - tmp69; |
||
2175 | tmp91 = tmp82 - tmp77; |
||
2176 | tmp92 = tmp90 + tmp91; |
||
2177 | tmp94 = tmp91 - tmp90; |
||
2178 | } |
||
2179 | X[5 * iostride] = (K1_763842528 * tmp89) - (K942793473 * tmp92); |
||
2180 | X[21 * iostride] = -((K942793473 * tmp89) + (K1_763842528 * tmp92)); |
||
2181 | X[13 * iostride] = (K580569354 * tmp93) - (K1_913880671 * tmp94); |
||
2182 | X[29 * iostride] = -((K1_913880671 * tmp93) + (K580569354 * tmp94)); |
||
2183 | } |
||
2184 | { |
||
2185 | fftw_real tmp105; |
||
2186 | fftw_real tmp113; |
||
2187 | fftw_real tmp112; |
||
2188 | fftw_real tmp114; |
||
2189 | ASSERT_ALIGNED_DOUBLE(); |
||
2190 | { |
||
2191 | fftw_real tmp97; |
||
2192 | fftw_real tmp104; |
||
2193 | fftw_real tmp108; |
||
2194 | fftw_real tmp111; |
||
2195 | ASSERT_ALIGNED_DOUBLE(); |
||
2196 | tmp97 = tmp95 - tmp96; |
||
2197 | tmp104 = tmp100 + tmp103; |
||
2198 | tmp105 = tmp97 + tmp104; |
||
2199 | tmp113 = tmp97 - tmp104; |
||
2200 | tmp108 = tmp106 - tmp107; |
||
2201 | tmp111 = tmp109 + tmp110; |
||
2202 | tmp112 = tmp108 + tmp111; |
||
2203 | tmp114 = tmp111 - tmp108; |
||
2204 | } |
||
2205 | X[3 * iostride] = (K1_913880671 * tmp105) - (K580569354 * tmp112); |
||
2206 | X[19 * iostride] = -((K580569354 * tmp105) + (K1_913880671 * tmp112)); |
||
2207 | X[11 * iostride] = (K942793473 * tmp113) - (K1_763842528 * tmp114); |
||
2208 | X[27 * iostride] = -((K1_763842528 * tmp113) + (K942793473 * tmp114)); |
||
2209 | } |
||
2210 | { |
||
2211 | fftw_real tmp117; |
||
2212 | fftw_real tmp121; |
||
2213 | fftw_real tmp120; |
||
2214 | fftw_real tmp122; |
||
2215 | ASSERT_ALIGNED_DOUBLE(); |
||
2216 | { |
||
2217 | fftw_real tmp115; |
||
2218 | fftw_real tmp116; |
||
2219 | fftw_real tmp118; |
||
2220 | fftw_real tmp119; |
||
2221 | ASSERT_ALIGNED_DOUBLE(); |
||
2222 | tmp115 = tmp95 + tmp96; |
||
2223 | tmp116 = tmp106 + tmp107; |
||
2224 | tmp117 = tmp115 - tmp116; |
||
2225 | tmp121 = tmp115 + tmp116; |
||
2226 | tmp118 = tmp100 - tmp103; |
||
2227 | tmp119 = tmp110 - tmp109; |
||
2228 | tmp120 = tmp118 + tmp119; |
||
2229 | tmp122 = tmp119 - tmp118; |
||
2230 | } |
||
2231 | X[7 * iostride] = (K1_546020906 * tmp117) - (K1_268786568 * tmp120); |
||
2232 | X[23 * iostride] = -((K1_268786568 * tmp117) + (K1_546020906 * tmp120)); |
||
2233 | X[15 * iostride] = (K196034280 * tmp121) - (K1_990369453 * tmp122); |
||
2234 | X[31 * iostride] = -((K1_990369453 * tmp121) + (K196034280 * tmp122)); |
||
2235 | } |
||
2236 | { |
||
2237 | fftw_real tmp139; |
||
2238 | fftw_real tmp149; |
||
2239 | fftw_real tmp148; |
||
2240 | fftw_real tmp150; |
||
2241 | ASSERT_ALIGNED_DOUBLE(); |
||
2242 | { |
||
2243 | fftw_real tmp127; |
||
2244 | fftw_real tmp138; |
||
2245 | fftw_real tmp142; |
||
2246 | fftw_real tmp147; |
||
2247 | ASSERT_ALIGNED_DOUBLE(); |
||
2248 | tmp127 = tmp123 + tmp126; |
||
2249 | tmp138 = K707106781 * (tmp132 + tmp137); |
||
2250 | tmp139 = tmp127 + tmp138; |
||
2251 | tmp149 = tmp127 - tmp138; |
||
2252 | tmp142 = K707106781 * (tmp140 + tmp141); |
||
2253 | tmp147 = tmp143 + tmp146; |
||
2254 | tmp148 = tmp142 + tmp147; |
||
2255 | tmp150 = tmp147 - tmp142; |
||
2256 | } |
||
2257 | X[2 * iostride] = (K1_961570560 * tmp139) - (K390180644 * tmp148); |
||
2258 | X[18 * iostride] = -((K390180644 * tmp139) + (K1_961570560 * tmp148)); |
||
2259 | X[10 * iostride] = (K1_111140466 * tmp149) - (K1_662939224 * tmp150); |
||
2260 | X[26 * iostride] = -((K1_662939224 * tmp149) + (K1_111140466 * tmp150)); |
||
2261 | } |
||
2262 | { |
||
2263 | fftw_real tmp153; |
||
2264 | fftw_real tmp157; |
||
2265 | fftw_real tmp156; |
||
2266 | fftw_real tmp158; |
||
2267 | ASSERT_ALIGNED_DOUBLE(); |
||
2268 | { |
||
2269 | fftw_real tmp151; |
||
2270 | fftw_real tmp152; |
||
2271 | fftw_real tmp154; |
||
2272 | fftw_real tmp155; |
||
2273 | ASSERT_ALIGNED_DOUBLE(); |
||
2274 | tmp151 = tmp123 - tmp126; |
||
2275 | tmp152 = K707106781 * (tmp141 - tmp140); |
||
2276 | tmp153 = tmp151 + tmp152; |
||
2277 | tmp157 = tmp151 - tmp152; |
||
2278 | tmp154 = K707106781 * (tmp132 - tmp137); |
||
2279 | tmp155 = tmp146 - tmp143; |
||
2280 | tmp156 = tmp154 + tmp155; |
||
2281 | tmp158 = tmp155 - tmp154; |
||
2282 | } |
||
2283 | X[6 * iostride] = (K1_662939224 * tmp153) - (K1_111140466 * tmp156); |
||
2284 | X[22 * iostride] = -((K1_111140466 * tmp153) + (K1_662939224 * tmp156)); |
||
2285 | X[14 * iostride] = (K390180644 * tmp157) - (K1_961570560 * tmp158); |
||
2286 | X[30 * iostride] = -((K1_961570560 * tmp157) + (K390180644 * tmp158)); |
||
2287 | } |
||
2288 | } |
||
2289 | } |
||
2290 | |||
/*
 * Twiddle index table for the radix-32 hc2hc backward codelet.
 *
 * Holds the consecutive integers 1..31 (31 entries); the array length is
 * taken from the initializer.  It is referenced by the codelet descriptor
 * fftw_hc2hc_backward_32_desc.
 *
 * NOTE(review): presumably entry k names the twiddle factor stored at
 * W[k - 1] in the codelet -- confirm against the twiddle-generation code.
 */
static const int twiddle_order[] =
{
     1, 2, 3, 4, 5, 6, 7, 8,
     9, 10, 11, 12, 13, 14, 15, 16,
     17, 18, 19, 20, 21, 22, 23, 24,
     25, 26, 27, 28, 29, 30, 31
};
||
2293 | fftw_codelet_desc fftw_hc2hc_backward_32_desc = |
||
2294 | { |
||
2295 | "fftw_hc2hc_backward_32", |
||
2296 | (void (*)()) fftw_hc2hc_backward_32, |
||
2297 | 32, |
||
2298 | FFTW_BACKWARD, |
||
2299 | FFTW_HC2HC, |
||
2300 | 718, |
||
2301 | 31, |
||
2302 | twiddle_order, |
||
2303 | }; |