changed reading hint
[gromacs/adressmacs.git] / src / fftw / fni_16.c
blobd71c91f0a8027f0b71bf367c25e458128ba4b372
1 /*
2 * Copyright (c) 1997-1999 Massachusetts Institute of Technology
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License as published by
6 * the Free Software Foundation; either version 2 of the License, or
7 * (at your option) any later version.
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write to the Free Software
16 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
20 /* This file was automatically generated --- DO NOT EDIT */
21 /* Generated on Tue May 18 13:54:55 EDT 1999 */
23 #include <fftw-int.h>
24 #include <fftw.h>
26 /* Generated by: ./genfft -magic-alignment-check -magic-twiddle-load-all -magic-variables 4 -magic-loopi -notwiddleinv 16 */
29 * This function contains 144 FP additions, 24 FP multiplications,
30 * (or, 136 additions, 16 multiplications, 8 fused multiply/add),
31 * 46 stack variables, and 64 memory accesses
33 static const fftw_real K382683432 = FFTW_KONST(+0.382683432365089771728459984030398866761344562);
34 static const fftw_real K923879532 = FFTW_KONST(+0.923879532511286756128183189396788286822416626);
35 static const fftw_real K707106781 = FFTW_KONST(+0.707106781186547524400844362104849039284835938);
38 * Generator Id's :
39 * $Id$
40 * $Id$
41 * $Id$
44 void fftwi_no_twiddle_16(const fftw_complex *input, fftw_complex *output, int istride, int ostride)
46 fftw_real tmp7;
47 fftw_real tmp129;
48 fftw_real tmp38;
49 fftw_real tmp115;
50 fftw_real tmp49;
51 fftw_real tmp95;
52 fftw_real tmp83;
53 fftw_real tmp105;
54 fftw_real tmp29;
55 fftw_real tmp123;
56 fftw_real tmp73;
57 fftw_real tmp101;
58 fftw_real tmp78;
59 fftw_real tmp102;
60 fftw_real tmp126;
61 fftw_real tmp141;
62 fftw_real tmp14;
63 fftw_real tmp116;
64 fftw_real tmp45;
65 fftw_real tmp130;
66 fftw_real tmp52;
67 fftw_real tmp84;
68 fftw_real tmp55;
69 fftw_real tmp85;
70 fftw_real tmp22;
71 fftw_real tmp118;
72 fftw_real tmp62;
73 fftw_real tmp98;
74 fftw_real tmp67;
75 fftw_real tmp99;
76 fftw_real tmp121;
77 fftw_real tmp140;
78 ASSERT_ALIGNED_DOUBLE();
80 fftw_real tmp3;
81 fftw_real tmp81;
82 fftw_real tmp34;
83 fftw_real tmp48;
84 fftw_real tmp6;
85 fftw_real tmp47;
86 fftw_real tmp37;
87 fftw_real tmp82;
88 ASSERT_ALIGNED_DOUBLE();
90 fftw_real tmp1;
91 fftw_real tmp2;
92 fftw_real tmp32;
93 fftw_real tmp33;
94 ASSERT_ALIGNED_DOUBLE();
95 tmp1 = c_re(input[0]);
96 tmp2 = c_re(input[8 * istride]);
97 tmp3 = tmp1 + tmp2;
98 tmp81 = tmp1 - tmp2;
99 tmp32 = c_im(input[0]);
100 tmp33 = c_im(input[8 * istride]);
101 tmp34 = tmp32 + tmp33;
102 tmp48 = tmp32 - tmp33;
105 fftw_real tmp4;
106 fftw_real tmp5;
107 fftw_real tmp35;
108 fftw_real tmp36;
109 ASSERT_ALIGNED_DOUBLE();
110 tmp4 = c_re(input[4 * istride]);
111 tmp5 = c_re(input[12 * istride]);
112 tmp6 = tmp4 + tmp5;
113 tmp47 = tmp4 - tmp5;
114 tmp35 = c_im(input[4 * istride]);
115 tmp36 = c_im(input[12 * istride]);
116 tmp37 = tmp35 + tmp36;
117 tmp82 = tmp35 - tmp36;
119 tmp7 = tmp3 + tmp6;
120 tmp129 = tmp3 - tmp6;
121 tmp38 = tmp34 + tmp37;
122 tmp115 = tmp34 - tmp37;
123 tmp49 = tmp47 + tmp48;
124 tmp95 = tmp48 - tmp47;
125 tmp83 = tmp81 - tmp82;
126 tmp105 = tmp81 + tmp82;
129 fftw_real tmp25;
130 fftw_real tmp74;
131 fftw_real tmp72;
132 fftw_real tmp124;
133 fftw_real tmp28;
134 fftw_real tmp69;
135 fftw_real tmp77;
136 fftw_real tmp125;
137 ASSERT_ALIGNED_DOUBLE();
139 fftw_real tmp23;
140 fftw_real tmp24;
141 fftw_real tmp70;
142 fftw_real tmp71;
143 ASSERT_ALIGNED_DOUBLE();
144 tmp23 = c_re(input[15 * istride]);
145 tmp24 = c_re(input[7 * istride]);
146 tmp25 = tmp23 + tmp24;
147 tmp74 = tmp23 - tmp24;
148 tmp70 = c_im(input[15 * istride]);
149 tmp71 = c_im(input[7 * istride]);
150 tmp72 = tmp70 - tmp71;
151 tmp124 = tmp70 + tmp71;
154 fftw_real tmp26;
155 fftw_real tmp27;
156 fftw_real tmp75;
157 fftw_real tmp76;
158 ASSERT_ALIGNED_DOUBLE();
159 tmp26 = c_re(input[3 * istride]);
160 tmp27 = c_re(input[11 * istride]);
161 tmp28 = tmp26 + tmp27;
162 tmp69 = tmp26 - tmp27;
163 tmp75 = c_im(input[3 * istride]);
164 tmp76 = c_im(input[11 * istride]);
165 tmp77 = tmp75 - tmp76;
166 tmp125 = tmp75 + tmp76;
168 tmp29 = tmp25 + tmp28;
169 tmp123 = tmp25 - tmp28;
170 tmp73 = tmp69 + tmp72;
171 tmp101 = tmp72 - tmp69;
172 tmp78 = tmp74 - tmp77;
173 tmp102 = tmp74 + tmp77;
174 tmp126 = tmp124 - tmp125;
175 tmp141 = tmp124 + tmp125;
178 fftw_real tmp10;
179 fftw_real tmp50;
180 fftw_real tmp41;
181 fftw_real tmp51;
182 fftw_real tmp13;
183 fftw_real tmp54;
184 fftw_real tmp44;
185 fftw_real tmp53;
186 ASSERT_ALIGNED_DOUBLE();
188 fftw_real tmp8;
189 fftw_real tmp9;
190 fftw_real tmp39;
191 fftw_real tmp40;
192 ASSERT_ALIGNED_DOUBLE();
193 tmp8 = c_re(input[2 * istride]);
194 tmp9 = c_re(input[10 * istride]);
195 tmp10 = tmp8 + tmp9;
196 tmp50 = tmp8 - tmp9;
197 tmp39 = c_im(input[2 * istride]);
198 tmp40 = c_im(input[10 * istride]);
199 tmp41 = tmp39 + tmp40;
200 tmp51 = tmp39 - tmp40;
203 fftw_real tmp11;
204 fftw_real tmp12;
205 fftw_real tmp42;
206 fftw_real tmp43;
207 ASSERT_ALIGNED_DOUBLE();
208 tmp11 = c_re(input[14 * istride]);
209 tmp12 = c_re(input[6 * istride]);
210 tmp13 = tmp11 + tmp12;
211 tmp54 = tmp11 - tmp12;
212 tmp42 = c_im(input[14 * istride]);
213 tmp43 = c_im(input[6 * istride]);
214 tmp44 = tmp42 + tmp43;
215 tmp53 = tmp42 - tmp43;
217 tmp14 = tmp10 + tmp13;
218 tmp116 = tmp10 - tmp13;
219 tmp45 = tmp41 + tmp44;
220 tmp130 = tmp44 - tmp41;
221 tmp52 = tmp50 + tmp51;
222 tmp84 = tmp50 - tmp51;
223 tmp55 = tmp53 - tmp54;
224 tmp85 = tmp54 + tmp53;
227 fftw_real tmp18;
228 fftw_real tmp63;
229 fftw_real tmp61;
230 fftw_real tmp119;
231 fftw_real tmp21;
232 fftw_real tmp58;
233 fftw_real tmp66;
234 fftw_real tmp120;
235 ASSERT_ALIGNED_DOUBLE();
237 fftw_real tmp16;
238 fftw_real tmp17;
239 fftw_real tmp59;
240 fftw_real tmp60;
241 ASSERT_ALIGNED_DOUBLE();
242 tmp16 = c_re(input[istride]);
243 tmp17 = c_re(input[9 * istride]);
244 tmp18 = tmp16 + tmp17;
245 tmp63 = tmp16 - tmp17;
246 tmp59 = c_im(input[istride]);
247 tmp60 = c_im(input[9 * istride]);
248 tmp61 = tmp59 - tmp60;
249 tmp119 = tmp59 + tmp60;
252 fftw_real tmp19;
253 fftw_real tmp20;
254 fftw_real tmp64;
255 fftw_real tmp65;
256 ASSERT_ALIGNED_DOUBLE();
257 tmp19 = c_re(input[5 * istride]);
258 tmp20 = c_re(input[13 * istride]);
259 tmp21 = tmp19 + tmp20;
260 tmp58 = tmp19 - tmp20;
261 tmp64 = c_im(input[5 * istride]);
262 tmp65 = c_im(input[13 * istride]);
263 tmp66 = tmp64 - tmp65;
264 tmp120 = tmp64 + tmp65;
266 tmp22 = tmp18 + tmp21;
267 tmp118 = tmp18 - tmp21;
268 tmp62 = tmp58 + tmp61;
269 tmp98 = tmp61 - tmp58;
270 tmp67 = tmp63 - tmp66;
271 tmp99 = tmp63 + tmp66;
272 tmp121 = tmp119 - tmp120;
273 tmp140 = tmp119 + tmp120;
276 fftw_real tmp15;
277 fftw_real tmp30;
278 fftw_real tmp31;
279 fftw_real tmp46;
280 ASSERT_ALIGNED_DOUBLE();
281 tmp15 = tmp7 + tmp14;
282 tmp30 = tmp22 + tmp29;
283 c_re(output[8 * ostride]) = tmp15 - tmp30;
284 c_re(output[0]) = tmp15 + tmp30;
285 tmp31 = tmp22 - tmp29;
286 tmp46 = tmp38 - tmp45;
287 c_im(output[4 * ostride]) = tmp31 + tmp46;
288 c_im(output[12 * ostride]) = tmp46 - tmp31;
291 fftw_real tmp139;
292 fftw_real tmp142;
293 fftw_real tmp143;
294 fftw_real tmp144;
295 ASSERT_ALIGNED_DOUBLE();
296 tmp139 = tmp38 + tmp45;
297 tmp142 = tmp140 + tmp141;
298 c_im(output[8 * ostride]) = tmp139 - tmp142;
299 c_im(output[0]) = tmp139 + tmp142;
300 tmp143 = tmp7 - tmp14;
301 tmp144 = tmp141 - tmp140;
302 c_re(output[12 * ostride]) = tmp143 - tmp144;
303 c_re(output[4 * ostride]) = tmp143 + tmp144;
306 fftw_real tmp117;
307 fftw_real tmp131;
308 fftw_real tmp128;
309 fftw_real tmp132;
310 fftw_real tmp122;
311 fftw_real tmp127;
312 ASSERT_ALIGNED_DOUBLE();
313 tmp117 = tmp115 - tmp116;
314 tmp131 = tmp129 + tmp130;
315 tmp122 = tmp118 - tmp121;
316 tmp127 = tmp123 + tmp126;
317 tmp128 = K707106781 * (tmp122 - tmp127);
318 tmp132 = K707106781 * (tmp122 + tmp127);
319 c_im(output[14 * ostride]) = tmp117 - tmp128;
320 c_im(output[6 * ostride]) = tmp117 + tmp128;
321 c_re(output[10 * ostride]) = tmp131 - tmp132;
322 c_re(output[2 * ostride]) = tmp131 + tmp132;
325 fftw_real tmp133;
326 fftw_real tmp137;
327 fftw_real tmp136;
328 fftw_real tmp138;
329 fftw_real tmp134;
330 fftw_real tmp135;
331 ASSERT_ALIGNED_DOUBLE();
332 tmp133 = tmp116 + tmp115;
333 tmp137 = tmp129 - tmp130;
334 tmp134 = tmp118 + tmp121;
335 tmp135 = tmp126 - tmp123;
336 tmp136 = K707106781 * (tmp134 + tmp135);
337 tmp138 = K707106781 * (tmp135 - tmp134);
338 c_im(output[10 * ostride]) = tmp133 - tmp136;
339 c_im(output[2 * ostride]) = tmp133 + tmp136;
340 c_re(output[14 * ostride]) = tmp137 - tmp138;
341 c_re(output[6 * ostride]) = tmp137 + tmp138;
344 fftw_real tmp57;
345 fftw_real tmp89;
346 fftw_real tmp92;
347 fftw_real tmp94;
348 fftw_real tmp87;
349 fftw_real tmp93;
350 fftw_real tmp80;
351 fftw_real tmp88;
352 ASSERT_ALIGNED_DOUBLE();
354 fftw_real tmp56;
355 fftw_real tmp90;
356 fftw_real tmp91;
357 fftw_real tmp86;
358 fftw_real tmp68;
359 fftw_real tmp79;
360 ASSERT_ALIGNED_DOUBLE();
361 tmp56 = K707106781 * (tmp52 + tmp55);
362 tmp57 = tmp49 + tmp56;
363 tmp89 = tmp49 - tmp56;
364 tmp90 = (K923879532 * tmp67) - (K382683432 * tmp62);
365 tmp91 = (K382683432 * tmp73) + (K923879532 * tmp78);
366 tmp92 = tmp90 - tmp91;
367 tmp94 = tmp90 + tmp91;
368 tmp86 = K707106781 * (tmp84 + tmp85);
369 tmp87 = tmp83 - tmp86;
370 tmp93 = tmp83 + tmp86;
371 tmp68 = (K923879532 * tmp62) + (K382683432 * tmp67);
372 tmp79 = (K923879532 * tmp73) - (K382683432 * tmp78);
373 tmp80 = tmp68 + tmp79;
374 tmp88 = tmp79 - tmp68;
376 c_im(output[9 * ostride]) = tmp57 - tmp80;
377 c_im(output[ostride]) = tmp57 + tmp80;
378 c_re(output[13 * ostride]) = tmp87 - tmp88;
379 c_re(output[5 * ostride]) = tmp87 + tmp88;
380 c_im(output[13 * ostride]) = tmp89 - tmp92;
381 c_im(output[5 * ostride]) = tmp89 + tmp92;
382 c_re(output[9 * ostride]) = tmp93 - tmp94;
383 c_re(output[ostride]) = tmp93 + tmp94;
386 fftw_real tmp97;
387 fftw_real tmp109;
388 fftw_real tmp112;
389 fftw_real tmp114;
390 fftw_real tmp107;
391 fftw_real tmp113;
392 fftw_real tmp104;
393 fftw_real tmp108;
394 ASSERT_ALIGNED_DOUBLE();
396 fftw_real tmp96;
397 fftw_real tmp110;
398 fftw_real tmp111;
399 fftw_real tmp106;
400 fftw_real tmp100;
401 fftw_real tmp103;
402 ASSERT_ALIGNED_DOUBLE();
403 tmp96 = K707106781 * (tmp84 - tmp85);
404 tmp97 = tmp95 + tmp96;
405 tmp109 = tmp95 - tmp96;
406 tmp110 = (K382683432 * tmp99) - (K923879532 * tmp98);
407 tmp111 = (K923879532 * tmp101) + (K382683432 * tmp102);
408 tmp112 = tmp110 - tmp111;
409 tmp114 = tmp110 + tmp111;
410 tmp106 = K707106781 * (tmp55 - tmp52);
411 tmp107 = tmp105 - tmp106;
412 tmp113 = tmp105 + tmp106;
413 tmp100 = (K382683432 * tmp98) + (K923879532 * tmp99);
414 tmp103 = (K382683432 * tmp101) - (K923879532 * tmp102);
415 tmp104 = tmp100 + tmp103;
416 tmp108 = tmp103 - tmp100;
418 c_im(output[11 * ostride]) = tmp97 - tmp104;
419 c_im(output[3 * ostride]) = tmp97 + tmp104;
420 c_re(output[15 * ostride]) = tmp107 - tmp108;
421 c_re(output[7 * ostride]) = tmp107 + tmp108;
422 c_im(output[15 * ostride]) = tmp109 - tmp112;
423 c_im(output[7 * ostride]) = tmp109 + tmp112;
424 c_re(output[11 * ostride]) = tmp113 - tmp114;
425 c_re(output[3 * ostride]) = tmp113 + tmp114;
429 fftw_codelet_desc fftwi_no_twiddle_16_desc =
431 "fftwi_no_twiddle_16",
432 (void (*)()) fftwi_no_twiddle_16,
434 FFTW_BACKWARD,
435 FFTW_NOTW,
436 364,
438 (const int *) 0,