changed reading hint
[gromacs/adressmacs.git] / src / fftw / fhf_10.c
blob1eff354cdd64880a041f92e7883ec05dd737b781
1 /*
2 * Copyright (c) 1997-1999 Massachusetts Institute of Technology
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License as published by
6 * the Free Software Foundation; either version 2 of the License, or
7 * (at your option) any later version.
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write to the Free Software
16 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
20 /* This file was automatically generated --- DO NOT EDIT */
21 /* Generated on Tue May 18 13:55:36 EDT 1999 */
23 #include <fftw-int.h>
24 #include <fftw.h>
26 /* Generated by: ./genfft -magic-alignment-check -magic-twiddle-load-all -magic-variables 4 -magic-loopi -hc2hc-forward 10 */
29 * This function contains 168 FP additions, 84 FP multiplications,
30 * (or, 126 additions, 42 multiplications, 42 fused multiply/add),
31 * 43 stack variables, and 80 memory accesses
/*
 * Numeric constants used by the butterflies in this file.
 *   K587785252 is numerically equal to sin(pi / 5).
 *   K951056516 is numerically equal to sin(2 * pi / 5).
 *   K250000000 is exactly 1 / 4.
 *   K559016994 is numerically equal to sqrt(5) / 4.
 * FFTW_KONST is defined outside this file.
 * NOTE(review): it presumably adapts the literal to the fftw_real
 * precision - confirm in fftw-int.h.
 */
33 static const fftw_real K587785252 = FFTW_KONST(+0.587785252292473129168705954639072768597652438);
34 static const fftw_real K951056516 = FFTW_KONST(+0.951056516295153572116439333379382143405698634);
35 static const fftw_real K250000000 = FFTW_KONST(+0.250000000000000000000000000000000000000000000);
36 static const fftw_real K559016994 = FFTW_KONST(+0.559016994374947424102293417182819058860154590);
39 * Generator Id's :
40 * $Id$
41 * $Id$
42 * $Id$
/*
 * fftw_hc2hc_forward_10: in-place pass over the real array A, made of three
 * code paths: a twiddle-free first section, a twiddled loop, and an optional
 * twiddle-free last section.
 *
 * A        - data, read and overwritten in place. It is accessed through
 *            X = A (offsets 0 .. 9 * iostride) and
 *            Y = A + 10 * iostride (offsets 0 .. -9 * iostride).
 * W        - twiddle factors. Each loop iteration reads W[0] .. W[8] through
 *            c_re / c_im and then advances W by 9.
 * iostride - element distance between consecutive taps of one butterfly.
 * m        - loop bound: the loop runs for i = 2, 4, ... while i < m, and the
 *            last section runs only when the loop ends with i == m.
 * dist     - after the first section and after every loop iteration X moves
 *            forward by dist and Y moves backward by dist.
 *
 * In every section all inputs are loaded into temporaries before the first
 * store, which is what allows the input slots to be reused as output slots.
 *
 * NOTE(review): the function name and the genfft options recorded in the
 * file header suggest this is the radix-10 forward half-complex pass of
 * FFTW 2 - confirm against the FFTW documentation.
 * NOTE(review): the embedded line numbers skip values (45 to 47, 51 to 53,
 * and so on), so brace-only lines appear to be absent from this listing;
 * compare with the upstream file before compiling.
 */
45 void fftw_hc2hc_forward_10(fftw_real *A, const fftw_complex *W, int iostride, int m, int dist)
47 int i;
48 fftw_real *X;
49 fftw_real *Y;
/* X walks the block from its start, Y from ten strides further on. */
50 X = A;
51 Y = A + (10 * iostride);
/*
 * First section (no twiddle factors): reads the ten values X[0] ..
 * X[9 * iostride], writes X[0] .. X[5 * iostride] and Y[-iostride] ..
 * Y[-4 * iostride].
 */
53 fftw_real tmp170;
54 fftw_real tmp181;
55 fftw_real tmp162;
56 fftw_real tmp175;
57 fftw_real tmp165;
58 fftw_real tmp176;
59 fftw_real tmp166;
60 fftw_real tmp183;
61 fftw_real tmp155;
62 fftw_real tmp178;
63 fftw_real tmp158;
64 fftw_real tmp179;
65 fftw_real tmp159;
66 fftw_real tmp182;
67 fftw_real tmp168;
68 fftw_real tmp169;
69 ASSERT_ALIGNED_DOUBLE();
/* Inputs five strides apart are combined into one difference and one sum. */
70 tmp168 = X[0];
71 tmp169 = X[5 * iostride];
72 tmp170 = tmp168 - tmp169;
73 tmp181 = tmp168 + tmp169;
75 fftw_real tmp160;
76 fftw_real tmp161;
77 fftw_real tmp163;
78 fftw_real tmp164;
79 ASSERT_ALIGNED_DOUBLE();
80 tmp160 = X[4 * iostride];
81 tmp161 = X[9 * iostride];
82 tmp162 = tmp160 - tmp161;
83 tmp175 = tmp160 + tmp161;
84 tmp163 = X[6 * iostride];
85 tmp164 = X[iostride];
86 tmp165 = tmp163 - tmp164;
87 tmp176 = tmp163 + tmp164;
89 tmp166 = tmp162 + tmp165;
90 tmp183 = tmp175 + tmp176;
92 fftw_real tmp153;
93 fftw_real tmp154;
94 fftw_real tmp156;
95 fftw_real tmp157;
96 ASSERT_ALIGNED_DOUBLE();
97 tmp153 = X[2 * iostride];
98 tmp154 = X[7 * iostride];
99 tmp155 = tmp153 - tmp154;
100 tmp178 = tmp153 + tmp154;
101 tmp156 = X[8 * iostride];
102 tmp157 = X[3 * iostride];
103 tmp158 = tmp156 - tmp157;
104 tmp179 = tmp156 + tmp157;
106 tmp159 = tmp155 + tmp158;
107 tmp182 = tmp178 + tmp179;
/*
 * Stores to X: the odd slots (1, 3, 5) are built from the pairwise
 * differences, the even slots (0, 2, 4) from the pairwise sums.
 */
109 fftw_real tmp167;
110 fftw_real tmp171;
111 fftw_real tmp172;
112 fftw_real tmp186;
113 fftw_real tmp184;
114 fftw_real tmp185;
115 ASSERT_ALIGNED_DOUBLE();
116 tmp167 = K559016994 * (tmp159 - tmp166);
117 tmp171 = tmp159 + tmp166;
118 tmp172 = tmp170 - (K250000000 * tmp171);
119 X[iostride] = tmp167 + tmp172;
120 X[3 * iostride] = tmp172 - tmp167;
121 X[5 * iostride] = tmp170 + tmp171;
122 tmp186 = K559016994 * (tmp182 - tmp183);
123 tmp184 = tmp182 + tmp183;
124 tmp185 = tmp181 - (K250000000 * tmp184);
125 X[2 * iostride] = tmp185 - tmp186;
126 X[4 * iostride] = tmp186 + tmp185;
127 X[0] = tmp181 + tmp184;
/*
 * Stores to Y: slots -1 and -3 come from the pairwise differences,
 * slots -2 and -4 from the pairwise sums.
 */
130 fftw_real tmp173;
131 fftw_real tmp174;
132 fftw_real tmp177;
133 fftw_real tmp180;
134 ASSERT_ALIGNED_DOUBLE();
135 tmp173 = tmp155 - tmp158;
136 tmp174 = tmp162 - tmp165;
137 Y[-iostride] = -((K951056516 * tmp173) + (K587785252 * tmp174));
138 Y[-3 * iostride] = (K587785252 * tmp173) - (K951056516 * tmp174);
139 tmp177 = tmp175 - tmp176;
140 tmp180 = tmp178 - tmp179;
141 Y[-2 * iostride] = (K951056516 * tmp177) - (K587785252 * tmp180);
142 Y[-4 * iostride] = (K951056516 * tmp180) + (K587785252 * tmp177);
/* Step both cursors toward each other before entering the twiddled loop. */
145 X = X + dist;
146 Y = Y - dist;
/*
 * Twiddled loop. Per iteration: for k = 1 .. 9 the pair
 * (X[k * iostride], Y[(k - 9) * iostride]) is multiplied by W[k - 1] as a
 * complex product (re = wr * x - wi * y, im = wi * x + wr * y); the pair
 * (X[0], Y[-9 * iostride]) is used as is. All twenty slots are then
 * rewritten. The loop header advances X by dist, Y by -dist and W by 9.
 */
147 for (i = 2; i < m; i = i + 2, X = X + dist, Y = Y - dist, W = W + 9) {
148 fftw_real tmp39;
149 fftw_real tmp87;
150 fftw_real tmp132;
151 fftw_real tmp144;
152 fftw_real tmp73;
153 fftw_real tmp84;
154 fftw_real tmp85;
155 fftw_real tmp91;
156 fftw_real tmp92;
157 fftw_real tmp93;
158 fftw_real tmp100;
159 fftw_real tmp103;
160 fftw_real tmp128;
161 fftw_real tmp121;
162 fftw_real tmp122;
163 fftw_real tmp142;
164 fftw_real tmp50;
165 fftw_real tmp61;
166 fftw_real tmp62;
167 fftw_real tmp88;
168 fftw_real tmp89;
169 fftw_real tmp90;
170 fftw_real tmp107;
171 fftw_real tmp110;
172 fftw_real tmp127;
173 fftw_real tmp118;
174 fftw_real tmp119;
175 fftw_real tmp141;
176 ASSERT_ALIGNED_DOUBLE();
/* Untwiddled pair (X[0], Y[-9 * iostride]) combined with the k = 5 product. */
178 fftw_real tmp33;
179 fftw_real tmp131;
180 fftw_real tmp38;
181 fftw_real tmp130;
182 ASSERT_ALIGNED_DOUBLE();
183 tmp33 = X[0];
184 tmp131 = Y[-9 * iostride];
186 fftw_real tmp35;
187 fftw_real tmp37;
188 fftw_real tmp34;
189 fftw_real tmp36;
190 ASSERT_ALIGNED_DOUBLE();
191 tmp35 = X[5 * iostride];
192 tmp37 = Y[-4 * iostride];
193 tmp34 = c_re(W[4]);
194 tmp36 = c_im(W[4]);
195 tmp38 = (tmp34 * tmp35) - (tmp36 * tmp37);
196 tmp130 = (tmp36 * tmp35) + (tmp34 * tmp37);
198 tmp39 = tmp33 - tmp38;
199 tmp87 = tmp33 + tmp38;
200 tmp132 = tmp130 + tmp131;
201 tmp144 = tmp131 - tmp130;
/* Twiddled products for k = 4, 1, 9 and 6, then their sums and differences. */
204 fftw_real tmp67;
205 fftw_real tmp98;
206 fftw_real tmp83;
207 fftw_real tmp102;
208 fftw_real tmp72;
209 fftw_real tmp99;
210 fftw_real tmp78;
211 fftw_real tmp101;
212 ASSERT_ALIGNED_DOUBLE();
214 fftw_real tmp64;
215 fftw_real tmp66;
216 fftw_real tmp63;
217 fftw_real tmp65;
218 ASSERT_ALIGNED_DOUBLE();
219 tmp64 = X[4 * iostride];
220 tmp66 = Y[-5 * iostride];
221 tmp63 = c_re(W[3]);
222 tmp65 = c_im(W[3]);
223 tmp67 = (tmp63 * tmp64) - (tmp65 * tmp66);
224 tmp98 = (tmp65 * tmp64) + (tmp63 * tmp66);
227 fftw_real tmp80;
228 fftw_real tmp82;
229 fftw_real tmp79;
230 fftw_real tmp81;
231 ASSERT_ALIGNED_DOUBLE();
232 tmp80 = X[iostride];
233 tmp82 = Y[-8 * iostride];
234 tmp79 = c_re(W[0]);
235 tmp81 = c_im(W[0]);
236 tmp83 = (tmp79 * tmp80) - (tmp81 * tmp82);
237 tmp102 = (tmp81 * tmp80) + (tmp79 * tmp82);
240 fftw_real tmp69;
241 fftw_real tmp71;
242 fftw_real tmp68;
243 fftw_real tmp70;
244 ASSERT_ALIGNED_DOUBLE();
245 tmp69 = X[9 * iostride];
246 tmp71 = Y[0];
247 tmp68 = c_re(W[8]);
248 tmp70 = c_im(W[8]);
249 tmp72 = (tmp68 * tmp69) - (tmp70 * tmp71);
250 tmp99 = (tmp70 * tmp69) + (tmp68 * tmp71);
253 fftw_real tmp75;
254 fftw_real tmp77;
255 fftw_real tmp74;
256 fftw_real tmp76;
257 ASSERT_ALIGNED_DOUBLE();
258 tmp75 = X[6 * iostride];
259 tmp77 = Y[-3 * iostride];
260 tmp74 = c_re(W[5]);
261 tmp76 = c_im(W[5]);
262 tmp78 = (tmp74 * tmp75) - (tmp76 * tmp77);
263 tmp101 = (tmp76 * tmp75) + (tmp74 * tmp77);
265 tmp73 = tmp67 - tmp72;
266 tmp84 = tmp78 - tmp83;
267 tmp85 = tmp73 + tmp84;
268 tmp91 = tmp67 + tmp72;
269 tmp92 = tmp78 + tmp83;
270 tmp93 = tmp91 + tmp92;
271 tmp100 = tmp98 + tmp99;
272 tmp103 = tmp101 + tmp102;
273 tmp128 = tmp100 + tmp103;
274 tmp121 = tmp98 - tmp99;
275 tmp122 = tmp101 - tmp102;
276 tmp142 = tmp121 + tmp122;
/* Twiddled products for k = 2, 3, 7 and 8, then their sums and differences. */
279 fftw_real tmp44;
280 fftw_real tmp105;
281 fftw_real tmp60;
282 fftw_real tmp109;
283 fftw_real tmp49;
284 fftw_real tmp106;
285 fftw_real tmp55;
286 fftw_real tmp108;
287 ASSERT_ALIGNED_DOUBLE();
289 fftw_real tmp41;
290 fftw_real tmp43;
291 fftw_real tmp40;
292 fftw_real tmp42;
293 ASSERT_ALIGNED_DOUBLE();
294 tmp41 = X[2 * iostride];
295 tmp43 = Y[-7 * iostride];
296 tmp40 = c_re(W[1]);
297 tmp42 = c_im(W[1]);
298 tmp44 = (tmp40 * tmp41) - (tmp42 * tmp43);
299 tmp105 = (tmp42 * tmp41) + (tmp40 * tmp43);
302 fftw_real tmp57;
303 fftw_real tmp59;
304 fftw_real tmp56;
305 fftw_real tmp58;
306 ASSERT_ALIGNED_DOUBLE();
307 tmp57 = X[3 * iostride];
308 tmp59 = Y[-6 * iostride];
309 tmp56 = c_re(W[2]);
310 tmp58 = c_im(W[2]);
311 tmp60 = (tmp56 * tmp57) - (tmp58 * tmp59);
312 tmp109 = (tmp58 * tmp57) + (tmp56 * tmp59);
315 fftw_real tmp46;
316 fftw_real tmp48;
317 fftw_real tmp45;
318 fftw_real tmp47;
319 ASSERT_ALIGNED_DOUBLE();
320 tmp46 = X[7 * iostride];
321 tmp48 = Y[-2 * iostride];
322 tmp45 = c_re(W[6]);
323 tmp47 = c_im(W[6]);
324 tmp49 = (tmp45 * tmp46) - (tmp47 * tmp48);
325 tmp106 = (tmp47 * tmp46) + (tmp45 * tmp48);
328 fftw_real tmp52;
329 fftw_real tmp54;
330 fftw_real tmp51;
331 fftw_real tmp53;
332 ASSERT_ALIGNED_DOUBLE();
333 tmp52 = X[8 * iostride];
334 tmp54 = Y[-iostride];
335 tmp51 = c_re(W[7]);
336 tmp53 = c_im(W[7]);
337 tmp55 = (tmp51 * tmp52) - (tmp53 * tmp54);
338 tmp108 = (tmp53 * tmp52) + (tmp51 * tmp54);
340 tmp50 = tmp44 - tmp49;
341 tmp61 = tmp55 - tmp60;
342 tmp62 = tmp50 + tmp61;
343 tmp88 = tmp44 + tmp49;
344 tmp89 = tmp55 + tmp60;
345 tmp90 = tmp88 + tmp89;
346 tmp107 = tmp105 + tmp106;
347 tmp110 = tmp108 + tmp109;
348 tmp127 = tmp107 + tmp110;
349 tmp118 = tmp105 - tmp106;
350 tmp119 = tmp108 - tmp109;
351 tmp141 = tmp118 + tmp119;
/*
 * All loads are done; the four groups below store the twenty results.
 * Group 1 writes Y[-5], Y[-7], X[3], Y[-9], X[1] (times iostride).
 */
354 fftw_real tmp115;
355 fftw_real tmp86;
356 fftw_real tmp116;
357 fftw_real tmp124;
358 fftw_real tmp126;
359 fftw_real tmp120;
360 fftw_real tmp123;
361 fftw_real tmp125;
362 fftw_real tmp117;
363 ASSERT_ALIGNED_DOUBLE();
364 tmp115 = K559016994 * (tmp62 - tmp85);
365 tmp86 = tmp62 + tmp85;
366 tmp116 = tmp39 - (K250000000 * tmp86);
367 tmp120 = tmp118 - tmp119;
368 tmp123 = tmp121 - tmp122;
369 tmp124 = (K951056516 * tmp120) + (K587785252 * tmp123);
370 tmp126 = (K951056516 * tmp123) - (K587785252 * tmp120);
371 Y[-5 * iostride] = tmp39 + tmp86;
372 tmp125 = tmp116 - tmp115;
373 Y[-7 * iostride] = tmp125 - tmp126;
374 X[3 * iostride] = tmp125 + tmp126;
375 tmp117 = tmp115 + tmp116;
376 Y[-9 * iostride] = tmp117 - tmp124;
377 X[iostride] = tmp117 + tmp124;
/* Group 2 writes X[5], X[7], Y[-3], X[9], Y[-1] (times iostride). */
380 fftw_real tmp148;
381 fftw_real tmp143;
382 fftw_real tmp149;
383 fftw_real tmp147;
384 fftw_real tmp151;
385 fftw_real tmp145;
386 fftw_real tmp146;
387 fftw_real tmp152;
388 fftw_real tmp150;
389 ASSERT_ALIGNED_DOUBLE();
390 tmp148 = K559016994 * (tmp141 - tmp142);
391 tmp143 = tmp141 + tmp142;
392 tmp149 = tmp144 - (K250000000 * tmp143);
393 tmp145 = tmp50 - tmp61;
394 tmp146 = tmp73 - tmp84;
395 tmp147 = (K951056516 * tmp145) + (K587785252 * tmp146);
396 tmp151 = (K587785252 * tmp145) - (K951056516 * tmp146);
397 X[5 * iostride] = -(tmp143 + tmp144);
398 tmp152 = tmp149 - tmp148;
399 X[7 * iostride] = tmp151 - tmp152;
400 Y[-3 * iostride] = tmp151 + tmp152;
401 tmp150 = tmp148 + tmp149;
402 X[9 * iostride] = -(tmp147 + tmp150);
403 Y[-iostride] = tmp150 - tmp147;
/* Group 3 writes X[0], X[4], Y[-6], X[2], Y[-8] (times iostride). */
406 fftw_real tmp96;
407 fftw_real tmp94;
408 fftw_real tmp95;
409 fftw_real tmp112;
410 fftw_real tmp114;
411 fftw_real tmp104;
412 fftw_real tmp111;
413 fftw_real tmp113;
414 fftw_real tmp97;
415 ASSERT_ALIGNED_DOUBLE();
416 tmp96 = K559016994 * (tmp90 - tmp93);
417 tmp94 = tmp90 + tmp93;
418 tmp95 = tmp87 - (K250000000 * tmp94);
419 tmp104 = tmp100 - tmp103;
420 tmp111 = tmp107 - tmp110;
421 tmp112 = (K951056516 * tmp104) - (K587785252 * tmp111);
422 tmp114 = (K951056516 * tmp111) + (K587785252 * tmp104);
423 X[0] = tmp87 + tmp94;
424 tmp113 = tmp96 + tmp95;
425 X[4 * iostride] = tmp113 - tmp114;
426 Y[-6 * iostride] = tmp113 + tmp114;
427 tmp97 = tmp95 - tmp96;
428 X[2 * iostride] = tmp97 - tmp112;
429 Y[-8 * iostride] = tmp97 + tmp112;
/* Group 4 writes Y[0], X[6], Y[-4], X[8], Y[-2] (times iostride). */
432 fftw_real tmp134;
433 fftw_real tmp129;
434 fftw_real tmp133;
435 fftw_real tmp138;
436 fftw_real tmp140;
437 fftw_real tmp136;
438 fftw_real tmp137;
439 fftw_real tmp139;
440 fftw_real tmp135;
441 ASSERT_ALIGNED_DOUBLE();
442 tmp134 = K559016994 * (tmp127 - tmp128);
443 tmp129 = tmp127 + tmp128;
444 tmp133 = tmp132 - (K250000000 * tmp129);
445 tmp136 = tmp91 - tmp92;
446 tmp137 = tmp88 - tmp89;
447 tmp138 = (K951056516 * tmp136) - (K587785252 * tmp137);
448 tmp140 = (K951056516 * tmp137) + (K587785252 * tmp136);
449 Y[0] = tmp129 + tmp132;
450 tmp139 = tmp134 + tmp133;
451 X[6 * iostride] = -(tmp139 - tmp140);
452 Y[-4 * iostride] = tmp140 + tmp139;
453 tmp135 = tmp133 - tmp134;
454 X[8 * iostride] = -(tmp135 - tmp138);
455 Y[-2 * iostride] = tmp138 + tmp135;
/*
 * Last section (no twiddle factors). Since i starts at 2 and steps by 2,
 * i == m holds here only when m is even and at least 2. It reads X[0] ..
 * X[9 * iostride] and writes X[0] .. X[4 * iostride] and Y[0] ..
 * Y[-4 * iostride]; W is not used.
 */
458 if (i == m) {
459 fftw_real tmp1;
460 fftw_real tmp24;
461 fftw_real tmp8;
462 fftw_real tmp10;
463 fftw_real tmp25;
464 fftw_real tmp26;
465 fftw_real tmp14;
466 fftw_real tmp28;
467 fftw_real tmp23;
468 fftw_real tmp17;
469 ASSERT_ALIGNED_DOUBLE();
470 tmp1 = X[0];
471 tmp24 = X[5 * iostride];
/* Even-numbered inputs 4, 6, 8 and 2. */
473 fftw_real tmp2;
474 fftw_real tmp3;
475 fftw_real tmp4;
476 fftw_real tmp5;
477 fftw_real tmp6;
478 fftw_real tmp7;
479 ASSERT_ALIGNED_DOUBLE();
480 tmp2 = X[4 * iostride];
481 tmp3 = X[6 * iostride];
482 tmp4 = tmp2 - tmp3;
483 tmp5 = X[8 * iostride];
484 tmp6 = X[2 * iostride];
485 tmp7 = tmp5 - tmp6;
486 tmp8 = tmp4 + tmp7;
487 tmp10 = K559016994 * (tmp4 - tmp7);
488 tmp25 = tmp2 + tmp3;
489 tmp26 = tmp5 + tmp6;
/* Odd-numbered inputs 1, 9, 3 and 7. */
492 fftw_real tmp12;
493 fftw_real tmp13;
494 fftw_real tmp22;
495 fftw_real tmp15;
496 fftw_real tmp16;
497 fftw_real tmp21;
498 ASSERT_ALIGNED_DOUBLE();
499 tmp12 = X[iostride];
500 tmp13 = X[9 * iostride];
501 tmp22 = tmp12 + tmp13;
502 tmp15 = X[3 * iostride];
503 tmp16 = X[7 * iostride];
504 tmp21 = tmp15 + tmp16;
505 tmp14 = tmp12 - tmp13;
506 tmp28 = K559016994 * (tmp22 + tmp21);
507 tmp23 = tmp21 - tmp22;
508 tmp17 = tmp15 - tmp16;
/* Every input is now held in a temporary, so the stores can begin. */
510 X[2 * iostride] = tmp1 + tmp8;
512 fftw_real tmp18;
513 fftw_real tmp20;
514 fftw_real tmp11;
515 fftw_real tmp19;
516 fftw_real tmp9;
517 ASSERT_ALIGNED_DOUBLE();
518 tmp18 = (K587785252 * tmp14) - (K951056516 * tmp17);
519 tmp20 = (K951056516 * tmp14) + (K587785252 * tmp17);
520 tmp9 = tmp1 - (K250000000 * tmp8);
521 tmp11 = tmp9 - tmp10;
522 tmp19 = tmp10 + tmp9;
523 X[3 * iostride] = tmp11 - tmp18;
524 X[iostride] = tmp11 + tmp18;
525 X[4 * iostride] = tmp19 - tmp20;
526 X[0] = tmp19 + tmp20;
528 Y[-2 * iostride] = tmp23 - tmp24;
530 fftw_real tmp27;
531 fftw_real tmp32;
532 fftw_real tmp30;
533 fftw_real tmp31;
534 fftw_real tmp29;
535 ASSERT_ALIGNED_DOUBLE();
536 tmp27 = (K951056516 * tmp25) + (K587785252 * tmp26);
537 tmp32 = (K951056516 * tmp26) - (K587785252 * tmp25);
538 tmp29 = (K250000000 * tmp23) + tmp24;
539 tmp30 = tmp28 + tmp29;
540 tmp31 = tmp29 - tmp28;
541 Y[0] = -(tmp27 + tmp30);
542 Y[-4 * iostride] = tmp27 - tmp30;
543 Y[-iostride] = tmp31 - tmp32;
544 Y[-3 * iostride] = tmp32 + tmp31;
/*
 * Table of nine integers, 1 through 9, passed to the codelet descriptor
 * that follows. Its length matches the nine twiddle factors W[0] .. W[8]
 * that fftw_hc2hc_forward_10 reads on each loop iteration.
 * NOTE(review): presumably entry j names the twiddle exponent stored in
 * W[j] - confirm against the fftw_codelet_desc definition in fftw-int.h.
 */
549 static const int twiddle_order[] =
550 {1, 2, 3, 4, 5, 6, 7, 8, 9};
551 fftw_codelet_desc fftw_hc2hc_forward_10_desc =
553 "fftw_hc2hc_forward_10",
554 (void (*)()) fftw_hc2hc_forward_10,
556 FFTW_FORWARD,
557 FFTW_HC2HC,
558 223,
560 twiddle_order,