51
51
DK(KP198912367, +0.198912367379658006911597622644676228597850501);
52
52
DK(KP707106781, +0.707106781186547524400844362104849039284835938);
53
53
DK(KP414213562, +0.414213562373095048801688724209698078569671875);
55
for (i = v; i > 0; i = i - 1, R0 = R0 + ivs, R1 = R1 + ivs, Cr = Cr + ovs, Ci = Ci + ovs, MAKE_VOLATILE_STRIDE(rs), MAKE_VOLATILE_STRIDE(csr), MAKE_VOLATILE_STRIDE(csi)) {
56
E T23, T1S, T21, T1L, T2z, T2x, T1Z, T22;
58
E T2n, T2B, T1z, T5, T1C, T2C, T2o, Tc, T27, T1J, T1l, Tm, T26, T1G, T1k;
59
E Tv, T1s, T1c, T2e, T1Y, T1r, T15, T2d, T1V, TP, TF, T1M, TC, T1P, TN;
62
E T1A, T8, Te, Tj, Tf, T1B, Tb, Tg;
64
E T1, T2l, T2, T3, T9, Ta;
76
T1A = FNMS(KP414213562, T6, T7);
77
T8 = FMA(KP414213562, T7, T6);
78
T2n = FMA(KP707106781, T2m, T2l);
79
T2B = FNMS(KP707106781, T2m, T2l);
80
T1z = FMA(KP707106781, T4, T1);
81
T5 = FNMS(KP707106781, T4, T1);
87
T1B = FMS(KP414213562, T9, Ta);
88
Tb = FMA(KP414213562, Ta, T9);
92
E Tn, Ts, To, T1I, Tl, T1H, Ti, Tp, Tk, Th, T1T, T1U;
102
T1I = FMA(KP707106781, Tk, Tj);
103
Tl = FNMS(KP707106781, Tk, Tj);
104
T1H = FMA(KP707106781, Th, Te);
105
Ti = FNMS(KP707106781, Th, Te);
108
E TT, T16, TY, T17, TW, TZ, T11, T12, Tt, Tq;
110
T27 = FNMS(KP198912367, T1H, T1I);
111
T1J = FMA(KP198912367, T1I, T1H);
112
T1l = FMA(KP668178637, Ti, Tl);
113
Tm = FNMS(KP668178637, Tl, Ti);
118
E TU, T1F, Tu, T1E, Tr, TV;
120
T1F = FMA(KP707106781, Tt, Ts);
121
Tu = FNMS(KP707106781, Tt, Ts);
122
T1E = FMA(KP707106781, Tq, Tn);
123
Tr = FNMS(KP707106781, Tq, Tn);
126
T26 = FNMS(KP198912367, T1E, T1F);
127
T1G = FMA(KP198912367, T1F, T1E);
128
T1k = FMA(KP668178637, Tr, Tu);
129
Tv = FNMS(KP668178637, Tu, Tr);
134
T12 = R1[WS(rs, 13)];
137
E TX, T1a, T10, T19, T13, T1W, T18, T1b, T14, T1X;
138
T1T = FMS(KP707106781, TW, TT);
139
TX = FMA(KP707106781, TW, TT);
140
T1a = FNMS(KP414213562, TY, TZ);
141
T10 = FMA(KP414213562, TZ, TY);
142
T19 = FMS(KP414213562, T11, T12);
143
T13 = FMA(KP414213562, T12, T11);
144
T1W = FMA(KP707106781, T17, T16);
145
T18 = FNMS(KP707106781, T17, T16);
150
T1s = FMA(KP923879532, T1b, T18);
151
T1c = FNMS(KP923879532, T1b, T18);
152
T2e = FMA(KP923879532, T1X, T1W);
153
T1Y = FNMS(KP923879532, T1X, T1W);
154
T1r = FNMS(KP923879532, T14, TX);
155
T15 = FMA(KP923879532, T14, TX);
159
E Ty, TL, TG, TM, TB, TH;
165
T2d = FMA(KP923879532, T1U, T1T);
166
T1V = FNMS(KP923879532, T1U, T1T);
173
TP = FNMS(KP414213562, TD, TE);
174
TF = FMA(KP414213562, TE, TD);
177
T1M = FMA(KP707106781, TB, Ty);
178
TC = FNMS(KP707106781, TB, Ty);
179
T1P = FMA(KP707106781, TM, TL);
180
TN = FNMS(KP707106781, TM, TL);
181
TO = FMS(KP414213562, TG, TH);
182
TI = FMA(KP414213562, TH, TG);
187
E T1j, T1O, T1p, T1R, T1o, T2E, T2D, T1m, T1D, T2w, T2v, T1K, T2i, T2c, T2h;
188
E T29, T2t, T2r, T2f, T2j;
190
E T2a, T2b, T1g, TS, T1f, Tx, T2N, T2L, T1d, T1h;
192
E Td, TR, TK, Tw, T2J, T2K;
193
T1j = FMA(KP923879532, Tc, T5);
194
Td = FNMS(KP923879532, Tc, T5);
201
T2a = FMA(KP923879532, T1N, T1M);
202
T1O = FNMS(KP923879532, T1N, T1M);
203
T1p = FMA(KP923879532, TQ, TN);
204
TR = FNMS(KP923879532, TQ, TN);
205
T2b = FMA(KP923879532, T1Q, T1P);
206
T1R = FNMS(KP923879532, T1Q, T1P);
207
T1o = FMA(KP923879532, TJ, TC);
208
TK = FNMS(KP923879532, TJ, TC);
212
T2D = FMA(KP923879532, T2C, T2B);
213
T2J = FNMS(KP923879532, T2C, T2B);
216
T1g = FMA(KP534511135, TK, TR);
217
TS = FNMS(KP534511135, TR, TK);
218
T1f = FNMS(KP831469612, Tw, Td);
219
Tx = FMA(KP831469612, Tw, Td);
220
T2N = FNMS(KP831469612, T2K, T2J);
221
T2L = FMA(KP831469612, T2K, T2J);
222
T1d = FNMS(KP534511135, T1c, T15);
223
T1h = FMA(KP534511135, T15, T1c);
226
E T25, T28, T2p, T2q;
227
T1D = FNMS(KP923879532, T1C, T1z);
228
T25 = FMA(KP923879532, T1C, T1z);
230
E T2O, T1e, T2M, T1i;
235
Ci[WS(csi, 5)] = FNMS(KP881921264, T2O, T2N);
236
Ci[WS(csi, 10)] = -(FMA(KP881921264, T2O, T2N));
237
Cr[WS(csr, 2)] = FMA(KP881921264, T1e, Tx);
238
Cr[WS(csr, 13)] = FNMS(KP881921264, T1e, Tx);
239
Ci[WS(csi, 2)] = -(FMA(KP881921264, T2M, T2L));
240
Ci[WS(csi, 13)] = FNMS(KP881921264, T2M, T2L);
241
Cr[WS(csr, 5)] = FMA(KP881921264, T1i, T1f);
242
Cr[WS(csr, 10)] = FNMS(KP881921264, T1i, T1f);
246
T2v = FNMS(KP923879532, T2o, T2n);
247
T2p = FMA(KP923879532, T2o, T2n);
250
T2i = FMA(KP098491403, T2a, T2b);
251
T2c = FNMS(KP098491403, T2b, T2a);
252
T2h = FNMS(KP980785280, T28, T25);
253
T29 = FMA(KP980785280, T28, T25);
254
T2t = FNMS(KP980785280, T2q, T2p);
255
T2r = FMA(KP980785280, T2q, T2p);
256
T2f = FMA(KP098491403, T2e, T2d);
257
T2j = FNMS(KP098491403, T2d, T2e);
261
E T1x, T1q, T1v, T1n, T2H, T2F, T1t, T1w;
263
E T2u, T2g, T2s, T2k;
268
Ci[WS(csi, 7)] = FMA(KP995184726, T2u, T2t);
269
Ci[WS(csi, 8)] = FMS(KP995184726, T2u, T2t);
270
Cr[0] = FMA(KP995184726, T2g, T29);
271
Cr[WS(csr, 15)] = FNMS(KP995184726, T2g, T29);
272
Ci[0] = -(FMA(KP995184726, T2s, T2r));
273
Ci[WS(csi, 15)] = FNMS(KP995184726, T2s, T2r);
274
Cr[WS(csr, 7)] = FMA(KP995184726, T2k, T2h);
275
Cr[WS(csr, 8)] = FNMS(KP995184726, T2k, T2h);
277
T1x = FNMS(KP303346683, T1o, T1p);
278
T1q = FMA(KP303346683, T1p, T1o);
279
T1v = FNMS(KP831469612, T1m, T1j);
280
T1n = FMA(KP831469612, T1m, T1j);
281
T2H = FNMS(KP831469612, T2E, T2D);
282
T2F = FMA(KP831469612, T2E, T2D);
283
T1t = FMA(KP303346683, T1s, T1r);
284
T1w = FNMS(KP303346683, T1r, T1s);
286
E T2I, T1u, T2G, T1y;
291
Ci[WS(csi, 6)] = -(FMA(KP956940335, T2I, T2H));
292
Ci[WS(csi, 9)] = FNMS(KP956940335, T2I, T2H);
293
Cr[WS(csr, 1)] = FMA(KP956940335, T1u, T1n);
294
Cr[WS(csr, 14)] = FNMS(KP956940335, T1u, T1n);
295
Ci[WS(csi, 1)] = FMA(KP956940335, T2G, T2F);
296
Ci[WS(csi, 14)] = FMS(KP956940335, T2G, T2F);
297
Cr[WS(csr, 6)] = FMA(KP956940335, T1y, T1v);
298
Cr[WS(csr, 9)] = FNMS(KP956940335, T1y, T1v);
300
T23 = FNMS(KP820678790, T1O, T1R);
301
T1S = FMA(KP820678790, T1R, T1O);
302
T21 = FNMS(KP980785280, T1K, T1D);
303
T1L = FMA(KP980785280, T1K, T1D);
304
T2z = FMA(KP980785280, T2w, T2v);
305
T2x = FNMS(KP980785280, T2w, T2v);
306
T1Z = FNMS(KP820678790, T1Y, T1V);
307
T22 = FMA(KP820678790, T1V, T1Y);
312
E T20, T2A, T24, T2y;
317
Ci[WS(csi, 4)] = FMS(KP773010453, T2A, T2z);
318
Ci[WS(csi, 11)] = FMA(KP773010453, T2A, T2z);
319
Cr[WS(csr, 3)] = FMA(KP773010453, T20, T1L);
320
Cr[WS(csr, 12)] = FNMS(KP773010453, T20, T1L);
321
Ci[WS(csi, 3)] = FMA(KP773010453, T2y, T2x);
322
Ci[WS(csi, 12)] = FMS(KP773010453, T2y, T2x);
323
Cr[WS(csr, 4)] = FMA(KP773010453, T24, T21);
324
Cr[WS(csr, 11)] = FNMS(KP773010453, T24, T21);
56
for (i = v; i > 0; i = i - 1, R0 = R0 + ivs, R1 = R1 + ivs, Cr = Cr + ovs, Ci = Ci + ovs, MAKE_VOLATILE_STRIDE(rs), MAKE_VOLATILE_STRIDE(csr), MAKE_VOLATILE_STRIDE(csi)) {
57
E T23, T1S, T21, T1L, T2z, T2x, T1Z, T22;
59
E T2n, T2B, T1z, T5, T1C, T2C, T2o, Tc, T27, T1J, T1l, Tm, T26, T1G, T1k;
60
E Tv, T1s, T1c, T2e, T1Y, T1r, T15, T2d, T1V, TP, TF, T1M, TC, T1P, TN;
63
E T1A, T8, Te, Tj, Tf, T1B, Tb, Tg;
65
E T1, T2l, T2, T3, T9, Ta;
77
T1A = FNMS(KP414213562, T6, T7);
78
T8 = FMA(KP414213562, T7, T6);
79
T2n = FMA(KP707106781, T2m, T2l);
80
T2B = FNMS(KP707106781, T2m, T2l);
81
T1z = FMA(KP707106781, T4, T1);
82
T5 = FNMS(KP707106781, T4, T1);
88
T1B = FMS(KP414213562, T9, Ta);
89
Tb = FMA(KP414213562, Ta, T9);
93
E Tn, Ts, To, T1I, Tl, T1H, Ti, Tp, Tk, Th, T1T, T1U;
103
T1I = FMA(KP707106781, Tk, Tj);
104
Tl = FNMS(KP707106781, Tk, Tj);
105
T1H = FMA(KP707106781, Th, Te);
106
Ti = FNMS(KP707106781, Th, Te);
109
E TT, T16, TY, T17, TW, TZ, T11, T12, Tt, Tq;
111
T27 = FNMS(KP198912367, T1H, T1I);
112
T1J = FMA(KP198912367, T1I, T1H);
113
T1l = FMA(KP668178637, Ti, Tl);
114
Tm = FNMS(KP668178637, Tl, Ti);
119
E TU, T1F, Tu, T1E, Tr, TV;
121
T1F = FMA(KP707106781, Tt, Ts);
122
Tu = FNMS(KP707106781, Tt, Ts);
123
T1E = FMA(KP707106781, Tq, Tn);
124
Tr = FNMS(KP707106781, Tq, Tn);
127
T26 = FNMS(KP198912367, T1E, T1F);
128
T1G = FMA(KP198912367, T1F, T1E);
129
T1k = FMA(KP668178637, Tr, Tu);
130
Tv = FNMS(KP668178637, Tu, Tr);
135
T12 = R1[WS(rs, 13)];
138
E TX, T1a, T10, T19, T13, T1W, T18, T1b, T14, T1X;
139
T1T = FMS(KP707106781, TW, TT);
140
TX = FMA(KP707106781, TW, TT);
141
T1a = FNMS(KP414213562, TY, TZ);
142
T10 = FMA(KP414213562, TZ, TY);
143
T19 = FMS(KP414213562, T11, T12);
144
T13 = FMA(KP414213562, T12, T11);
145
T1W = FMA(KP707106781, T17, T16);
146
T18 = FNMS(KP707106781, T17, T16);
151
T1s = FMA(KP923879532, T1b, T18);
152
T1c = FNMS(KP923879532, T1b, T18);
153
T2e = FMA(KP923879532, T1X, T1W);
154
T1Y = FNMS(KP923879532, T1X, T1W);
155
T1r = FNMS(KP923879532, T14, TX);
156
T15 = FMA(KP923879532, T14, TX);
160
E Ty, TL, TG, TM, TB, TH;
166
T2d = FMA(KP923879532, T1U, T1T);
167
T1V = FNMS(KP923879532, T1U, T1T);
174
TP = FNMS(KP414213562, TD, TE);
175
TF = FMA(KP414213562, TE, TD);
178
T1M = FMA(KP707106781, TB, Ty);
179
TC = FNMS(KP707106781, TB, Ty);
180
T1P = FMA(KP707106781, TM, TL);
181
TN = FNMS(KP707106781, TM, TL);
182
TO = FMS(KP414213562, TG, TH);
183
TI = FMA(KP414213562, TH, TG);
188
E T1j, T1O, T1p, T1R, T1o, T2E, T2D, T1m, T1D, T2w, T2v, T1K, T2i, T2c, T2h;
189
E T29, T2t, T2r, T2f, T2j;
191
E T2a, T2b, T1g, TS, T1f, Tx, T2N, T2L, T1d, T1h;
193
E Td, TR, TK, Tw, T2J, T2K;
194
T1j = FMA(KP923879532, Tc, T5);
195
Td = FNMS(KP923879532, Tc, T5);
202
T2a = FMA(KP923879532, T1N, T1M);
203
T1O = FNMS(KP923879532, T1N, T1M);
204
T1p = FMA(KP923879532, TQ, TN);
205
TR = FNMS(KP923879532, TQ, TN);
206
T2b = FMA(KP923879532, T1Q, T1P);
207
T1R = FNMS(KP923879532, T1Q, T1P);
208
T1o = FMA(KP923879532, TJ, TC);
209
TK = FNMS(KP923879532, TJ, TC);
213
T2D = FMA(KP923879532, T2C, T2B);
214
T2J = FNMS(KP923879532, T2C, T2B);
217
T1g = FMA(KP534511135, TK, TR);
218
TS = FNMS(KP534511135, TR, TK);
219
T1f = FNMS(KP831469612, Tw, Td);
220
Tx = FMA(KP831469612, Tw, Td);
221
T2N = FNMS(KP831469612, T2K, T2J);
222
T2L = FMA(KP831469612, T2K, T2J);
223
T1d = FNMS(KP534511135, T1c, T15);
224
T1h = FMA(KP534511135, T15, T1c);
227
E T25, T28, T2p, T2q;
228
T1D = FNMS(KP923879532, T1C, T1z);
229
T25 = FMA(KP923879532, T1C, T1z);
231
E T2O, T1e, T2M, T1i;
236
Ci[WS(csi, 5)] = FNMS(KP881921264, T2O, T2N);
237
Ci[WS(csi, 10)] = -(FMA(KP881921264, T2O, T2N));
238
Cr[WS(csr, 2)] = FMA(KP881921264, T1e, Tx);
239
Cr[WS(csr, 13)] = FNMS(KP881921264, T1e, Tx);
240
Ci[WS(csi, 2)] = -(FMA(KP881921264, T2M, T2L));
241
Ci[WS(csi, 13)] = FNMS(KP881921264, T2M, T2L);
242
Cr[WS(csr, 5)] = FMA(KP881921264, T1i, T1f);
243
Cr[WS(csr, 10)] = FNMS(KP881921264, T1i, T1f);
247
T2v = FNMS(KP923879532, T2o, T2n);
248
T2p = FMA(KP923879532, T2o, T2n);
251
T2i = FMA(KP098491403, T2a, T2b);
252
T2c = FNMS(KP098491403, T2b, T2a);
253
T2h = FNMS(KP980785280, T28, T25);
254
T29 = FMA(KP980785280, T28, T25);
255
T2t = FNMS(KP980785280, T2q, T2p);
256
T2r = FMA(KP980785280, T2q, T2p);
257
T2f = FMA(KP098491403, T2e, T2d);
258
T2j = FNMS(KP098491403, T2d, T2e);
262
E T1x, T1q, T1v, T1n, T2H, T2F, T1t, T1w;
264
E T2u, T2g, T2s, T2k;
269
Ci[WS(csi, 7)] = FMA(KP995184726, T2u, T2t);
270
Ci[WS(csi, 8)] = FMS(KP995184726, T2u, T2t);
271
Cr[0] = FMA(KP995184726, T2g, T29);
272
Cr[WS(csr, 15)] = FNMS(KP995184726, T2g, T29);
273
Ci[0] = -(FMA(KP995184726, T2s, T2r));
274
Ci[WS(csi, 15)] = FNMS(KP995184726, T2s, T2r);
275
Cr[WS(csr, 7)] = FMA(KP995184726, T2k, T2h);
276
Cr[WS(csr, 8)] = FNMS(KP995184726, T2k, T2h);
278
T1x = FNMS(KP303346683, T1o, T1p);
279
T1q = FMA(KP303346683, T1p, T1o);
280
T1v = FNMS(KP831469612, T1m, T1j);
281
T1n = FMA(KP831469612, T1m, T1j);
282
T2H = FNMS(KP831469612, T2E, T2D);
283
T2F = FMA(KP831469612, T2E, T2D);
284
T1t = FMA(KP303346683, T1s, T1r);
285
T1w = FNMS(KP303346683, T1r, T1s);
287
E T2I, T1u, T2G, T1y;
292
Ci[WS(csi, 6)] = -(FMA(KP956940335, T2I, T2H));
293
Ci[WS(csi, 9)] = FNMS(KP956940335, T2I, T2H);
294
Cr[WS(csr, 1)] = FMA(KP956940335, T1u, T1n);
295
Cr[WS(csr, 14)] = FNMS(KP956940335, T1u, T1n);
296
Ci[WS(csi, 1)] = FMA(KP956940335, T2G, T2F);
297
Ci[WS(csi, 14)] = FMS(KP956940335, T2G, T2F);
298
Cr[WS(csr, 6)] = FMA(KP956940335, T1y, T1v);
299
Cr[WS(csr, 9)] = FNMS(KP956940335, T1y, T1v);
301
T23 = FNMS(KP820678790, T1O, T1R);
302
T1S = FMA(KP820678790, T1R, T1O);
303
T21 = FNMS(KP980785280, T1K, T1D);
304
T1L = FMA(KP980785280, T1K, T1D);
305
T2z = FMA(KP980785280, T2w, T2v);
306
T2x = FNMS(KP980785280, T2w, T2v);
307
T1Z = FNMS(KP820678790, T1Y, T1V);
308
T22 = FMA(KP820678790, T1V, T1Y);
313
E T20, T2A, T24, T2y;
318
Ci[WS(csi, 4)] = FMS(KP773010453, T2A, T2z);
319
Ci[WS(csi, 11)] = FMA(KP773010453, T2A, T2z);
320
Cr[WS(csr, 3)] = FMA(KP773010453, T20, T1L);
321
Cr[WS(csr, 12)] = FNMS(KP773010453, T20, T1L);
322
Ci[WS(csi, 3)] = FMA(KP773010453, T2y, T2x);
323
Ci[WS(csi, 12)] = FMS(KP773010453, T2y, T2x);
324
Cr[WS(csr, 4)] = FMA(KP773010453, T24, T21);
325
Cr[WS(csr, 11)] = FNMS(KP773010453, T24, T21);
360
362
DK(KP382683432, +0.382683432365089771728459984030398866761344562);
361
363
DK(KP923879532, +0.923879532511286756128183189396788286822416626);
362
364
DK(KP707106781, +0.707106781186547524400844362104849039284835938);
364
for (i = v; i > 0; i = i - 1, R0 = R0 + ivs, R1 = R1 + ivs, Cr = Cr + ovs, Ci = Ci + ovs, MAKE_VOLATILE_STRIDE(rs), MAKE_VOLATILE_STRIDE(csr), MAKE_VOLATILE_STRIDE(csi)) {
365
E T5, T2D, T1z, T2q, Tc, T2C, T1C, T2n, Tm, T1k, T1J, T26, Tv, T1l, T1G;
366
E T27, T15, T1r, T1Y, T2e, T1c, T1s, T1V, T2d, TK, T1o, T1R, T2b, TR, T1p;
369
E T1, T2p, T4, T2o, T2, T3;
374
T4 = KP707106781 * (T2 - T3);
375
T2o = KP707106781 * (T2 + T3);
387
T8 = FNMS(KP382683432, T7, KP923879532 * T6);
388
T1A = FMA(KP382683432, T6, KP923879532 * T7);
391
Tb = FNMS(KP923879532, Ta, KP382683432 * T9);
392
T1B = FMA(KP923879532, T9, KP382683432 * Ta);
400
E Te, Tk, Th, Tj, Tf, Tg;
405
Th = KP707106781 * (Tf - Tg);
406
Tj = KP707106781 * (Tf + Tg);
411
Tm = FNMS(KP195090322, Tl, KP980785280 * Ti);
412
T1k = FMA(KP195090322, Ti, KP980785280 * Tl);
415
T1J = FNMS(KP555570233, T1I, KP831469612 * T1H);
416
T26 = FMA(KP831469612, T1I, KP555570233 * T1H);
420
E Tq, Tt, Tp, Ts, Tn, To;
425
Tp = KP707106781 * (Tn - To);
426
Ts = KP707106781 * (Tn + To);
431
Tv = FMA(KP980785280, Tr, KP195090322 * Tu);
432
T1l = FNMS(KP980785280, Tu, KP195090322 * Tr);
435
T1G = FNMS(KP555570233, T1F, KP831469612 * T1E);
436
T27 = FMA(KP831469612, T1F, KP555570233 * T1E);
440
E TW, T1a, TV, T19, T10, T16, T13, T17, TT, TU;
445
TV = KP707106781 * (TT - TU);
446
T19 = KP707106781 * (TT + TU);
451
T10 = FNMS(KP382683432, TZ, KP923879532 * TY);
452
T16 = FMA(KP382683432, TY, KP923879532 * TZ);
454
T12 = R1[WS(rs, 13)];
455
T13 = FNMS(KP923879532, T12, KP382683432 * T11);
456
T17 = FMA(KP923879532, T11, KP382683432 * T12);
470
E T18, T1b, T1T, T1U;
482
E Ty, TP, TB, TO, TF, TL, TI, TM, Tz, TA;
487
TB = KP707106781 * (Tz - TA);
488
TO = KP707106781 * (Tz + TA);
493
TF = FNMS(KP382683432, TE, KP923879532 * TD);
494
TL = FMA(KP382683432, TD, KP923879532 * TE);
497
TI = FNMS(KP923879532, TH, KP382683432 * TG);
498
TM = FMA(KP923879532, TG, KP382683432 * TH);
524
E Tx, T1f, T2s, T2u, T1e, T2l, T1i, T2t;
538
TS = FMA(KP098017140, TK, KP995184726 * TR);
539
T1d = FNMS(KP995184726, T1c, KP098017140 * T15);
542
T1g = FNMS(KP098017140, TR, KP995184726 * TK);
543
T1h = FMA(KP995184726, T15, KP098017140 * T1c);
547
Cr[WS(csr, 8)] = Tx - T1e;
548
Ci[WS(csi, 8)] = T2t - T2u;
549
Cr[WS(csr, 7)] = Tx + T1e;
550
Ci[WS(csi, 7)] = T2t + T2u;
551
Cr[WS(csr, 15)] = T1f - T1i;
552
Ci[WS(csi, 15)] = T2l - T2s;
557
E T29, T2h, T2M, T2O, T2g, T2J, T2k, T2N;
559
E T25, T28, T2K, T2L;
570
E T2c, T2f, T2i, T2j;
571
T2c = FMA(KP956940335, T2a, KP290284677 * T2b);
572
T2f = FNMS(KP290284677, T2e, KP956940335 * T2d);
575
T2i = FMA(KP290284677, T2d, KP956940335 * T2e);
576
T2j = FNMS(KP290284677, T2a, KP956940335 * T2b);
580
Cr[WS(csr, 14)] = T29 - T2g;
581
Ci[WS(csi, 14)] = T2N - T2O;
582
Cr[WS(csr, 1)] = T29 + T2g;
583
Ci[WS(csi, 1)] = T2N + T2O;
584
Cr[WS(csr, 9)] = T2h - T2k;
585
Ci[WS(csi, 9)] = T2J - T2M;
586
Cr[WS(csr, 6)] = T2h + T2k;
587
Ci[WS(csi, 6)] = T2J + T2M;
590
E T1n, T1v, T2y, T2A, T1u, T2v, T1y, T2z;
592
E T1j, T1m, T2w, T2x;
603
E T1q, T1t, T1w, T1x;
604
T1q = FMA(KP773010453, T1o, KP634393284 * T1p);
605
T1t = FNMS(KP634393284, T1s, KP773010453 * T1r);
608
T1w = FMA(KP634393284, T1r, KP773010453 * T1s);
609
T1x = FNMS(KP634393284, T1o, KP773010453 * T1p);
613
Cr[WS(csr, 12)] = T1n - T1u;
614
Ci[WS(csi, 12)] = T2z - T2A;
615
Cr[WS(csr, 3)] = T1n + T1u;
616
Ci[WS(csi, 3)] = T2z + T2A;
617
Cr[WS(csr, 11)] = T1v - T1y;
618
Ci[WS(csi, 11)] = T2v - T2y;
619
Cr[WS(csr, 4)] = T1v + T1y;
620
Ci[WS(csi, 4)] = T2v + T2y;
623
E T1L, T21, T2G, T2I, T20, T2H, T24, T2B;
625
E T1D, T1K, T2E, T2F;
636
E T1S, T1Z, T22, T23;
637
T1S = FMA(KP881921264, T1O, KP471396736 * T1R);
638
T1Z = FMA(KP881921264, T1V, KP471396736 * T1Y);
641
T22 = FNMS(KP471396736, T1V, KP881921264 * T1Y);
642
T23 = FNMS(KP471396736, T1O, KP881921264 * T1R);
646
Cr[WS(csr, 13)] = T1L - T20;
647
Ci[WS(csi, 13)] = T2B - T2G;
648
Cr[WS(csr, 2)] = T1L + T20;
649
Ci[WS(csi, 2)] = T2B + T2G;
650
Cr[WS(csr, 10)] = T21 - T24;
651
Ci[WS(csi, 10)] = T2I - T2H;
652
Cr[WS(csr, 5)] = T21 + T24;
653
Ci[WS(csi, 5)] = -(T2H + T2I);
367
for (i = v; i > 0; i = i - 1, R0 = R0 + ivs, R1 = R1 + ivs, Cr = Cr + ovs, Ci = Ci + ovs, MAKE_VOLATILE_STRIDE(rs), MAKE_VOLATILE_STRIDE(csr), MAKE_VOLATILE_STRIDE(csi)) {
368
E T5, T2D, T1z, T2q, Tc, T2C, T1C, T2n, Tm, T1k, T1J, T26, Tv, T1l, T1G;
369
E T27, T15, T1r, T1Y, T2e, T1c, T1s, T1V, T2d, TK, T1o, T1R, T2b, TR, T1p;
372
E T1, T2p, T4, T2o, T2, T3;
377
T4 = KP707106781 * (T2 - T3);
378
T2o = KP707106781 * (T2 + T3);
390
T8 = FNMS(KP382683432, T7, KP923879532 * T6);
391
T1A = FMA(KP382683432, T6, KP923879532 * T7);
394
Tb = FNMS(KP923879532, Ta, KP382683432 * T9);
395
T1B = FMA(KP923879532, T9, KP382683432 * Ta);
403
E Te, Tk, Th, Tj, Tf, Tg;
408
Th = KP707106781 * (Tf - Tg);
409
Tj = KP707106781 * (Tf + Tg);
414
Tm = FNMS(KP195090322, Tl, KP980785280 * Ti);
415
T1k = FMA(KP195090322, Ti, KP980785280 * Tl);
418
T1J = FNMS(KP555570233, T1I, KP831469612 * T1H);
419
T26 = FMA(KP831469612, T1I, KP555570233 * T1H);
423
E Tq, Tt, Tp, Ts, Tn, To;
428
Tp = KP707106781 * (Tn - To);
429
Ts = KP707106781 * (Tn + To);
434
Tv = FMA(KP980785280, Tr, KP195090322 * Tu);
435
T1l = FNMS(KP980785280, Tu, KP195090322 * Tr);
438
T1G = FNMS(KP555570233, T1F, KP831469612 * T1E);
439
T27 = FMA(KP831469612, T1F, KP555570233 * T1E);
443
E TW, T1a, TV, T19, T10, T16, T13, T17, TT, TU;
448
TV = KP707106781 * (TT - TU);
449
T19 = KP707106781 * (TT + TU);
454
T10 = FNMS(KP382683432, TZ, KP923879532 * TY);
455
T16 = FMA(KP382683432, TY, KP923879532 * TZ);
457
T12 = R1[WS(rs, 13)];
458
T13 = FNMS(KP923879532, T12, KP382683432 * T11);
459
T17 = FMA(KP923879532, T11, KP382683432 * T12);
473
E T18, T1b, T1T, T1U;
485
E Ty, TP, TB, TO, TF, TL, TI, TM, Tz, TA;
490
TB = KP707106781 * (Tz - TA);
491
TO = KP707106781 * (Tz + TA);
496
TF = FNMS(KP382683432, TE, KP923879532 * TD);
497
TL = FMA(KP382683432, TD, KP923879532 * TE);
500
TI = FNMS(KP923879532, TH, KP382683432 * TG);
501
TM = FMA(KP923879532, TG, KP382683432 * TH);
527
E Tx, T1f, T2s, T2u, T1e, T2l, T1i, T2t;
541
TS = FMA(KP098017140, TK, KP995184726 * TR);
542
T1d = FNMS(KP995184726, T1c, KP098017140 * T15);
545
T1g = FNMS(KP098017140, TR, KP995184726 * TK);
546
T1h = FMA(KP995184726, T15, KP098017140 * T1c);
550
Cr[WS(csr, 8)] = Tx - T1e;
551
Ci[WS(csi, 8)] = T2t - T2u;
552
Cr[WS(csr, 7)] = Tx + T1e;
553
Ci[WS(csi, 7)] = T2t + T2u;
554
Cr[WS(csr, 15)] = T1f - T1i;
555
Ci[WS(csi, 15)] = T2l - T2s;
560
E T29, T2h, T2M, T2O, T2g, T2J, T2k, T2N;
562
E T25, T28, T2K, T2L;
573
E T2c, T2f, T2i, T2j;
574
T2c = FMA(KP956940335, T2a, KP290284677 * T2b);
575
T2f = FNMS(KP290284677, T2e, KP956940335 * T2d);
578
T2i = FMA(KP290284677, T2d, KP956940335 * T2e);
579
T2j = FNMS(KP290284677, T2a, KP956940335 * T2b);
583
Cr[WS(csr, 14)] = T29 - T2g;
584
Ci[WS(csi, 14)] = T2N - T2O;
585
Cr[WS(csr, 1)] = T29 + T2g;
586
Ci[WS(csi, 1)] = T2N + T2O;
587
Cr[WS(csr, 9)] = T2h - T2k;
588
Ci[WS(csi, 9)] = T2J - T2M;
589
Cr[WS(csr, 6)] = T2h + T2k;
590
Ci[WS(csi, 6)] = T2J + T2M;
593
E T1n, T1v, T2y, T2A, T1u, T2v, T1y, T2z;
595
E T1j, T1m, T2w, T2x;
606
E T1q, T1t, T1w, T1x;
607
T1q = FMA(KP773010453, T1o, KP634393284 * T1p);
608
T1t = FNMS(KP634393284, T1s, KP773010453 * T1r);
611
T1w = FMA(KP634393284, T1r, KP773010453 * T1s);
612
T1x = FNMS(KP634393284, T1o, KP773010453 * T1p);
616
Cr[WS(csr, 12)] = T1n - T1u;
617
Ci[WS(csi, 12)] = T2z - T2A;
618
Cr[WS(csr, 3)] = T1n + T1u;
619
Ci[WS(csi, 3)] = T2z + T2A;
620
Cr[WS(csr, 11)] = T1v - T1y;
621
Ci[WS(csi, 11)] = T2v - T2y;
622
Cr[WS(csr, 4)] = T1v + T1y;
623
Ci[WS(csi, 4)] = T2v + T2y;
626
E T1L, T21, T2G, T2I, T20, T2H, T24, T2B;
628
E T1D, T1K, T2E, T2F;
639
E T1S, T1Z, T22, T23;
640
T1S = FMA(KP881921264, T1O, KP471396736 * T1R);
641
T1Z = FMA(KP881921264, T1V, KP471396736 * T1Y);
644
T22 = FNMS(KP471396736, T1V, KP881921264 * T1Y);
645
T23 = FNMS(KP471396736, T1O, KP881921264 * T1R);
649
Cr[WS(csr, 13)] = T1L - T20;
650
Ci[WS(csi, 13)] = T2B - T2G;
651
Cr[WS(csr, 2)] = T1L + T20;
652
Ci[WS(csi, 2)] = T2B + T2G;
653
Cr[WS(csr, 10)] = T21 - T24;
654
Ci[WS(csi, 10)] = T2I - T2H;
655
Cr[WS(csr, 5)] = T21 + T24;
656
Ci[WS(csi, 5)] = -(T2H + T2I);