21
21
/* This file was automatically generated --- DO NOT EDIT */
22
/* Generated on Sat Jul 5 21:40:06 EDT 2003 */
22
/* Generated on Tue Mar 7 09:46:58 EST 2006 */
24
24
#include "codelet-dft.h"
26
/* Generated by: /homee/stevenj/cvs/fftw3.0.1/genfft/gen_notw_c -simd -compact -variables 4 -n 4 -name n1fv_4 -include n1f.h */
28
/* Generated by: ../../../genfft/gen_notw_c -fma -reorder-insns -schedule-for-pipeline -simd -compact -variables 4 -pipeline-latency 8 -n 4 -name n1fv_4 -include n1f.h */
31
* This function contains 8 FP additions, 2 FP multiplications,
32
* (or, 6 additions, 0 multiplications, 2 fused multiply/add),
33
* 11 stack variables, and 8 memory accesses
37
* $Id: algsimp.ml,v 1.9 2006-02-12 23:34:12 athena Exp $
38
* $Id: fft.ml,v 1.4 2006-01-05 03:04:27 stevenj Exp $
39
* $Id: gen_notw_c.ml,v 1.17 2006-02-12 23:34:12 athena Exp $
44
static void n1fv_4(const R *ri, const R *ii, R *ro, R *io, stride is, stride os, INT v, INT ivs, INT ovs)
51
for (i = v; i > 0; i = i - VL, xi = xi + (VL * ivs), xo = xo + (VL * ovs), MAKE_VOLATILE_STRIDE(is), MAKE_VOLATILE_STRIDE(os)) {
53
T1 = LD(&(xi[0]), ivs, &(xi[0]));
54
T2 = LD(&(xi[WS(is, 2)]), ivs, &(xi[0]));
55
T4 = LD(&(xi[WS(is, 1)]), ivs, &(xi[WS(is, 1)]));
56
T5 = LD(&(xi[WS(is, 3)]), ivs, &(xi[WS(is, 1)]));
63
ST(&(xo[WS(os, 2)]), VSUB(T7, T8), ovs, &(xo[0]));
64
ST(&(xo[0]), VADD(T7, T8), ovs, &(xo[0]));
65
ST(&(xo[WS(os, 3)]), VFMAI(T6, T3), ovs, &(xo[WS(os, 1)]));
66
ST(&(xo[WS(os, 1)]), VFNMSI(T6, T3), ovs, &(xo[WS(os, 1)]));
71
static const kdft_desc desc = { 4, "n1fv_4", {6, 0, 2, 0}, &GENUS, 0, 0, 0, 0 };
72
void X(codelet_n1fv_4) (planner *p) {
73
X(kdft_register) (p, n1fv_4, &desc);
78
/* Generated by: ../../../genfft/gen_notw_c -simd -compact -variables 4 -pipeline-latency 8 -n 4 -name n1fv_4 -include n1f.h */
29
81
* This function contains 8 FP additions, 0 FP multiplications,
35
* $Id: algsimp.ml,v 1.7 2003/03/15 20:29:42 stevenj Exp $
36
* $Id: fft.ml,v 1.2 2003/03/15 20:29:42 stevenj Exp $
37
* $Id: gen_notw_c.ml,v 1.9 2003/04/16 21:21:53 athena Exp $
87
* $Id: algsimp.ml,v 1.9 2006-02-12 23:34:12 athena Exp $
88
* $Id: fft.ml,v 1.4 2006-01-05 03:04:27 stevenj Exp $
89
* $Id: gen_notw_c.ml,v 1.17 2006-02-12 23:34:12 athena Exp $
42
static void n1fv_4(const R *ri, const R *ii, R *ro, R *io, stride is, stride os, int v, int ivs, int ovs)
94
static void n1fv_4(const R *ri, const R *ii, R *ro, R *io, stride is, stride os, INT v, INT ivs, INT ovs)
50
for (i = v; i > 0; i = i - VL, xi = xi + (VL * ivs), xo = xo + (VL * ovs)) {
101
for (i = v; i > 0; i = i - VL, xi = xi + (VL * ivs), xo = xo + (VL * ovs), MAKE_VOLATILE_STRIDE(is), MAKE_VOLATILE_STRIDE(os)) {
65
116
ST(&(xo[WS(os, 3)]), VADD(T3, T6), ovs, &(xo[WS(os, 1)]));
66
117
ST(&(xo[WS(os, 2)]), VSUB(T7, T8), ovs, &(xo[0]));
71
121
static const kdft_desc desc = { 4, "n1fv_4", {8, 0, 0, 0}, &GENUS, 0, 0, 0, 0 };
72
122
void X(codelet_n1fv_4) (planner *p) {
73
123
X(kdft_register) (p, n1fv_4, &desc);
126
#endif /* HAVE_FMA */