forked from FFTW/fftw3
-
Notifications
You must be signed in to change notification settings - Fork 0
/
rdft.h
176 lines (143 loc) · 5.56 KB
/
rdft.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
/*
* Copyright (c) 2003, 2007-14 Matteo Frigo
* Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*
*/
#ifndef __RDFT_H__
#define __RDFT_H__
#include "kernel/ifftw.h"
#include "rdft/codelet-rdft.h"
#ifdef __cplusplus
extern "C"
{
#endif /* __cplusplus */
/* problem.c: */
typedef struct {
problem super;
tensor *sz, *vecsz;
R *I, *O;
#if defined(STRUCT_HACK_KR)
rdft_kind kind[1];
#elif defined(STRUCT_HACK_C99)
rdft_kind kind[];
#else
rdft_kind *kind;
#endif
} problem_rdft;
void X(rdft_zerotens)(tensor *sz, R *I);
problem *X(mkproblem_rdft)(const tensor *sz, const tensor *vecsz,
R *I, R *O, const rdft_kind *kind);
problem *X(mkproblem_rdft_d)(tensor *sz, tensor *vecsz,
R *I, R *O, const rdft_kind *kind);
problem *X(mkproblem_rdft_0_d)(tensor *vecsz, R *I, R *O);
problem *X(mkproblem_rdft_1)(const tensor *sz, const tensor *vecsz,
R *I, R *O, rdft_kind kind);
problem *X(mkproblem_rdft_1_d)(tensor *sz, tensor *vecsz,
R *I, R *O, rdft_kind kind);
const char *X(rdft_kind_str)(rdft_kind kind);
/* solve.c: */
void X(rdft_solve)(const plan *ego_, const problem *p_);
/* plan.c: */
typedef void (*rdftapply) (const plan *ego, R *I, R *O);
typedef struct {
plan super;
rdftapply apply;
} plan_rdft;
plan *X(mkplan_rdft)(size_t size, const plan_adt *adt, rdftapply apply);
#define MKPLAN_RDFT(type, adt, apply) \
(type *)X(mkplan_rdft)(sizeof(type), adt, apply)
/* various solvers */
solver *X(mksolver_rdft_r2c_direct)(kr2c k, const kr2c_desc *desc);
solver *X(mksolver_rdft_r2c_directbuf)(kr2c k, const kr2c_desc *desc);
solver *X(mksolver_rdft_r2r_direct)(kr2r k, const kr2r_desc *desc);
void X(rdft_rank0_register)(planner *p);
void X(rdft_vrank3_transpose_register)(planner *p);
void X(rdft_rank_geq2_register)(planner *p);
void X(rdft_indirect_register)(planner *p);
void X(rdft_vrank_geq1_register)(planner *p);
void X(rdft_buffered_register)(planner *p);
void X(rdft_generic_register)(planner *p);
void X(rdft_rader_hc2hc_register)(planner *p);
void X(rdft_dht_register)(planner *p);
void X(dht_r2hc_register)(planner *p);
void X(dht_rader_register)(planner *p);
void X(dft_r2hc_register)(planner *p);
void X(rdft_nop_register)(planner *p);
void X(hc2hc_generic_register)(planner *p);
/****************************************************************************/
/* problem2.c: */
/*
An RDFT2 problem transforms a 1d real array r[n] with stride is/os
to/from an "unpacked" complex array {rio,iio}[n/2 + 1] with stride
os/is. R0 points to the first even element of the real array.
R1 points to the first odd element of the real array.
Strides on the real side of the transform express distances
between consecutive elements of the same array (even or odd).
E.g., for a contiguous input
R0 R1 R2 R3 ...
the input stride would be 2, not 1. This convention is necessary
for hc2c codelets to work, since they transpose even/odd with
real/imag.
Multidimensional transforms use complex DFTs for the
noncontiguous dimensions. vecsz has the usual interpretation.
*/
typedef struct {
problem super;
tensor *sz;
tensor *vecsz;
R *r0, *r1;
R *cr, *ci;
rdft_kind kind; /* assert(kind < DHT) */
} problem_rdft2;
problem *X(mkproblem_rdft2)(const tensor *sz, const tensor *vecsz,
R *r0, R *r1, R *cr, R *ci, rdft_kind kind);
problem *X(mkproblem_rdft2_d)(tensor *sz, tensor *vecsz,
R *r0, R *r1, R *cr, R *ci, rdft_kind kind);
problem *X(mkproblem_rdft2_d_3pointers)(tensor *sz, tensor *vecsz,
R *r, R *cr, R *ci, rdft_kind kind);
int X(rdft2_inplace_strides)(const problem_rdft2 *p, int vdim);
INT X(rdft2_tensor_max_index)(const tensor *sz, rdft_kind k);
void X(rdft2_strides)(rdft_kind kind, const iodim *d, INT *rs, INT *cs);
INT X(rdft2_complex_n)(INT real_n, rdft_kind kind);
/* verify.c: */
void X(rdft2_verify)(plan *pln, const problem_rdft2 *p, int rounds);
/* solve.c: */
void X(rdft2_solve)(const plan *ego_, const problem *p_);
/* plan.c: */
typedef void (*rdft2apply) (const plan *ego, R *r0, R *r1, R *cr, R *ci);
typedef struct {
plan super;
rdft2apply apply;
} plan_rdft2;
plan *X(mkplan_rdft2)(size_t size, const plan_adt *adt, rdft2apply apply);
#define MKPLAN_RDFT2(type, adt, apply) \
(type *)X(mkplan_rdft2)(sizeof(type), adt, apply)
/* various solvers */
solver *X(mksolver_rdft2_direct)(kr2c k, const kr2c_desc *desc);
void X(rdft2_vrank_geq1_register)(planner *p);
void X(rdft2_buffered_register)(planner *p);
void X(rdft2_rdft_register)(planner *p);
void X(rdft2_nop_register)(planner *p);
void X(rdft2_rank0_register)(planner *p);
void X(rdft2_rank_geq2_register)(planner *p);
/****************************************************************************/
/* configurations */
void X(rdft_conf_standard)(planner *p);
#ifdef __cplusplus
} /* extern "C" */
#endif /* __cplusplus */
#endif /* __RDFT_H__ */