Chris@10: /* Chris@10: * Copyright (c) 2003, 2007-11 Matteo Frigo Chris@10: * Copyright (c) 2003, 2007-11 Massachusetts Institute of Technology Chris@10: * Chris@10: * This program is free software; you can redistribute it and/or modify Chris@10: * it under the terms of the GNU General Public License as published by Chris@10: * the Free Software Foundation; either version 2 of the License, or Chris@10: * (at your option) any later version. Chris@10: * Chris@10: * This program is distributed in the hope that it will be useful, Chris@10: * but WITHOUT ANY WARRANTY; without even the implied warranty of Chris@10: * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the Chris@10: * GNU General Public License for more details. Chris@10: * Chris@10: * You should have received a copy of the GNU General Public License Chris@10: * along with this program; if not, write to the Free Software Chris@10: * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA Chris@10: * Chris@10: */ Chris@10: Chris@10: #ifndef __RDFT_H__ Chris@10: #define __RDFT_H__ Chris@10: Chris@10: #include "ifftw.h" Chris@10: #include "codelet-rdft.h" Chris@10: Chris@10: #ifdef __cplusplus Chris@10: extern "C" Chris@10: { Chris@10: #endif /* __cplusplus */ Chris@10: Chris@10: /* problem.c: */ Chris@10: typedef struct { Chris@10: problem super; Chris@10: tensor *sz, *vecsz; Chris@10: R *I, *O; Chris@10: #if defined(STRUCT_HACK_KR) Chris@10: rdft_kind kind[1]; Chris@10: #elif defined(STRUCT_HACK_C99) Chris@10: rdft_kind kind[]; Chris@10: #else Chris@10: rdft_kind *kind; Chris@10: #endif Chris@10: } problem_rdft; Chris@10: Chris@10: void X(rdft_zerotens)(tensor *sz, R *I); Chris@10: problem *X(mkproblem_rdft)(const tensor *sz, const tensor *vecsz, Chris@10: R *I, R *O, const rdft_kind *kind); Chris@10: problem *X(mkproblem_rdft_d)(tensor *sz, tensor *vecsz, Chris@10: R *I, R *O, const rdft_kind *kind); Chris@10: problem *X(mkproblem_rdft_0_d)(tensor *vecsz, R *I, R *O); Chris@10: problem *X(mkproblem_rdft_1)(const tensor *sz, const tensor *vecsz, Chris@10: R *I, R *O, rdft_kind kind); Chris@10: problem *X(mkproblem_rdft_1_d)(tensor *sz, tensor *vecsz, Chris@10: R *I, R *O, rdft_kind kind); Chris@10: Chris@10: const char *X(rdft_kind_str)(rdft_kind kind); Chris@10: Chris@10: /* solve.c: */ Chris@10: void X(rdft_solve)(const plan *ego_, const problem *p_); Chris@10: Chris@10: /* plan.c: */ Chris@10: typedef void (*rdftapply) (const plan *ego, R *I, R *O); Chris@10: Chris@10: typedef struct { Chris@10: plan super; Chris@10: rdftapply apply; Chris@10: } plan_rdft; Chris@10: Chris@10: plan *X(mkplan_rdft)(size_t size, const plan_adt *adt, rdftapply apply); Chris@10: Chris@10: #define MKPLAN_RDFT(type, adt, apply) \ Chris@10: (type *)X(mkplan_rdft)(sizeof(type), adt, apply) Chris@10: Chris@10: /* various solvers */ Chris@10: Chris@10: solver *X(mksolver_rdft_r2c_direct)(kr2c k, const kr2c_desc *desc); Chris@10: solver *X(mksolver_rdft_r2c_directbuf)(kr2c k, const kr2c_desc *desc); Chris@10: solver *X(mksolver_rdft_r2r_direct)(kr2r k, const kr2r_desc *desc); Chris@10: Chris@10: void X(rdft_rank0_register)(planner *p); Chris@10: void X(rdft_vrank3_transpose_register)(planner *p); Chris@10: void X(rdft_rank_geq2_register)(planner *p); Chris@10: void X(rdft_indirect_register)(planner *p); Chris@10: void X(rdft_vrank_geq1_register)(planner *p); Chris@10: void X(rdft_buffered_register)(planner *p); Chris@10: void X(rdft_generic_register)(planner *p); Chris@10: void X(rdft_rader_hc2hc_register)(planner *p); Chris@10: void X(rdft_dht_register)(planner *p); Chris@10: void X(dht_r2hc_register)(planner *p); Chris@10: void X(dht_rader_register)(planner *p); Chris@10: void X(dft_r2hc_register)(planner *p); Chris@10: void X(rdft_nop_register)(planner *p); Chris@10: void X(hc2hc_generic_register)(planner *p); Chris@10: Chris@10: /****************************************************************************/ Chris@10: /* problem2.c: */ Chris@10: /* Chris@10: An RDFT2 problem transforms a 1d real array r[n] with stride is/os Chris@10: to/from an "unpacked" complex array {rio,iio}[n/2 + 1] with stride Chris@10: os/is. R0 points to the first even element of the real array. Chris@10: R1 points to the first odd element of the real array. Chris@10: Chris@10: Strides on the real side of the transform express distances Chris@10: between consecutive elements of the same array (even or odd). Chris@10: E.g., for a contiguous input Chris@10: Chris@10: R0 R1 R2 R3 ... Chris@10: Chris@10: the input stride would be 2, not 1. This convention is necessary Chris@10: for hc2c codelets to work, since they transpose even/odd with Chris@10: real/imag. Chris@10: Chris@10: Multidimensional transforms use complex DFTs for the Chris@10: noncontiguous dimensions. vecsz has the usual interpretation. Chris@10: */ Chris@10: typedef struct { Chris@10: problem super; Chris@10: tensor *sz; Chris@10: tensor *vecsz; Chris@10: R *r0, *r1; Chris@10: R *cr, *ci; Chris@10: rdft_kind kind; /* assert(kind < DHT) */ Chris@10: } problem_rdft2; Chris@10: Chris@10: problem *X(mkproblem_rdft2)(const tensor *sz, const tensor *vecsz, Chris@10: R *r0, R *r1, R *cr, R *ci, rdft_kind kind); Chris@10: problem *X(mkproblem_rdft2_d)(tensor *sz, tensor *vecsz, Chris@10: R *r0, R *r1, R *cr, R *ci, rdft_kind kind); Chris@10: problem *X(mkproblem_rdft2_d_3pointers)(tensor *sz, tensor *vecsz, Chris@10: R *r, R *cr, R *ci, rdft_kind kind); Chris@10: int X(rdft2_inplace_strides)(const problem_rdft2 *p, int vdim); Chris@10: INT X(rdft2_tensor_max_index)(const tensor *sz, rdft_kind k); Chris@10: void X(rdft2_strides)(rdft_kind kind, const iodim *d, INT *rs, INT *cs); Chris@10: INT X(rdft2_complex_n)(INT real_n, rdft_kind kind); Chris@10: Chris@10: /* verify.c: */ Chris@10: void X(rdft2_verify)(plan *pln, const problem_rdft2 *p, int rounds); Chris@10: Chris@10: /* solve.c: */ Chris@10: void X(rdft2_solve)(const plan *ego_, const problem *p_); Chris@10: Chris@10: /* plan.c: */ Chris@10: typedef void (*rdft2apply) (const plan *ego, R *r0, R *r1, R *cr, R *ci); Chris@10: Chris@10: typedef struct { Chris@10: plan super; Chris@10: rdft2apply apply; Chris@10: } plan_rdft2; Chris@10: Chris@10: plan *X(mkplan_rdft2)(size_t size, const plan_adt *adt, rdft2apply apply); Chris@10: Chris@10: #define MKPLAN_RDFT2(type, adt, apply) \ Chris@10: (type *)X(mkplan_rdft2)(sizeof(type), adt, apply) Chris@10: Chris@10: /* various solvers */ Chris@10: Chris@10: solver *X(mksolver_rdft2_direct)(kr2c k, const kr2c_desc *desc); Chris@10: Chris@10: void X(rdft2_vrank_geq1_register)(planner *p); Chris@10: void X(rdft2_buffered_register)(planner *p); Chris@10: void X(rdft2_rdft_register)(planner *p); Chris@10: void X(rdft2_nop_register)(planner *p); Chris@10: void X(rdft2_rank0_register)(planner *p); Chris@10: void X(rdft2_rank_geq2_register)(planner *p); Chris@10: Chris@10: /****************************************************************************/ Chris@10: Chris@10: /* configurations */ Chris@10: void X(rdft_conf_standard)(planner *p); Chris@10: Chris@10: #ifdef __cplusplus Chris@10: } /* extern "C" */ Chris@10: #endif /* __cplusplus */ Chris@10: Chris@10: #endif /* __RDFT_H__ */