annotate src/fftw-3.3.3/dft/indirect.c @ 83:ae30d91d2ffe

Replace these with versions built using an older toolset (so as to avoid ABI compatibilities when linking on Ubuntu 14.04 for packaging purposes)
author Chris Cannam
date Fri, 07 Feb 2020 11:51:13 +0000
parents 37bf6b4a2645
children
rev   line source
Chris@10 1 /*
Chris@10 2 * Copyright (c) 2003, 2007-11 Matteo Frigo
Chris@10 3 * Copyright (c) 2003, 2007-11 Massachusetts Institute of Technology
Chris@10 4 *
Chris@10 5 * This program is free software; you can redistribute it and/or modify
Chris@10 6 * it under the terms of the GNU General Public License as published by
Chris@10 7 * the Free Software Foundation; either version 2 of the License, or
Chris@10 8 * (at your option) any later version.
Chris@10 9 *
Chris@10 10 * This program is distributed in the hope that it will be useful,
Chris@10 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Chris@10 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
Chris@10 13 * GNU General Public License for more details.
Chris@10 14 *
Chris@10 15 * You should have received a copy of the GNU General Public License
Chris@10 16 * along with this program; if not, write to the Free Software
Chris@10 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Chris@10 18 *
Chris@10 19 */
Chris@10 20
Chris@10 21
Chris@10 22
Chris@10 23 /* solvers/plans for vectors of small DFT's that cannot be done
Chris@10 24 in-place directly. Use a rank-0 plan to rearrange the data
Chris@10 25 before or after the transform. Can also change an out-of-place
Chris@10 26 plan into a copy + in-place (where the in-place transform
Chris@10 27 is e.g. unit stride). */
Chris@10 28
Chris@10 29 /* FIXME: merge with rank-geq2.c(?), since this is just a special case
Chris@10 30 of a rank split where the first/second transform has rank 0. */
Chris@10 31
Chris@10 32 #include "dft.h"
Chris@10 33
Chris@10 34 typedef problem *(*mkcld_t) (const problem_dft *p);
Chris@10 35
Chris@10 36 typedef struct {
Chris@10 37 dftapply apply;
Chris@10 38 problem *(*mkcld)(const problem_dft *p);
Chris@10 39 const char *nam;
Chris@10 40 } ndrct_adt;
Chris@10 41
Chris@10 42 typedef struct {
Chris@10 43 solver super;
Chris@10 44 const ndrct_adt *adt;
Chris@10 45 } S;
Chris@10 46
Chris@10 47 typedef struct {
Chris@10 48 plan_dft super;
Chris@10 49 plan *cldcpy, *cld;
Chris@10 50 const S *slv;
Chris@10 51 } P;
Chris@10 52
Chris@10 53 /*-----------------------------------------------------------------------*/
Chris@10 54 /* first rearrange, then transform */
Chris@10 55 static void apply_before(const plan *ego_, R *ri, R *ii, R *ro, R *io)
Chris@10 56 {
Chris@10 57 const P *ego = (const P *) ego_;
Chris@10 58
Chris@10 59 {
Chris@10 60 plan_dft *cldcpy = (plan_dft *) ego->cldcpy;
Chris@10 61 cldcpy->apply(ego->cldcpy, ri, ii, ro, io);
Chris@10 62 }
Chris@10 63 {
Chris@10 64 plan_dft *cld = (plan_dft *) ego->cld;
Chris@10 65 cld->apply(ego->cld, ro, io, ro, io);
Chris@10 66 }
Chris@10 67 }
Chris@10 68
Chris@10 69 static problem *mkcld_before(const problem_dft *p)
Chris@10 70 {
Chris@10 71 return X(mkproblem_dft_d)(X(tensor_copy_inplace)(p->sz, INPLACE_OS),
Chris@10 72 X(tensor_copy_inplace)(p->vecsz, INPLACE_OS),
Chris@10 73 p->ro, p->io, p->ro, p->io);
Chris@10 74 }
Chris@10 75
Chris@10 76 static const ndrct_adt adt_before =
Chris@10 77 {
Chris@10 78 apply_before, mkcld_before, "dft-indirect-before"
Chris@10 79 };
Chris@10 80
Chris@10 81 /*-----------------------------------------------------------------------*/
Chris@10 82 /* first transform, then rearrange */
Chris@10 83
Chris@10 84 static void apply_after(const plan *ego_, R *ri, R *ii, R *ro, R *io)
Chris@10 85 {
Chris@10 86 const P *ego = (const P *) ego_;
Chris@10 87
Chris@10 88 {
Chris@10 89 plan_dft *cld = (plan_dft *) ego->cld;
Chris@10 90 cld->apply(ego->cld, ri, ii, ri, ii);
Chris@10 91 }
Chris@10 92 {
Chris@10 93 plan_dft *cldcpy = (plan_dft *) ego->cldcpy;
Chris@10 94 cldcpy->apply(ego->cldcpy, ri, ii, ro, io);
Chris@10 95 }
Chris@10 96 }
Chris@10 97
Chris@10 98 static problem *mkcld_after(const problem_dft *p)
Chris@10 99 {
Chris@10 100 return X(mkproblem_dft_d)(X(tensor_copy_inplace)(p->sz, INPLACE_IS),
Chris@10 101 X(tensor_copy_inplace)(p->vecsz, INPLACE_IS),
Chris@10 102 p->ri, p->ii, p->ri, p->ii);
Chris@10 103 }
Chris@10 104
Chris@10 105 static const ndrct_adt adt_after =
Chris@10 106 {
Chris@10 107 apply_after, mkcld_after, "dft-indirect-after"
Chris@10 108 };
Chris@10 109
Chris@10 110 /*-----------------------------------------------------------------------*/
Chris@10 111 static void destroy(plan *ego_)
Chris@10 112 {
Chris@10 113 P *ego = (P *) ego_;
Chris@10 114 X(plan_destroy_internal)(ego->cld);
Chris@10 115 X(plan_destroy_internal)(ego->cldcpy);
Chris@10 116 }
Chris@10 117
Chris@10 118 static void awake(plan *ego_, enum wakefulness wakefulness)
Chris@10 119 {
Chris@10 120 P *ego = (P *) ego_;
Chris@10 121 X(plan_awake)(ego->cldcpy, wakefulness);
Chris@10 122 X(plan_awake)(ego->cld, wakefulness);
Chris@10 123 }
Chris@10 124
Chris@10 125 static void print(const plan *ego_, printer *p)
Chris@10 126 {
Chris@10 127 const P *ego = (const P *) ego_;
Chris@10 128 const S *s = ego->slv;
Chris@10 129 p->print(p, "(%s%(%p%)%(%p%))", s->adt->nam, ego->cld, ego->cldcpy);
Chris@10 130 }
Chris@10 131
Chris@10 132 static int applicable0(const solver *ego_, const problem *p_,
Chris@10 133 const planner *plnr)
Chris@10 134 {
Chris@10 135 const S *ego = (const S *) ego_;
Chris@10 136 const problem_dft *p = (const problem_dft *) p_;
Chris@10 137 return (1
Chris@10 138 && FINITE_RNK(p->vecsz->rnk)
Chris@10 139
Chris@10 140 /* problem must be a nontrivial transform, not just a copy */
Chris@10 141 && p->sz->rnk > 0
Chris@10 142
Chris@10 143 && (0
Chris@10 144
Chris@10 145 /* problem must be in-place & require some
Chris@10 146 rearrangement of the data; to prevent
Chris@10 147 infinite loops with indirect-transpose, we
Chris@10 148 further require that at least some transform
Chris@10 149 strides must decrease */
Chris@10 150 || (p->ri == p->ro
Chris@10 151 && !X(tensor_inplace_strides2)(p->sz, p->vecsz)
Chris@10 152 && X(tensor_strides_decrease)(
Chris@10 153 p->sz, p->vecsz,
Chris@10 154 ego->adt->apply == apply_after ?
Chris@10 155 INPLACE_IS : INPLACE_OS))
Chris@10 156
Chris@10 157 /* or problem must be out of place, transforming
Chris@10 158 from stride 1/2 to bigger stride, for apply_after */
Chris@10 159 || (p->ri != p->ro && ego->adt->apply == apply_after
Chris@10 160 && !NO_DESTROY_INPUTP(plnr)
Chris@10 161 && X(tensor_min_istride)(p->sz) <= 2
Chris@10 162 && X(tensor_min_ostride)(p->sz) > 2)
Chris@10 163
Chris@10 164 /* or problem must be out of place, transforming
Chris@10 165 to stride 1/2 from bigger stride, for apply_before */
Chris@10 166 || (p->ri != p->ro && ego->adt->apply == apply_before
Chris@10 167 && X(tensor_min_ostride)(p->sz) <= 2
Chris@10 168 && X(tensor_min_istride)(p->sz) > 2)
Chris@10 169 )
Chris@10 170 );
Chris@10 171 }
Chris@10 172
Chris@10 173 static int applicable(const solver *ego_, const problem *p_,
Chris@10 174 const planner *plnr)
Chris@10 175 {
Chris@10 176 if (!applicable0(ego_, p_, plnr)) return 0;
Chris@10 177 {
Chris@10 178 const problem_dft *p = (const problem_dft *) p_;
Chris@10 179 if (NO_INDIRECT_OP_P(plnr) && p->ri != p->ro) return 0;
Chris@10 180 }
Chris@10 181 return 1;
Chris@10 182 }
Chris@10 183
Chris@10 184 static plan *mkplan(const solver *ego_, const problem *p_, planner *plnr)
Chris@10 185 {
Chris@10 186 const problem_dft *p = (const problem_dft *) p_;
Chris@10 187 const S *ego = (const S *) ego_;
Chris@10 188 P *pln;
Chris@10 189 plan *cld = 0, *cldcpy = 0;
Chris@10 190
Chris@10 191 static const plan_adt padt = {
Chris@10 192 X(dft_solve), awake, print, destroy
Chris@10 193 };
Chris@10 194
Chris@10 195 if (!applicable(ego_, p_, plnr))
Chris@10 196 return (plan *) 0;
Chris@10 197
Chris@10 198 cldcpy =
Chris@10 199 X(mkplan_d)(plnr,
Chris@10 200 X(mkproblem_dft_d)(X(mktensor_0d)(),
Chris@10 201 X(tensor_append)(p->vecsz, p->sz),
Chris@10 202 p->ri, p->ii, p->ro, p->io));
Chris@10 203
Chris@10 204 if (!cldcpy) goto nada;
Chris@10 205
Chris@10 206 cld = X(mkplan_f_d)(plnr, ego->adt->mkcld(p), NO_BUFFERING, 0, 0);
Chris@10 207 if (!cld) goto nada;
Chris@10 208
Chris@10 209 pln = MKPLAN_DFT(P, &padt, ego->adt->apply);
Chris@10 210 pln->cld = cld;
Chris@10 211 pln->cldcpy = cldcpy;
Chris@10 212 pln->slv = ego;
Chris@10 213 X(ops_add)(&cld->ops, &cldcpy->ops, &pln->super.super.ops);
Chris@10 214
Chris@10 215 return &(pln->super.super);
Chris@10 216
Chris@10 217 nada:
Chris@10 218 X(plan_destroy_internal)(cld);
Chris@10 219 X(plan_destroy_internal)(cldcpy);
Chris@10 220 return (plan *)0;
Chris@10 221 }
Chris@10 222
Chris@10 223 static solver *mksolver(const ndrct_adt *adt)
Chris@10 224 {
Chris@10 225 static const solver_adt sadt = { PROBLEM_DFT, mkplan, 0 };
Chris@10 226 S *slv = MKSOLVER(S, &sadt);
Chris@10 227 slv->adt = adt;
Chris@10 228 return &(slv->super);
Chris@10 229 }
Chris@10 230
Chris@10 231 void X(dft_indirect_register)(planner *p)
Chris@10 232 {
Chris@10 233 unsigned i;
Chris@10 234 static const ndrct_adt *const adts[] = {
Chris@10 235 &adt_before, &adt_after
Chris@10 236 };
Chris@10 237
Chris@10 238 for (i = 0; i < sizeof(adts) / sizeof(adts[0]); ++i)
Chris@10 239 REGISTER_SOLVER(p, mksolver(adts[i]));
Chris@10 240 }