annotate src/fftw-3.3.5/dft/dftw-generic.c @ 84:08ae793730bd

Add null config files
author Chris Cannam
date Mon, 02 Mar 2020 14:03:47 +0000
parents 2cd0e3b3e1fd
children
rev   line source
Chris@42 1 /*
Chris@42 2 * Copyright (c) 2003, 2007-14 Matteo Frigo
Chris@42 3 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
Chris@42 4 *
Chris@42 5 * This program is free software; you can redistribute it and/or modify
Chris@42 6 * it under the terms of the GNU General Public License as published by
Chris@42 7 * the Free Software Foundation; either version 2 of the License, or
Chris@42 8 * (at your option) any later version.
Chris@42 9 *
Chris@42 10 * This program is distributed in the hope that it will be useful,
Chris@42 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Chris@42 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
Chris@42 13 * GNU General Public License for more details.
Chris@42 14 *
Chris@42 15 * You should have received a copy of the GNU General Public License
Chris@42 16 * along with this program; if not, write to the Free Software
Chris@42 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Chris@42 18 *
Chris@42 19 */
Chris@42 20
Chris@42 21 /* express a twiddle problem in terms of dft + multiplication by
Chris@42 22 twiddle factors */
Chris@42 23
Chris@42 24 #include "ct.h"
Chris@42 25
Chris@42 26 typedef ct_solver S;
Chris@42 27
Chris@42 28 typedef struct {
Chris@42 29 plan_dftw super;
Chris@42 30
Chris@42 31 INT r, rs, m, mb, me, ms, v, vs;
Chris@42 32
Chris@42 33 plan *cld;
Chris@42 34
Chris@42 35 twid *td;
Chris@42 36
Chris@42 37 const S *slv;
Chris@42 38 int dec;
Chris@42 39 } P;
Chris@42 40
Chris@42 41 static void mktwiddle(P *ego, enum wakefulness wakefulness)
Chris@42 42 {
Chris@42 43 static const tw_instr tw[] = { { TW_FULL, 0, 0 }, { TW_NEXT, 1, 0 } };
Chris@42 44
Chris@42 45 /* note that R and M are swapped, to allow for sequential
Chris@42 46 access both to data and twiddles */
Chris@42 47 X(twiddle_awake)(wakefulness, &ego->td, tw,
Chris@42 48 ego->r * ego->m, ego->m, ego->r);
Chris@42 49 }
Chris@42 50
Chris@42 51 static void bytwiddle(const P *ego, R *rio, R *iio)
Chris@42 52 {
Chris@42 53 INT iv, ir, im;
Chris@42 54 INT r = ego->r, rs = ego->rs;
Chris@42 55 INT m = ego->m, mb = ego->mb, me = ego->me, ms = ego->ms;
Chris@42 56 INT v = ego->v, vs = ego->vs;
Chris@42 57 const R *W = ego->td->W;
Chris@42 58
Chris@42 59 mb += (mb == 0); /* skip m=0 iteration */
Chris@42 60 for (iv = 0; iv < v; ++iv) {
Chris@42 61 for (ir = 1; ir < r; ++ir) {
Chris@42 62 for (im = mb; im < me; ++im) {
Chris@42 63 R *pr = rio + ms * im + rs * ir;
Chris@42 64 R *pi = iio + ms * im + rs * ir;
Chris@42 65 E xr = *pr;
Chris@42 66 E xi = *pi;
Chris@42 67 E wr = W[2 * im + (2 * (m-1)) * ir - 2];
Chris@42 68 E wi = W[2 * im + (2 * (m-1)) * ir - 1];
Chris@42 69 *pr = xr * wr + xi * wi;
Chris@42 70 *pi = xi * wr - xr * wi;
Chris@42 71 }
Chris@42 72 }
Chris@42 73 rio += vs;
Chris@42 74 iio += vs;
Chris@42 75 }
Chris@42 76 }
Chris@42 77
Chris@42 78 static int applicable(INT irs, INT ors, INT ivs, INT ovs,
Chris@42 79 const planner *plnr)
Chris@42 80 {
Chris@42 81 return (1
Chris@42 82 && irs == ors
Chris@42 83 && ivs == ovs
Chris@42 84 && !NO_SLOWP(plnr)
Chris@42 85 );
Chris@42 86 }
Chris@42 87
Chris@42 88 static void apply_dit(const plan *ego_, R *rio, R *iio)
Chris@42 89 {
Chris@42 90 const P *ego = (const P *) ego_;
Chris@42 91 plan_dft *cld;
Chris@42 92 INT dm = ego->ms * ego->mb;
Chris@42 93
Chris@42 94 bytwiddle(ego, rio, iio);
Chris@42 95
Chris@42 96 cld = (plan_dft *) ego->cld;
Chris@42 97 cld->apply(ego->cld, rio + dm, iio + dm, rio + dm, iio + dm);
Chris@42 98 }
Chris@42 99
Chris@42 100 static void apply_dif(const plan *ego_, R *rio, R *iio)
Chris@42 101 {
Chris@42 102 const P *ego = (const P *) ego_;
Chris@42 103 plan_dft *cld;
Chris@42 104 INT dm = ego->ms * ego->mb;
Chris@42 105
Chris@42 106 cld = (plan_dft *) ego->cld;
Chris@42 107 cld->apply(ego->cld, rio + dm, iio + dm, rio + dm, iio + dm);
Chris@42 108
Chris@42 109 bytwiddle(ego, rio, iio);
Chris@42 110 }
Chris@42 111
Chris@42 112 static void awake(plan *ego_, enum wakefulness wakefulness)
Chris@42 113 {
Chris@42 114 P *ego = (P *) ego_;
Chris@42 115 X(plan_awake)(ego->cld, wakefulness);
Chris@42 116 mktwiddle(ego, wakefulness);
Chris@42 117 }
Chris@42 118
Chris@42 119 static void destroy(plan *ego_)
Chris@42 120 {
Chris@42 121 P *ego = (P *) ego_;
Chris@42 122 X(plan_destroy_internal)(ego->cld);
Chris@42 123 }
Chris@42 124
Chris@42 125 static void print(const plan *ego_, printer *p)
Chris@42 126 {
Chris@42 127 const P *ego = (const P *) ego_;
Chris@42 128 p->print(p, "(dftw-generic-%s-%D-%D%v%(%p%))",
Chris@42 129 ego->dec == DECDIT ? "dit" : "dif",
Chris@42 130 ego->r, ego->m, ego->v, ego->cld);
Chris@42 131 }
Chris@42 132
Chris@42 133 static plan *mkcldw(const ct_solver *ego_,
Chris@42 134 INT r, INT irs, INT ors,
Chris@42 135 INT m, INT ms,
Chris@42 136 INT v, INT ivs, INT ovs,
Chris@42 137 INT mstart, INT mcount,
Chris@42 138 R *rio, R *iio,
Chris@42 139 planner *plnr)
Chris@42 140 {
Chris@42 141 const S *ego = (const S *)ego_;
Chris@42 142 P *pln;
Chris@42 143 plan *cld = 0;
Chris@42 144 INT dm = ms * mstart;
Chris@42 145
Chris@42 146 static const plan_adt padt = {
Chris@42 147 0, awake, print, destroy
Chris@42 148 };
Chris@42 149
Chris@42 150 A(mstart >= 0 && mstart + mcount <= m);
Chris@42 151 if (!applicable(irs, ors, ivs, ovs, plnr))
Chris@42 152 return (plan *)0;
Chris@42 153
Chris@42 154 cld = X(mkplan_d)(plnr,
Chris@42 155 X(mkproblem_dft_d)(
Chris@42 156 X(mktensor_1d)(r, irs, irs),
Chris@42 157 X(mktensor_2d)(mcount, ms, ms, v, ivs, ivs),
Chris@42 158 rio + dm, iio + dm, rio + dm, iio + dm)
Chris@42 159 );
Chris@42 160 if (!cld) goto nada;
Chris@42 161
Chris@42 162 pln = MKPLAN_DFTW(P, &padt, ego->dec == DECDIT ? apply_dit : apply_dif);
Chris@42 163 pln->slv = ego;
Chris@42 164 pln->cld = cld;
Chris@42 165 pln->r = r;
Chris@42 166 pln->rs = irs;
Chris@42 167 pln->m = m;
Chris@42 168 pln->ms = ms;
Chris@42 169 pln->v = v;
Chris@42 170 pln->vs = ivs;
Chris@42 171 pln->mb = mstart;
Chris@42 172 pln->me = mstart + mcount;
Chris@42 173 pln->dec = ego->dec;
Chris@42 174 pln->td = 0;
Chris@42 175
Chris@42 176 {
Chris@42 177 double n0 = (r - 1) * (mcount - 1) * v;
Chris@42 178 pln->super.super.ops = cld->ops;
Chris@42 179 pln->super.super.ops.mul += 8 * n0;
Chris@42 180 pln->super.super.ops.add += 4 * n0;
Chris@42 181 pln->super.super.ops.other += 8 * n0;
Chris@42 182 }
Chris@42 183 return &(pln->super.super);
Chris@42 184
Chris@42 185 nada:
Chris@42 186 X(plan_destroy_internal)(cld);
Chris@42 187 return (plan *) 0;
Chris@42 188 }
Chris@42 189
Chris@42 190 static void regsolver(planner *plnr, INT r, int dec)
Chris@42 191 {
Chris@42 192 S *slv = (S *)X(mksolver_ct)(sizeof(S), r, dec, mkcldw, 0);
Chris@42 193 REGISTER_SOLVER(plnr, &(slv->super));
Chris@42 194 if (X(mksolver_ct_hook)) {
Chris@42 195 slv = (S *)X(mksolver_ct_hook)(sizeof(S), r, dec, mkcldw, 0);
Chris@42 196 REGISTER_SOLVER(plnr, &(slv->super));
Chris@42 197 }
Chris@42 198 }
Chris@42 199
Chris@42 200 void X(ct_generic_register)(planner *p)
Chris@42 201 {
Chris@42 202 regsolver(p, 0, DECDIT);
Chris@42 203 regsolver(p, 0, DECDIF);
Chris@42 204 }