annotate fft/fftw/fftw-3.3.4/rdft/ct-hc2c.c @ 40:223f770b5341 kissfft-double tip

Try a double-precision kissfft
author Chris Cannam
date Wed, 07 Sep 2016 10:40:32 +0100
parents 26056e866c29
children
rev   line source
Chris@19 1 /*
Chris@19 2 * Copyright (c) 2003, 2007-14 Matteo Frigo
Chris@19 3 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
Chris@19 4 *
Chris@19 5 * This program is free software; you can redistribute it and/or modify
Chris@19 6 * it under the terms of the GNU General Public License as published by
Chris@19 7 * the Free Software Foundation; either version 2 of the License, or
Chris@19 8 * (at your option) any later version.
Chris@19 9 *
Chris@19 10 * This program is distributed in the hope that it will be useful,
Chris@19 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Chris@19 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
Chris@19 13 * GNU General Public License for more details.
Chris@19 14 *
Chris@19 15 * You should have received a copy of the GNU General Public License
Chris@19 16 * along with this program; if not, write to the Free Software
Chris@19 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Chris@19 18 *
Chris@19 19 */
Chris@19 20
Chris@19 21 #include "ct-hc2c.h"
Chris@19 22 #include "dft.h"
Chris@19 23
Chris@19 24 typedef struct {
Chris@19 25 plan_rdft2 super;
Chris@19 26 plan *cld;
Chris@19 27 plan *cldw;
Chris@19 28 INT r;
Chris@19 29 } P;
Chris@19 30
Chris@19 31 static void apply_dit(const plan *ego_, R *r0, R *r1, R *cr, R *ci)
Chris@19 32 {
Chris@19 33 const P *ego = (const P *) ego_;
Chris@19 34 plan_rdft *cld;
Chris@19 35 plan_hc2c *cldw;
Chris@19 36 UNUSED(r1);
Chris@19 37
Chris@19 38 cld = (plan_rdft *) ego->cld;
Chris@19 39 cld->apply(ego->cld, r0, cr);
Chris@19 40
Chris@19 41 cldw = (plan_hc2c *) ego->cldw;
Chris@19 42 cldw->apply(ego->cldw, cr, ci);
Chris@19 43 }
Chris@19 44
Chris@19 45 static void apply_dif(const plan *ego_, R *r0, R *r1, R *cr, R *ci)
Chris@19 46 {
Chris@19 47 const P *ego = (const P *) ego_;
Chris@19 48 plan_rdft *cld;
Chris@19 49 plan_hc2c *cldw;
Chris@19 50 UNUSED(r1);
Chris@19 51
Chris@19 52 cldw = (plan_hc2c *) ego->cldw;
Chris@19 53 cldw->apply(ego->cldw, cr, ci);
Chris@19 54
Chris@19 55 cld = (plan_rdft *) ego->cld;
Chris@19 56 cld->apply(ego->cld, cr, r0);
Chris@19 57 }
Chris@19 58
Chris@19 59 static void apply_dit_dft(const plan *ego_, R *r0, R *r1, R *cr, R *ci)
Chris@19 60 {
Chris@19 61 const P *ego = (const P *) ego_;
Chris@19 62 plan_dft *cld;
Chris@19 63 plan_hc2c *cldw;
Chris@19 64
Chris@19 65 cld = (plan_dft *) ego->cld;
Chris@19 66 cld->apply(ego->cld, r0, r1, cr, ci);
Chris@19 67
Chris@19 68 cldw = (plan_hc2c *) ego->cldw;
Chris@19 69 cldw->apply(ego->cldw, cr, ci);
Chris@19 70 }
Chris@19 71
Chris@19 72 static void apply_dif_dft(const plan *ego_, R *r0, R *r1, R *cr, R *ci)
Chris@19 73 {
Chris@19 74 const P *ego = (const P *) ego_;
Chris@19 75 plan_dft *cld;
Chris@19 76 plan_hc2c *cldw;
Chris@19 77
Chris@19 78 cldw = (plan_hc2c *) ego->cldw;
Chris@19 79 cldw->apply(ego->cldw, cr, ci);
Chris@19 80
Chris@19 81 cld = (plan_dft *) ego->cld;
Chris@19 82 cld->apply(ego->cld, ci, cr, r1, r0);
Chris@19 83 }
Chris@19 84
Chris@19 85 static void awake(plan *ego_, enum wakefulness wakefulness)
Chris@19 86 {
Chris@19 87 P *ego = (P *) ego_;
Chris@19 88 X(plan_awake)(ego->cld, wakefulness);
Chris@19 89 X(plan_awake)(ego->cldw, wakefulness);
Chris@19 90 }
Chris@19 91
Chris@19 92 static void destroy(plan *ego_)
Chris@19 93 {
Chris@19 94 P *ego = (P *) ego_;
Chris@19 95 X(plan_destroy_internal)(ego->cldw);
Chris@19 96 X(plan_destroy_internal)(ego->cld);
Chris@19 97 }
Chris@19 98
Chris@19 99 static void print(const plan *ego_, printer *p)
Chris@19 100 {
Chris@19 101 const P *ego = (const P *) ego_;
Chris@19 102 p->print(p, "(rdft2-ct-%s/%D%(%p%)%(%p%))",
Chris@19 103 (ego->super.apply == apply_dit ||
Chris@19 104 ego->super.apply == apply_dit_dft)
Chris@19 105 ? "dit" : "dif",
Chris@19 106 ego->r, ego->cldw, ego->cld);
Chris@19 107 }
Chris@19 108
Chris@19 109 static int applicable0(const hc2c_solver *ego, const problem *p_, planner *plnr)
Chris@19 110 {
Chris@19 111 const problem_rdft2 *p = (const problem_rdft2 *) p_;
Chris@19 112 INT r;
Chris@19 113
Chris@19 114 return (1
Chris@19 115 && p->sz->rnk == 1
Chris@19 116 && p->vecsz->rnk <= 1
Chris@19 117
Chris@19 118 && (/* either the problem is R2HC, which is solved by DIT */
Chris@19 119 (p->kind == R2HC)
Chris@19 120 ||
Chris@19 121 /* or the problem is HC2R, in which case it is solved
Chris@19 122 by DIF, which destroys the input */
Chris@19 123 (p->kind == HC2R &&
Chris@19 124 (p->r0 == p->cr || !NO_DESTROY_INPUTP(plnr))))
Chris@19 125
Chris@19 126 && ((r = X(choose_radix)(ego->r, p->sz->dims[0].n)) > 0)
Chris@19 127 && p->sz->dims[0].n > r);
Chris@19 128 }
Chris@19 129
Chris@19 130 int X(hc2c_applicable)(const hc2c_solver *ego, const problem *p_,
Chris@19 131 planner *plnr)
Chris@19 132 {
Chris@19 133 const problem_rdft2 *p;
Chris@19 134
Chris@19 135 if (!applicable0(ego, p_, plnr))
Chris@19 136 return 0;
Chris@19 137
Chris@19 138 p = (const problem_rdft2 *) p_;
Chris@19 139
Chris@19 140 return (0
Chris@19 141 || p->vecsz->rnk == 0
Chris@19 142 || !NO_VRECURSEP(plnr)
Chris@19 143 );
Chris@19 144 }
Chris@19 145
Chris@19 146 static plan *mkplan(const solver *ego_, const problem *p_, planner *plnr)
Chris@19 147 {
Chris@19 148 const hc2c_solver *ego = (const hc2c_solver *) ego_;
Chris@19 149 const problem_rdft2 *p;
Chris@19 150 P *pln = 0;
Chris@19 151 plan *cld = 0, *cldw = 0;
Chris@19 152 INT n, r, m, v, ivs, ovs;
Chris@19 153 iodim *d;
Chris@19 154
Chris@19 155 static const plan_adt padt = {
Chris@19 156 X(rdft2_solve), awake, print, destroy
Chris@19 157 };
Chris@19 158
Chris@19 159 if (!X(hc2c_applicable)(ego, p_, plnr))
Chris@19 160 return (plan *) 0;
Chris@19 161
Chris@19 162 p = (const problem_rdft2 *) p_;
Chris@19 163 d = p->sz->dims;
Chris@19 164 n = d[0].n;
Chris@19 165 r = X(choose_radix)(ego->r, n);
Chris@19 166 A((r % 2) == 0);
Chris@19 167 m = n / r;
Chris@19 168
Chris@19 169 X(tensor_tornk1)(p->vecsz, &v, &ivs, &ovs);
Chris@19 170
Chris@19 171 switch (p->kind) {
Chris@19 172 case R2HC:
Chris@19 173 cldw = ego->mkcldw(ego, R2HC,
Chris@19 174 r, m * d[0].os,
Chris@19 175 m, d[0].os,
Chris@19 176 v, ovs,
Chris@19 177 p->cr, p->ci, plnr);
Chris@19 178 if (!cldw) goto nada;
Chris@19 179
Chris@19 180 switch (ego->hc2ckind) {
Chris@19 181 case HC2C_VIA_RDFT:
Chris@19 182 cld = X(mkplan_d)(
Chris@19 183 plnr,
Chris@19 184 X(mkproblem_rdft_1_d)(
Chris@19 185 X(mktensor_1d)(m, (r/2)*d[0].is, d[0].os),
Chris@19 186 X(mktensor_3d)(
Chris@19 187 2, p->r1 - p->r0, p->ci - p->cr,
Chris@19 188 r / 2, d[0].is, m * d[0].os,
Chris@19 189 v, ivs, ovs),
Chris@19 190 p->r0, p->cr, R2HC)
Chris@19 191 );
Chris@19 192 if (!cld) goto nada;
Chris@19 193
Chris@19 194 pln = MKPLAN_RDFT2(P, &padt, apply_dit);
Chris@19 195 break;
Chris@19 196
Chris@19 197 case HC2C_VIA_DFT:
Chris@19 198 cld = X(mkplan_d)(
Chris@19 199 plnr,
Chris@19 200 X(mkproblem_dft_d)(
Chris@19 201 X(mktensor_1d)(m, (r/2)*d[0].is, d[0].os),
Chris@19 202 X(mktensor_2d)(
Chris@19 203 r / 2, d[0].is, m * d[0].os,
Chris@19 204 v, ivs, ovs),
Chris@19 205 p->r0, p->r1, p->cr, p->ci)
Chris@19 206 );
Chris@19 207 if (!cld) goto nada;
Chris@19 208
Chris@19 209 pln = MKPLAN_RDFT2(P, &padt, apply_dit_dft);
Chris@19 210 break;
Chris@19 211 }
Chris@19 212 break;
Chris@19 213
Chris@19 214 case HC2R:
Chris@19 215 cldw = ego->mkcldw(ego, HC2R,
Chris@19 216 r, m * d[0].is,
Chris@19 217 m, d[0].is,
Chris@19 218 v, ivs,
Chris@19 219 p->cr, p->ci, plnr);
Chris@19 220 if (!cldw) goto nada;
Chris@19 221
Chris@19 222 switch (ego->hc2ckind) {
Chris@19 223 case HC2C_VIA_RDFT:
Chris@19 224 cld = X(mkplan_d)(
Chris@19 225 plnr,
Chris@19 226 X(mkproblem_rdft_1_d)(
Chris@19 227 X(mktensor_1d)(m, d[0].is, (r/2)*d[0].os),
Chris@19 228 X(mktensor_3d)(
Chris@19 229 2, p->ci - p->cr, p->r1 - p->r0,
Chris@19 230 r / 2, m * d[0].is, d[0].os,
Chris@19 231 v, ivs, ovs),
Chris@19 232 p->cr, p->r0, HC2R)
Chris@19 233 );
Chris@19 234 if (!cld) goto nada;
Chris@19 235
Chris@19 236 pln = MKPLAN_RDFT2(P, &padt, apply_dif);
Chris@19 237 break;
Chris@19 238
Chris@19 239 case HC2C_VIA_DFT:
Chris@19 240 cld = X(mkplan_d)(
Chris@19 241 plnr,
Chris@19 242 X(mkproblem_dft_d)(
Chris@19 243 X(mktensor_1d)(m, d[0].is, (r/2)*d[0].os),
Chris@19 244 X(mktensor_2d)(
Chris@19 245 r / 2, m * d[0].is, d[0].os,
Chris@19 246 v, ivs, ovs),
Chris@19 247 p->ci, p->cr, p->r1, p->r0)
Chris@19 248 );
Chris@19 249 if (!cld) goto nada;
Chris@19 250
Chris@19 251 pln = MKPLAN_RDFT2(P, &padt, apply_dif_dft);
Chris@19 252 break;
Chris@19 253 }
Chris@19 254 break;
Chris@19 255
Chris@19 256 default:
Chris@19 257 A(0);
Chris@19 258 }
Chris@19 259
Chris@19 260 pln->cld = cld;
Chris@19 261 pln->cldw = cldw;
Chris@19 262 pln->r = r;
Chris@19 263 X(ops_add)(&cld->ops, &cldw->ops, &pln->super.super.ops);
Chris@19 264
Chris@19 265 /* inherit could_prune_now_p attribute from cldw */
Chris@19 266 pln->super.super.could_prune_now_p = cldw->could_prune_now_p;
Chris@19 267
Chris@19 268 return &(pln->super.super);
Chris@19 269
Chris@19 270 nada:
Chris@19 271 X(plan_destroy_internal)(cldw);
Chris@19 272 X(plan_destroy_internal)(cld);
Chris@19 273 return (plan *) 0;
Chris@19 274 }
Chris@19 275
Chris@19 276 hc2c_solver *X(mksolver_hc2c)(size_t size, INT r,
Chris@19 277 hc2c_kind hc2ckind,
Chris@19 278 hc2c_mkinferior mkcldw)
Chris@19 279 {
Chris@19 280 static const solver_adt sadt = { PROBLEM_RDFT2, mkplan, 0 };
Chris@19 281 hc2c_solver *slv = (hc2c_solver *)X(mksolver)(size, &sadt);
Chris@19 282 slv->r = r;
Chris@19 283 slv->hc2ckind = hc2ckind;
Chris@19 284 slv->mkcldw = mkcldw;
Chris@19 285 return slv;
Chris@19 286 }
Chris@19 287
Chris@19 288 plan *X(mkplan_hc2c)(size_t size, const plan_adt *adt, hc2capply apply)
Chris@19 289 {
Chris@19 290 plan_hc2c *ego;
Chris@19 291
Chris@19 292 ego = (plan_hc2c *) X(mkplan)(size, adt);
Chris@19 293 ego->apply = apply;
Chris@19 294
Chris@19 295 return &(ego->super);
Chris@19 296 }