annotate src/fftw-3.3.8/rdft/rank-geq2-rdft2.c @ 83:ae30d91d2ffe

Replace these with versions built using an older toolset (so as to avoid ABI incompatibilities when linking on Ubuntu 14.04 for packaging purposes)
author Chris Cannam
date Fri, 07 Feb 2020 11:51:13 +0000
parents d0c2a83c1364
children
rev   line source
Chris@82 1 /*
Chris@82 2 * Copyright (c) 2003, 2007-14 Matteo Frigo
Chris@82 3 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
Chris@82 4 *
Chris@82 5 * This program is free software; you can redistribute it and/or modify
Chris@82 6 * it under the terms of the GNU General Public License as published by
Chris@82 7 * the Free Software Foundation; either version 2 of the License, or
Chris@82 8 * (at your option) any later version.
Chris@82 9 *
Chris@82 10 * This program is distributed in the hope that it will be useful,
Chris@82 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Chris@82 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
Chris@82 13 * GNU General Public License for more details.
Chris@82 14 *
Chris@82 15 * You should have received a copy of the GNU General Public License
Chris@82 16 * along with this program; if not, write to the Free Software
Chris@82 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Chris@82 18 *
Chris@82 19 */
Chris@82 20
Chris@82 21
Chris@82 22 /* plans for RDFT2 of rank >= 2 (multidimensional) */
Chris@82 23
Chris@82 24 #include "rdft/rdft.h"
Chris@82 25 #include "dft/dft.h"
Chris@82 26
Chris@82 27 typedef struct {
Chris@82 28 solver super;
Chris@82 29 int spltrnk;
Chris@82 30 const int *buddies;
Chris@82 31 size_t nbuddies;
Chris@82 32 } S;
Chris@82 33
Chris@82 34 typedef struct {
Chris@82 35 plan_dft super;
Chris@82 36 plan *cldr, *cldc;
Chris@82 37 const S *solver;
Chris@82 38 } P;
Chris@82 39
Chris@82 40 static void apply_r2hc(const plan *ego_, R *r0, R *r1, R *cr, R *ci)
Chris@82 41 {
Chris@82 42 const P *ego = (const P *) ego_;
Chris@82 43
Chris@82 44 {
Chris@82 45 plan_rdft2 *cldr = (plan_rdft2 *) ego->cldr;
Chris@82 46 cldr->apply((plan *) cldr, r0, r1, cr, ci);
Chris@82 47 }
Chris@82 48
Chris@82 49 {
Chris@82 50 plan_dft *cldc = (plan_dft *) ego->cldc;
Chris@82 51 cldc->apply((plan *) cldc, cr, ci, cr, ci);
Chris@82 52 }
Chris@82 53 }
Chris@82 54
Chris@82 55 static void apply_hc2r(const plan *ego_, R *r0, R *r1, R *cr, R *ci)
Chris@82 56 {
Chris@82 57 const P *ego = (const P *) ego_;
Chris@82 58
Chris@82 59 {
Chris@82 60 plan_dft *cldc = (plan_dft *) ego->cldc;
Chris@82 61 cldc->apply((plan *) cldc, ci, cr, ci, cr);
Chris@82 62 }
Chris@82 63
Chris@82 64 {
Chris@82 65 plan_rdft2 *cldr = (plan_rdft2 *) ego->cldr;
Chris@82 66 cldr->apply((plan *) cldr, r0, r1, cr, ci);
Chris@82 67 }
Chris@82 68
Chris@82 69 }
Chris@82 70
Chris@82 71 static void awake(plan *ego_, enum wakefulness wakefulness)
Chris@82 72 {
Chris@82 73 P *ego = (P *) ego_;
Chris@82 74 X(plan_awake)(ego->cldr, wakefulness);
Chris@82 75 X(plan_awake)(ego->cldc, wakefulness);
Chris@82 76 }
Chris@82 77
Chris@82 78 static void destroy(plan *ego_)
Chris@82 79 {
Chris@82 80 P *ego = (P *) ego_;
Chris@82 81 X(plan_destroy_internal)(ego->cldr);
Chris@82 82 X(plan_destroy_internal)(ego->cldc);
Chris@82 83 }
Chris@82 84
Chris@82 85 static void print(const plan *ego_, printer *p)
Chris@82 86 {
Chris@82 87 const P *ego = (const P *) ego_;
Chris@82 88 const S *s = ego->solver;
Chris@82 89 p->print(p, "(rdft2-rank>=2/%d%(%p%)%(%p%))",
Chris@82 90 s->spltrnk, ego->cldr, ego->cldc);
Chris@82 91 }
Chris@82 92
Chris@82 93 static int picksplit(const S *ego, const tensor *sz, int *rp)
Chris@82 94 {
Chris@82 95 A(sz->rnk > 1); /* cannot split rnk <= 1 */
Chris@82 96 if (!X(pickdim)(ego->spltrnk, ego->buddies, ego->nbuddies, sz, 1, rp))
Chris@82 97 return 0;
Chris@82 98 *rp += 1; /* convert from dim. index to rank */
Chris@82 99 if (*rp >= sz->rnk) /* split must reduce rank */
Chris@82 100 return 0;
Chris@82 101 return 1;
Chris@82 102 }
Chris@82 103
Chris@82 104 static int applicable0(const solver *ego_, const problem *p_, int *rp,
Chris@82 105 const planner *plnr)
Chris@82 106 {
Chris@82 107 const problem_rdft2 *p = (const problem_rdft2 *) p_;
Chris@82 108 const S *ego = (const S *)ego_;
Chris@82 109 return (1
Chris@82 110 && FINITE_RNK(p->sz->rnk) && FINITE_RNK(p->vecsz->rnk)
Chris@82 111
Chris@82 112 /* FIXME: multidimensional R2HCII ? */
Chris@82 113 && (p->kind == R2HC || p->kind == HC2R)
Chris@82 114
Chris@82 115 && p->sz->rnk >= 2
Chris@82 116 && picksplit(ego, p->sz, rp)
Chris@82 117 && (0
Chris@82 118
Chris@82 119 /* can work out-of-place, but HC2R destroys input */
Chris@82 120 || (p->r0 != p->cr &&
Chris@82 121 (p->kind == R2HC || !NO_DESTROY_INPUTP(plnr)))
Chris@82 122
Chris@82 123 /* FIXME: what are sufficient conditions for inplace? */
Chris@82 124 || (p->r0 == p->cr))
Chris@82 125 );
Chris@82 126 }
Chris@82 127
Chris@82 128 /* TODO: revise this. */
Chris@82 129 static int applicable(const solver *ego_, const problem *p_,
Chris@82 130 const planner *plnr, int *rp)
Chris@82 131 {
Chris@82 132 const S *ego = (const S *)ego_;
Chris@82 133
Chris@82 134 if (!applicable0(ego_, p_, rp, plnr)) return 0;
Chris@82 135
Chris@82 136 if (NO_RANK_SPLITSP(plnr) && (ego->spltrnk != ego->buddies[0]))
Chris@82 137 return 0;
Chris@82 138
Chris@82 139 if (NO_UGLYP(plnr)) {
Chris@82 140 const problem_rdft2 *p = (const problem_rdft2 *) p_;
Chris@82 141
Chris@82 142 /* Heuristic: if the vector stride is greater than the transform
Chris@82 143 size, don't use (prefer to do the vector loop first with a
Chris@82 144 vrank-geq1 plan). */
Chris@82 145 if (p->vecsz->rnk > 0 &&
Chris@82 146 X(tensor_min_stride)(p->vecsz)
Chris@82 147 > X(rdft2_tensor_max_index)(p->sz, p->kind))
Chris@82 148 return 0;
Chris@82 149 }
Chris@82 150
Chris@82 151 return 1;
Chris@82 152 }
Chris@82 153
Chris@82 154 static plan *mkplan(const solver *ego_, const problem *p_, planner *plnr)
Chris@82 155 {
Chris@82 156 const S *ego = (const S *) ego_;
Chris@82 157 const problem_rdft2 *p;
Chris@82 158 P *pln;
Chris@82 159 plan *cldr = 0, *cldc = 0;
Chris@82 160 tensor *sz1, *sz2, *vecszi, *sz2i;
Chris@82 161 int spltrnk;
Chris@82 162 inplace_kind k;
Chris@82 163 problem *cldp;
Chris@82 164
Chris@82 165 static const plan_adt padt = {
Chris@82 166 X(rdft2_solve), awake, print, destroy
Chris@82 167 };
Chris@82 168
Chris@82 169 if (!applicable(ego_, p_, plnr, &spltrnk))
Chris@82 170 return (plan *) 0;
Chris@82 171
Chris@82 172 p = (const problem_rdft2 *) p_;
Chris@82 173 X(tensor_split)(p->sz, &sz1, spltrnk, &sz2);
Chris@82 174
Chris@82 175 k = p->kind == R2HC ? INPLACE_OS : INPLACE_IS;
Chris@82 176 vecszi = X(tensor_copy_inplace)(p->vecsz, k);
Chris@82 177 sz2i = X(tensor_copy_inplace)(sz2, k);
Chris@82 178
Chris@82 179 /* complex data is ~half of real */
Chris@82 180 sz2i->dims[sz2i->rnk - 1].n = sz2i->dims[sz2i->rnk - 1].n/2 + 1;
Chris@82 181
Chris@82 182 cldr = X(mkplan_d)(plnr,
Chris@82 183 X(mkproblem_rdft2_d)(X(tensor_copy)(sz2),
Chris@82 184 X(tensor_append)(p->vecsz, sz1),
Chris@82 185 p->r0, p->r1,
Chris@82 186 p->cr, p->ci, p->kind));
Chris@82 187 if (!cldr) goto nada;
Chris@82 188
Chris@82 189 if (p->kind == R2HC)
Chris@82 190 cldp = X(mkproblem_dft_d)(X(tensor_copy_inplace)(sz1, k),
Chris@82 191 X(tensor_append)(vecszi, sz2i),
Chris@82 192 p->cr, p->ci, p->cr, p->ci);
Chris@82 193 else /* HC2R must swap re/im parts to get IDFT */
Chris@82 194 cldp = X(mkproblem_dft_d)(X(tensor_copy_inplace)(sz1, k),
Chris@82 195 X(tensor_append)(vecszi, sz2i),
Chris@82 196 p->ci, p->cr, p->ci, p->cr);
Chris@82 197 cldc = X(mkplan_d)(plnr, cldp);
Chris@82 198 if (!cldc) goto nada;
Chris@82 199
Chris@82 200 pln = MKPLAN_RDFT2(P, &padt, p->kind == R2HC ? apply_r2hc : apply_hc2r);
Chris@82 201
Chris@82 202 pln->cldr = cldr;
Chris@82 203 pln->cldc = cldc;
Chris@82 204
Chris@82 205 pln->solver = ego;
Chris@82 206 X(ops_add)(&cldr->ops, &cldc->ops, &pln->super.super.ops);
Chris@82 207
Chris@82 208 X(tensor_destroy4)(sz2i, vecszi, sz2, sz1);
Chris@82 209
Chris@82 210 return &(pln->super.super);
Chris@82 211
Chris@82 212 nada:
Chris@82 213 X(plan_destroy_internal)(cldr);
Chris@82 214 X(plan_destroy_internal)(cldc);
Chris@82 215 X(tensor_destroy4)(sz2i, vecszi, sz2, sz1);
Chris@82 216 return (plan *) 0;
Chris@82 217 }
Chris@82 218
Chris@82 219 static solver *mksolver(int spltrnk, const int *buddies, size_t nbuddies)
Chris@82 220 {
Chris@82 221 static const solver_adt sadt = { PROBLEM_RDFT2, mkplan, 0 };
Chris@82 222 S *slv = MKSOLVER(S, &sadt);
Chris@82 223 slv->spltrnk = spltrnk;
Chris@82 224 slv->buddies = buddies;
Chris@82 225 slv->nbuddies = nbuddies;
Chris@82 226 return &(slv->super);
Chris@82 227 }
Chris@82 228
Chris@82 229 void X(rdft2_rank_geq2_register)(planner *p)
Chris@82 230 {
Chris@82 231 static const int buddies[] = { 1, 0, -2 };
Chris@82 232 size_t i;
Chris@82 233
Chris@82 234 for (i = 0; i < NELEM(buddies); ++i)
Chris@82 235 REGISTER_SOLVER(p, mksolver(buddies[i], buddies, NELEM(buddies)));
Chris@82 236
Chris@82 237 /* FIXME: Should we try more buddies? See also dft/rank-geq2. */
Chris@82 238 }