annotate src/fftw-3.3.8/rdft/rank-geq2.c @ 83:ae30d91d2ffe

Replace these with versions built using an older toolset (so as to avoid ABI compatibilities when linking on Ubuntu 14.04 for packaging purposes)
author Chris Cannam
date Fri, 07 Feb 2020 11:51:13 +0000
parents d0c2a83c1364
children
rev   line source
Chris@82 1 /*
Chris@82 2 * Copyright (c) 2003, 2007-14 Matteo Frigo
Chris@82 3 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
Chris@82 4 *
Chris@82 5 * This program is free software; you can redistribute it and/or modify
Chris@82 6 * it under the terms of the GNU General Public License as published by
Chris@82 7 * the Free Software Foundation; either version 2 of the License, or
Chris@82 8 * (at your option) any later version.
Chris@82 9 *
Chris@82 10 * This program is distributed in the hope that it will be useful,
Chris@82 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Chris@82 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
Chris@82 13 * GNU General Public License for more details.
Chris@82 14 *
Chris@82 15 * You should have received a copy of the GNU General Public License
Chris@82 16 * along with this program; if not, write to the Free Software
Chris@82 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Chris@82 18 *
Chris@82 19 */
Chris@82 20
Chris@82 21
Chris@82 22 /* plans for RDFT of rank >= 2 (multidimensional) */
Chris@82 23
Chris@82 24 /* FIXME: this solver cannot strictly be applied to multidimensional
Chris@82 25 DHTs, since the latter are not separable...up to rnk-1 additional
Chris@82 26 post-processing passes may be required. See also:
Chris@82 27
Chris@82 28 R. N. Bracewell, O. Buneman, H. Hao, and J. Villasenor, "Fast
Chris@82 29 two-dimensional Hartley transform," Proc. IEEE 74, 1282-1283 (1986).
Chris@82 30
Chris@82 31 H. Hao and R. N. Bracewell, "A three-dimensional DFT algorithm
Chris@82 32 using the fast Hartley transform," Proc. IEEE 75(2), 264-266 (1987).
Chris@82 33 */
Chris@82 34
Chris@82 35 #include "rdft/rdft.h"
Chris@82 36
Chris@82 37 typedef struct {
Chris@82 38 solver super;
Chris@82 39 int spltrnk;
Chris@82 40 const int *buddies;
Chris@82 41 size_t nbuddies;
Chris@82 42 } S;
Chris@82 43
Chris@82 44 typedef struct {
Chris@82 45 plan_rdft super;
Chris@82 46
Chris@82 47 plan *cld1, *cld2;
Chris@82 48 const S *solver;
Chris@82 49 } P;
Chris@82 50
Chris@82 51 /* Compute multi-dimensional RDFT by applying the two cld plans
Chris@82 52 (lower-rnk RDFTs). */
Chris@82 53 static void apply(const plan *ego_, R *I, R *O)
Chris@82 54 {
Chris@82 55 const P *ego = (const P *) ego_;
Chris@82 56 plan_rdft *cld1, *cld2;
Chris@82 57
Chris@82 58 cld1 = (plan_rdft *) ego->cld1;
Chris@82 59 cld1->apply(ego->cld1, I, O);
Chris@82 60
Chris@82 61 cld2 = (plan_rdft *) ego->cld2;
Chris@82 62 cld2->apply(ego->cld2, O, O);
Chris@82 63 }
Chris@82 64
Chris@82 65
Chris@82 66 static void awake(plan *ego_, enum wakefulness wakefulness)
Chris@82 67 {
Chris@82 68 P *ego = (P *) ego_;
Chris@82 69 X(plan_awake)(ego->cld1, wakefulness);
Chris@82 70 X(plan_awake)(ego->cld2, wakefulness);
Chris@82 71 }
Chris@82 72
Chris@82 73 static void destroy(plan *ego_)
Chris@82 74 {
Chris@82 75 P *ego = (P *) ego_;
Chris@82 76 X(plan_destroy_internal)(ego->cld2);
Chris@82 77 X(plan_destroy_internal)(ego->cld1);
Chris@82 78 }
Chris@82 79
Chris@82 80 static void print(const plan *ego_, printer *p)
Chris@82 81 {
Chris@82 82 const P *ego = (const P *) ego_;
Chris@82 83 const S *s = ego->solver;
Chris@82 84 p->print(p, "(rdft-rank>=2/%d%(%p%)%(%p%))",
Chris@82 85 s->spltrnk, ego->cld1, ego->cld2);
Chris@82 86 }
Chris@82 87
Chris@82 88 static int picksplit(const S *ego, const tensor *sz, int *rp)
Chris@82 89 {
Chris@82 90 A(sz->rnk > 1); /* cannot split rnk <= 1 */
Chris@82 91 if (!X(pickdim)(ego->spltrnk, ego->buddies, ego->nbuddies, sz, 1, rp))
Chris@82 92 return 0;
Chris@82 93 *rp += 1; /* convert from dim. index to rank */
Chris@82 94 if (*rp >= sz->rnk) /* split must reduce rank */
Chris@82 95 return 0;
Chris@82 96 return 1;
Chris@82 97 }
Chris@82 98
Chris@82 99 static int applicable0(const solver *ego_, const problem *p_, int *rp)
Chris@82 100 {
Chris@82 101 const problem_rdft *p = (const problem_rdft *) p_;
Chris@82 102 const S *ego = (const S *)ego_;
Chris@82 103 return (1
Chris@82 104 && FINITE_RNK(p->sz->rnk) && FINITE_RNK(p->vecsz->rnk)
Chris@82 105 && p->sz->rnk >= 2
Chris@82 106 && picksplit(ego, p->sz, rp)
Chris@82 107 );
Chris@82 108 }
Chris@82 109
Chris@82 110 /* TODO: revise this. */
Chris@82 111 static int applicable(const solver *ego_, const problem *p_,
Chris@82 112 const planner *plnr, int *rp)
Chris@82 113 {
Chris@82 114 const S *ego = (const S *)ego_;
Chris@82 115
Chris@82 116 if (!applicable0(ego_, p_, rp)) return 0;
Chris@82 117
Chris@82 118 if (NO_RANK_SPLITSP(plnr) && (ego->spltrnk != ego->buddies[0]))
Chris@82 119 return 0;
Chris@82 120
Chris@82 121 if (NO_UGLYP(plnr)) {
Chris@82 122 /* Heuristic: if the vector stride is greater than the transform
Chris@82 123 sz, don't use (prefer to do the vector loop first with a
Chris@82 124 vrank-geq1 plan). */
Chris@82 125 const problem_rdft *p = (const problem_rdft *) p_;
Chris@82 126
Chris@82 127 if (p->vecsz->rnk > 0 &&
Chris@82 128 X(tensor_min_stride)(p->vecsz) > X(tensor_max_index)(p->sz))
Chris@82 129 return 0;
Chris@82 130 }
Chris@82 131
Chris@82 132 return 1;
Chris@82 133 }
Chris@82 134
Chris@82 135 static plan *mkplan(const solver *ego_, const problem *p_, planner *plnr)
Chris@82 136 {
Chris@82 137 const S *ego = (const S *) ego_;
Chris@82 138 const problem_rdft *p;
Chris@82 139 P *pln;
Chris@82 140 plan *cld1 = 0, *cld2 = 0;
Chris@82 141 tensor *sz1, *sz2, *vecszi, *sz2i;
Chris@82 142 int spltrnk;
Chris@82 143
Chris@82 144 static const plan_adt padt = {
Chris@82 145 X(rdft_solve), awake, print, destroy
Chris@82 146 };
Chris@82 147
Chris@82 148 if (!applicable(ego_, p_, plnr, &spltrnk))
Chris@82 149 return (plan *) 0;
Chris@82 150
Chris@82 151 p = (const problem_rdft *) p_;
Chris@82 152 X(tensor_split)(p->sz, &sz1, spltrnk, &sz2);
Chris@82 153 vecszi = X(tensor_copy_inplace)(p->vecsz, INPLACE_OS);
Chris@82 154 sz2i = X(tensor_copy_inplace)(sz2, INPLACE_OS);
Chris@82 155
Chris@82 156 cld1 = X(mkplan_d)(plnr,
Chris@82 157 X(mkproblem_rdft_d)(X(tensor_copy)(sz2),
Chris@82 158 X(tensor_append)(p->vecsz, sz1),
Chris@82 159 p->I, p->O, p->kind + spltrnk));
Chris@82 160 if (!cld1) goto nada;
Chris@82 161
Chris@82 162 cld2 = X(mkplan_d)(plnr,
Chris@82 163 X(mkproblem_rdft_d)(
Chris@82 164 X(tensor_copy_inplace)(sz1, INPLACE_OS),
Chris@82 165 X(tensor_append)(vecszi, sz2i),
Chris@82 166 p->O, p->O, p->kind));
Chris@82 167 if (!cld2) goto nada;
Chris@82 168
Chris@82 169 pln = MKPLAN_RDFT(P, &padt, apply);
Chris@82 170
Chris@82 171 pln->cld1 = cld1;
Chris@82 172 pln->cld2 = cld2;
Chris@82 173
Chris@82 174 pln->solver = ego;
Chris@82 175 X(ops_add)(&cld1->ops, &cld2->ops, &pln->super.super.ops);
Chris@82 176
Chris@82 177 X(tensor_destroy4)(sz2, sz1, vecszi, sz2i);
Chris@82 178
Chris@82 179 return &(pln->super.super);
Chris@82 180
Chris@82 181 nada:
Chris@82 182 X(plan_destroy_internal)(cld2);
Chris@82 183 X(plan_destroy_internal)(cld1);
Chris@82 184 X(tensor_destroy4)(sz2, sz1, vecszi, sz2i);
Chris@82 185 return (plan *) 0;
Chris@82 186 }
Chris@82 187
Chris@82 188 static solver *mksolver(int spltrnk, const int *buddies, size_t nbuddies)
Chris@82 189 {
Chris@82 190 static const solver_adt sadt = { PROBLEM_RDFT, mkplan, 0 };
Chris@82 191 S *slv = MKSOLVER(S, &sadt);
Chris@82 192 slv->spltrnk = spltrnk;
Chris@82 193 slv->buddies = buddies;
Chris@82 194 slv->nbuddies = nbuddies;
Chris@82 195 return &(slv->super);
Chris@82 196 }
Chris@82 197
Chris@82 198 void X(rdft_rank_geq2_register)(planner *p)
Chris@82 199 {
Chris@82 200 static const int buddies[] = { 1, 0, -2 };
Chris@82 201 size_t i;
Chris@82 202
Chris@82 203 for (i = 0; i < NELEM(buddies); ++i)
Chris@82 204 REGISTER_SOLVER(p, mksolver(buddies[i], buddies, NELEM(buddies)));
Chris@82 205
Chris@82 206 /* FIXME: Should we try more buddies? See also dft/rank-geq2. */
Chris@82 207 }