annotate src/fftw-3.3.8/rdft/direct2.c @ 83:ae30d91d2ffe

Replace these with versions built using an older toolset (so as to avoid ABI compatibilities when linking on Ubuntu 14.04 for packaging purposes)
author Chris Cannam
date Fri, 07 Feb 2020 11:51:13 +0000
parents d0c2a83c1364
children
rev   line source
Chris@82 1 /*
Chris@82 2 * Copyright (c) 2003, 2007-14 Matteo Frigo
Chris@82 3 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
Chris@82 4 *
Chris@82 5 * This program is free software; you can redistribute it and/or modify
Chris@82 6 * it under the terms of the GNU General Public License as published by
Chris@82 7 * the Free Software Foundation; either version 2 of the License, or
Chris@82 8 * (at your option) any later version.
Chris@82 9 *
Chris@82 10 * This program is distributed in the hope that it will be useful,
Chris@82 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Chris@82 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
Chris@82 13 * GNU General Public License for more details.
Chris@82 14 *
Chris@82 15 * You should have received a copy of the GNU General Public License
Chris@82 16 * along with this program; if not, write to the Free Software
Chris@82 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Chris@82 18 *
Chris@82 19 */
Chris@82 20
Chris@82 21
Chris@82 22 /* direct RDFT2 R2HC/HC2R solver, if we have a codelet */
Chris@82 23
Chris@82 24 #include "rdft/rdft.h"
Chris@82 25
Chris@82 26 typedef struct {
Chris@82 27 solver super;
Chris@82 28 const kr2c_desc *desc;
Chris@82 29 kr2c k;
Chris@82 30 } S;
Chris@82 31
Chris@82 32 typedef struct {
Chris@82 33 plan_rdft2 super;
Chris@82 34
Chris@82 35 stride rs, cs;
Chris@82 36 INT vl;
Chris@82 37 INT ivs, ovs;
Chris@82 38 kr2c k;
Chris@82 39 const S *slv;
Chris@82 40 INT ilast;
Chris@82 41 } P;
Chris@82 42
Chris@82 43 static void apply(const plan *ego_, R *r0, R *r1, R *cr, R *ci)
Chris@82 44 {
Chris@82 45 const P *ego = (const P *) ego_;
Chris@82 46 ASSERT_ALIGNED_DOUBLE;
Chris@82 47 ego->k(r0, r1, cr, ci,
Chris@82 48 ego->rs, ego->cs, ego->cs,
Chris@82 49 ego->vl, ego->ivs, ego->ovs);
Chris@82 50 }
Chris@82 51
Chris@82 52 static void apply_r2hc(const plan *ego_, R *r0, R *r1, R *cr, R *ci)
Chris@82 53 {
Chris@82 54 const P *ego = (const P *) ego_;
Chris@82 55 INT i, vl = ego->vl, ovs = ego->ovs;
Chris@82 56 ASSERT_ALIGNED_DOUBLE;
Chris@82 57 ego->k(r0, r1, cr, ci,
Chris@82 58 ego->rs, ego->cs, ego->cs,
Chris@82 59 vl, ego->ivs, ovs);
Chris@82 60 for (i = 0; i < vl; ++i, ci += ovs)
Chris@82 61 ci[0] = ci[ego->ilast] = 0;
Chris@82 62 }
Chris@82 63
Chris@82 64 static void destroy(plan *ego_)
Chris@82 65 {
Chris@82 66 P *ego = (P *) ego_;
Chris@82 67 X(stride_destroy)(ego->rs);
Chris@82 68 X(stride_destroy)(ego->cs);
Chris@82 69 }
Chris@82 70
Chris@82 71 static void print(const plan *ego_, printer *p)
Chris@82 72 {
Chris@82 73 const P *ego = (const P *) ego_;
Chris@82 74 const S *s = ego->slv;
Chris@82 75
Chris@82 76 p->print(p, "(rdft2-%s-direct-%D%v \"%s\")",
Chris@82 77 X(rdft_kind_str)(s->desc->genus->kind), s->desc->n,
Chris@82 78 ego->vl, s->desc->nam);
Chris@82 79 }
Chris@82 80
Chris@82 81 static int applicable(const solver *ego_, const problem *p_)
Chris@82 82 {
Chris@82 83 const S *ego = (const S *) ego_;
Chris@82 84 const kr2c_desc *desc = ego->desc;
Chris@82 85 const problem_rdft2 *p = (const problem_rdft2 *) p_;
Chris@82 86 INT vl;
Chris@82 87 INT ivs, ovs;
Chris@82 88
Chris@82 89 return (
Chris@82 90 1
Chris@82 91 && p->sz->rnk == 1
Chris@82 92 && p->vecsz->rnk <= 1
Chris@82 93 && p->sz->dims[0].n == desc->n
Chris@82 94 && p->kind == desc->genus->kind
Chris@82 95
Chris@82 96 /* check strides etc */
Chris@82 97 && X(tensor_tornk1)(p->vecsz, &vl, &ivs, &ovs)
Chris@82 98
Chris@82 99 && (0
Chris@82 100 /* can operate out-of-place */
Chris@82 101 || p->r0 != p->cr
Chris@82 102
Chris@82 103 /*
Chris@82 104 * can compute one transform in-place, no matter
Chris@82 105 * what the strides are.
Chris@82 106 */
Chris@82 107 || p->vecsz->rnk == 0
Chris@82 108
Chris@82 109 /* can operate in-place as long as strides are the same */
Chris@82 110 || X(rdft2_inplace_strides)(p, RNK_MINFTY)
Chris@82 111 )
Chris@82 112 );
Chris@82 113 }
Chris@82 114
Chris@82 115 static plan *mkplan(const solver *ego_, const problem *p_, planner *plnr)
Chris@82 116 {
Chris@82 117 const S *ego = (const S *) ego_;
Chris@82 118 P *pln;
Chris@82 119 const problem_rdft2 *p;
Chris@82 120 iodim *d;
Chris@82 121 int r2hc_kindp;
Chris@82 122
Chris@82 123 static const plan_adt padt = {
Chris@82 124 X(rdft2_solve), X(null_awake), print, destroy
Chris@82 125 };
Chris@82 126
Chris@82 127 UNUSED(plnr);
Chris@82 128
Chris@82 129 if (!applicable(ego_, p_))
Chris@82 130 return (plan *)0;
Chris@82 131
Chris@82 132 p = (const problem_rdft2 *) p_;
Chris@82 133
Chris@82 134 r2hc_kindp = R2HC_KINDP(p->kind);
Chris@82 135 A(r2hc_kindp || HC2R_KINDP(p->kind));
Chris@82 136
Chris@82 137 pln = MKPLAN_RDFT2(P, &padt, p->kind == R2HC ? apply_r2hc : apply);
Chris@82 138
Chris@82 139 d = p->sz->dims;
Chris@82 140
Chris@82 141 pln->k = ego->k;
Chris@82 142
Chris@82 143 pln->rs = X(mkstride)(d->n, r2hc_kindp ? d->is : d->os);
Chris@82 144 pln->cs = X(mkstride)(d->n, r2hc_kindp ? d->os : d->is);
Chris@82 145
Chris@82 146 X(tensor_tornk1)(p->vecsz, &pln->vl, &pln->ivs, &pln->ovs);
Chris@82 147
Chris@82 148 /* Nyquist freq., if any */
Chris@82 149 pln->ilast = (d->n % 2) ? 0 : (d->n/2) * d->os;
Chris@82 150
Chris@82 151 pln->slv = ego;
Chris@82 152 X(ops_zero)(&pln->super.super.ops);
Chris@82 153 X(ops_madd2)(pln->vl / ego->desc->genus->vl,
Chris@82 154 &ego->desc->ops,
Chris@82 155 &pln->super.super.ops);
Chris@82 156 if (p->kind == R2HC)
Chris@82 157 pln->super.super.ops.other += 2 * pln->vl; /* + 2 stores */
Chris@82 158
Chris@82 159 pln->super.super.could_prune_now_p = 1;
Chris@82 160 return &(pln->super.super);
Chris@82 161 }
Chris@82 162
Chris@82 163 /* constructor */
Chris@82 164 solver *X(mksolver_rdft2_direct)(kr2c k, const kr2c_desc *desc)
Chris@82 165 {
Chris@82 166 static const solver_adt sadt = { PROBLEM_RDFT2, mkplan, 0 };
Chris@82 167 S *slv = MKSOLVER(S, &sadt);
Chris@82 168 slv->k = k;
Chris@82 169 slv->desc = desc;
Chris@82 170 return &(slv->super);
Chris@82 171 }