annotate src/fftw-3.3.8/kernel/twiddle.c @ 82:d0c2a83c1364

Add FFTW 3.3.8 source, and a Linux build
author Chris Cannam
date Tue, 19 Nov 2019 14:52:55 +0000
parents
children
rev   line source
Chris@82 1 /*
Chris@82 2 * Copyright (c) 2003, 2007-14 Matteo Frigo
Chris@82 3 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
Chris@82 4 *
Chris@82 5 * This program is free software; you can redistribute it and/or modify
Chris@82 6 * it under the terms of the GNU General Public License as published by
Chris@82 7 * the Free Software Foundation; either version 2 of the License, or
Chris@82 8 * (at your option) any later version.
Chris@82 9 *
Chris@82 10 * This program is distributed in the hope that it will be useful,
Chris@82 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Chris@82 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
Chris@82 13 * GNU General Public License for more details.
Chris@82 14 *
Chris@82 15 * You should have received a copy of the GNU General Public License
Chris@82 16 * along with this program; if not, write to the Free Software
Chris@82 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Chris@82 18 *
Chris@82 19 */
Chris@82 20
Chris@82 21
Chris@82 22 /* Twiddle manipulation */
Chris@82 23
Chris@82 24 #include "kernel/ifftw.h"
Chris@82 25 #include <math.h>
Chris@82 26
Chris@82 27 #define HASHSZ 109
Chris@82 28
Chris@82 29 /* hash table of known twiddle factors */
Chris@82 30 static twid *twlist[HASHSZ];
Chris@82 31
Chris@82 32 static INT hash(INT n, INT r)
Chris@82 33 {
Chris@82 34 INT h = n * 17 + r;
Chris@82 35
Chris@82 36 if (h < 0) h = -h;
Chris@82 37
Chris@82 38 return (h % HASHSZ);
Chris@82 39 }
Chris@82 40
Chris@82 41 static int equal_instr(const tw_instr *p, const tw_instr *q)
Chris@82 42 {
Chris@82 43 if (p == q)
Chris@82 44 return 1;
Chris@82 45
Chris@82 46 for (;; ++p, ++q) {
Chris@82 47 if (p->op != q->op)
Chris@82 48 return 0;
Chris@82 49
Chris@82 50 switch (p->op) {
Chris@82 51 case TW_NEXT:
Chris@82 52 return (p->v == q->v); /* p->i is ignored */
Chris@82 53
Chris@82 54 case TW_FULL:
Chris@82 55 case TW_HALF:
Chris@82 56 if (p->v != q->v) return 0; /* p->i is ignored */
Chris@82 57 break;
Chris@82 58
Chris@82 59 default:
Chris@82 60 if (p->v != q->v || p->i != q->i) return 0;
Chris@82 61 break;
Chris@82 62 }
Chris@82 63 }
Chris@82 64 A(0 /* can't happen */);
Chris@82 65 }
Chris@82 66
Chris@82 67 static int ok_twid(const twid *t,
Chris@82 68 enum wakefulness wakefulness,
Chris@82 69 const tw_instr *q, INT n, INT r, INT m)
Chris@82 70 {
Chris@82 71 return (wakefulness == t->wakefulness &&
Chris@82 72 n == t->n &&
Chris@82 73 r == t->r &&
Chris@82 74 m <= t->m &&
Chris@82 75 equal_instr(t->instr, q));
Chris@82 76 }
Chris@82 77
Chris@82 78 static twid *lookup(enum wakefulness wakefulness,
Chris@82 79 const tw_instr *q, INT n, INT r, INT m)
Chris@82 80 {
Chris@82 81 twid *p;
Chris@82 82
Chris@82 83 for (p = twlist[hash(n,r)];
Chris@82 84 p && !ok_twid(p, wakefulness, q, n, r, m);
Chris@82 85 p = p->cdr)
Chris@82 86 ;
Chris@82 87 return p;
Chris@82 88 }
Chris@82 89
Chris@82 90 static INT twlen0(INT r, const tw_instr *p, INT *vl)
Chris@82 91 {
Chris@82 92 INT ntwiddle = 0;
Chris@82 93
Chris@82 94 /* compute length of bytecode program */
Chris@82 95 A(r > 0);
Chris@82 96 for ( ; p->op != TW_NEXT; ++p) {
Chris@82 97 switch (p->op) {
Chris@82 98 case TW_FULL:
Chris@82 99 ntwiddle += (r - 1) * 2;
Chris@82 100 break;
Chris@82 101 case TW_HALF:
Chris@82 102 ntwiddle += (r - 1);
Chris@82 103 break;
Chris@82 104 case TW_CEXP:
Chris@82 105 ntwiddle += 2;
Chris@82 106 break;
Chris@82 107 case TW_COS:
Chris@82 108 case TW_SIN:
Chris@82 109 ntwiddle += 1;
Chris@82 110 break;
Chris@82 111 }
Chris@82 112 }
Chris@82 113
Chris@82 114 *vl = (INT)p->v;
Chris@82 115 return ntwiddle;
Chris@82 116 }
Chris@82 117
Chris@82 118 INT X(twiddle_length)(INT r, const tw_instr *p)
Chris@82 119 {
Chris@82 120 INT vl;
Chris@82 121 return twlen0(r, p, &vl);
Chris@82 122 }
Chris@82 123
Chris@82 124 static R *compute(enum wakefulness wakefulness,
Chris@82 125 const tw_instr *instr, INT n, INT r, INT m)
Chris@82 126 {
Chris@82 127 INT ntwiddle, j, vl;
Chris@82 128 R *W, *W0;
Chris@82 129 const tw_instr *p;
Chris@82 130 triggen *t = X(mktriggen)(wakefulness, n);
Chris@82 131
Chris@82 132 p = instr;
Chris@82 133 ntwiddle = twlen0(r, p, &vl);
Chris@82 134
Chris@82 135 A(m % vl == 0);
Chris@82 136
Chris@82 137 W0 = W = (R *)MALLOC((ntwiddle * (m / vl)) * sizeof(R), TWIDDLES);
Chris@82 138
Chris@82 139 for (j = 0; j < m; j += vl) {
Chris@82 140 for (p = instr; p->op != TW_NEXT; ++p) {
Chris@82 141 switch (p->op) {
Chris@82 142 case TW_FULL: {
Chris@82 143 INT i;
Chris@82 144 for (i = 1; i < r; ++i) {
Chris@82 145 A((j + (INT)p->v) * i < n);
Chris@82 146 A((j + (INT)p->v) * i > -n);
Chris@82 147 t->cexp(t, (j + (INT)p->v) * i, W);
Chris@82 148 W += 2;
Chris@82 149 }
Chris@82 150 break;
Chris@82 151 }
Chris@82 152
Chris@82 153 case TW_HALF: {
Chris@82 154 INT i;
Chris@82 155 A((r % 2) == 1);
Chris@82 156 for (i = 1; i + i < r; ++i) {
Chris@82 157 t->cexp(t, MULMOD(i, (j + (INT)p->v), n), W);
Chris@82 158 W += 2;
Chris@82 159 }
Chris@82 160 break;
Chris@82 161 }
Chris@82 162
Chris@82 163 case TW_COS: {
Chris@82 164 R d[2];
Chris@82 165
Chris@82 166 A((j + (INT)p->v) * p->i < n);
Chris@82 167 A((j + (INT)p->v) * p->i > -n);
Chris@82 168 t->cexp(t, (j + (INT)p->v) * (INT)p->i, d);
Chris@82 169 *W++ = d[0];
Chris@82 170 break;
Chris@82 171 }
Chris@82 172
Chris@82 173 case TW_SIN: {
Chris@82 174 R d[2];
Chris@82 175
Chris@82 176 A((j + (INT)p->v) * p->i < n);
Chris@82 177 A((j + (INT)p->v) * p->i > -n);
Chris@82 178 t->cexp(t, (j + (INT)p->v) * (INT)p->i, d);
Chris@82 179 *W++ = d[1];
Chris@82 180 break;
Chris@82 181 }
Chris@82 182
Chris@82 183 case TW_CEXP:
Chris@82 184 A((j + (INT)p->v) * p->i < n);
Chris@82 185 A((j + (INT)p->v) * p->i > -n);
Chris@82 186 t->cexp(t, (j + (INT)p->v) * (INT)p->i, W);
Chris@82 187 W += 2;
Chris@82 188 break;
Chris@82 189 }
Chris@82 190 }
Chris@82 191 }
Chris@82 192
Chris@82 193 X(triggen_destroy)(t);
Chris@82 194 return W0;
Chris@82 195 }
Chris@82 196
Chris@82 197 static void mktwiddle(enum wakefulness wakefulness,
Chris@82 198 twid **pp, const tw_instr *instr, INT n, INT r, INT m)
Chris@82 199 {
Chris@82 200 twid *p;
Chris@82 201 INT h;
Chris@82 202
Chris@82 203 if ((p = lookup(wakefulness, instr, n, r, m))) {
Chris@82 204 ++p->refcnt;
Chris@82 205 } else {
Chris@82 206 p = (twid *) MALLOC(sizeof(twid), TWIDDLES);
Chris@82 207 p->n = n;
Chris@82 208 p->r = r;
Chris@82 209 p->m = m;
Chris@82 210 p->instr = instr;
Chris@82 211 p->refcnt = 1;
Chris@82 212 p->wakefulness = wakefulness;
Chris@82 213 p->W = compute(wakefulness, instr, n, r, m);
Chris@82 214
Chris@82 215 /* cons! onto twlist */
Chris@82 216 h = hash(n, r);
Chris@82 217 p->cdr = twlist[h];
Chris@82 218 twlist[h] = p;
Chris@82 219 }
Chris@82 220
Chris@82 221 *pp = p;
Chris@82 222 }
Chris@82 223
Chris@82 224 static void twiddle_destroy(twid **pp)
Chris@82 225 {
Chris@82 226 twid *p = *pp;
Chris@82 227 twid **q;
Chris@82 228
Chris@82 229 if ((--p->refcnt) == 0) {
Chris@82 230 /* remove p from twiddle list */
Chris@82 231 for (q = &twlist[hash(p->n, p->r)]; *q; q = &((*q)->cdr)) {
Chris@82 232 if (*q == p) {
Chris@82 233 *q = p->cdr;
Chris@82 234 X(ifree)(p->W);
Chris@82 235 X(ifree)(p);
Chris@82 236 *pp = 0;
Chris@82 237 return;
Chris@82 238 }
Chris@82 239 }
Chris@82 240 A(0 /* can't happen */ );
Chris@82 241 }
Chris@82 242 }
Chris@82 243
Chris@82 244
Chris@82 245 void X(twiddle_awake)(enum wakefulness wakefulness, twid **pp,
Chris@82 246 const tw_instr *instr, INT n, INT r, INT m)
Chris@82 247 {
Chris@82 248 switch (wakefulness) {
Chris@82 249 case SLEEPY:
Chris@82 250 twiddle_destroy(pp);
Chris@82 251 break;
Chris@82 252 default:
Chris@82 253 mktwiddle(wakefulness, pp, instr, n, r, m);
Chris@82 254 break;
Chris@82 255 }
Chris@82 256 }