annotate fft/fftw/fftw-3.3.4/libbench2/problem.c @ 40:223f770b5341 kissfft-double tip

Try a double-precision kissfft
author Chris Cannam
date Wed, 07 Sep 2016 10:40:32 +0100
parents 26056e866c29
children
rev   line source
Chris@19 1 /*
Chris@19 2 * Copyright (c) 2001 Matteo Frigo
Chris@19 3 * Copyright (c) 2001 Massachusetts Institute of Technology
Chris@19 4 *
Chris@19 5 * This program is free software; you can redistribute it and/or modify
Chris@19 6 * it under the terms of the GNU General Public License as published by
Chris@19 7 * the Free Software Foundation; either version 2 of the License, or
Chris@19 8 * (at your option) any later version.
Chris@19 9 *
Chris@19 10 * This program is distributed in the hope that it will be useful,
Chris@19 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Chris@19 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
Chris@19 13 * GNU General Public License for more details.
Chris@19 14 *
Chris@19 15 * You should have received a copy of the GNU General Public License
Chris@19 16 * along with this program; if not, write to the Free Software
Chris@19 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Chris@19 18 *
Chris@19 19 */
Chris@19 20
Chris@19 21
Chris@19 22 #include "config.h"
Chris@19 23 #include "bench.h"
Chris@19 24 #include <stdio.h>
Chris@19 25 #include <stdlib.h>
Chris@19 26 #include <string.h>
Chris@19 27 #include <ctype.h>
Chris@19 28
/*
 * When nonzero, the real side of a PROBLEM_REAL transform is padded
 * even for out-of-place problems.  By default (0) only the in-place
 * case is padded.
 */
int always_pad_real = 0;

/*
 * How the extent of a dimension is adjusted when strides are derived
 * from it (see transform_n):
 */
typedef enum {
     SAME,      /* n is used unchanged */
     PADDED,    /* n becomes 2*(n/2+1) */
     HALFISH    /* n becomes n/2+1 */
} n_transform;
Chris@19 34
Chris@19 35 /* funny transformations for last dimension of PROBLEM_REAL */
Chris@19 36 static int transform_n(int n, n_transform nt)
Chris@19 37 {
Chris@19 38 switch (nt) {
Chris@19 39 case SAME: return n;
Chris@19 40 case PADDED: return 2*(n/2+1);
Chris@19 41 case HALFISH: return (n/2+1);
Chris@19 42 default: BENCH_ASSERT(0); return 0;
Chris@19 43 }
Chris@19 44 }
Chris@19 45
Chris@19 46 /* do what I mean */
Chris@19 47 static bench_tensor *dwim(bench_tensor *t, bench_iodim **last_iodim,
Chris@19 48 n_transform nti, n_transform nto,
Chris@19 49 bench_iodim *dt)
Chris@19 50 {
Chris@19 51 int i;
Chris@19 52 bench_iodim *d, *d1;
Chris@19 53
Chris@19 54 if (!FINITE_RNK(t->rnk) || t->rnk < 1)
Chris@19 55 return t;
Chris@19 56
Chris@19 57 i = t->rnk;
Chris@19 58 d1 = *last_iodim;
Chris@19 59
Chris@19 60 while (--i >= 0) {
Chris@19 61 d = t->dims + i;
Chris@19 62 if (!d->is)
Chris@19 63 d->is = d1->is * transform_n(d1->n, d1==dt ? nti : SAME);
Chris@19 64 if (!d->os)
Chris@19 65 d->os = d1->os * transform_n(d1->n, d1==dt ? nto : SAME);
Chris@19 66 d1 = d;
Chris@19 67 }
Chris@19 68
Chris@19 69 *last_iodim = d1;
Chris@19 70 return t;
Chris@19 71 }
Chris@19 72
Chris@19 73 static void transpose_tensor(bench_tensor *t)
Chris@19 74 {
Chris@19 75 if (!FINITE_RNK(t->rnk) || t->rnk < 2)
Chris@19 76 return;
Chris@19 77
Chris@19 78 t->dims[0].os = t->dims[1].os;
Chris@19 79 t->dims[1].os = t->dims[0].os * t->dims[0].n;
Chris@19 80 }
Chris@19 81
/*
 * Parse a decimal integer at S and store it in *N.
 *
 * Accepted syntax: an optional '+' or '-', at least one decimal digit
 * (asserted with BENCH_ASSERT), then an optional 'k'/'K' suffix that
 * multiplies the value by 1024, then an optional 'm'/'M' suffix that
 * multiplies it by 1024*1024.  The two suffixes are tested one after
 * the other, so both may appear in that order.
 *
 * Returns a pointer to the first character that was not consumed.
 * No overflow checking is performed.
 */
static const char *parseint(const char *s, int *n)
{
     int sign = 1;

     *n = 0;

     if (*s == '-') {
          sign = -1;
          ++s;
     } else if (*s == '+') {
          ++s;
     }

     /* The <ctype.h> functions require an argument representable as
        unsigned char (or EOF); a plain char may be negative, so cast. */
     BENCH_ASSERT(isdigit((unsigned char)*s));
     while (isdigit((unsigned char)*s)) {
          *n = *n * 10 + (*s - '0');
          ++s;
     }

     *n *= sign;

     if (*s == 'k' || *s == 'K') {
          *n *= 1024;
          ++s;
     }

     if (*s == 'm' || *s == 'M') {
          *n *= 1024 * 1024;
          ++s;
     }

     return s;
}
Chris@19 116
Chris@19 117 struct dimlist { bench_iodim car; r2r_kind_t k; struct dimlist *cdr; };
Chris@19 118
Chris@19 119 static const char *parsetensor(const char *s, bench_tensor **tp,
Chris@19 120 r2r_kind_t **k)
Chris@19 121 {
Chris@19 122 struct dimlist *l = 0, *m;
Chris@19 123 bench_tensor *t;
Chris@19 124 int rnk = 0;
Chris@19 125
Chris@19 126 L1:
Chris@19 127 m = (struct dimlist *)bench_malloc(sizeof(struct dimlist));
Chris@19 128 /* nconc onto l */
Chris@19 129 m->cdr = l; l = m;
Chris@19 130 ++rnk;
Chris@19 131
Chris@19 132 s = parseint(s, &m->car.n);
Chris@19 133
Chris@19 134 if (*s == ':') {
Chris@19 135 /* read input stride */
Chris@19 136 ++s;
Chris@19 137 s = parseint(s, &m->car.is);
Chris@19 138 if (*s == ':') {
Chris@19 139 /* read output stride */
Chris@19 140 ++s;
Chris@19 141 s = parseint(s, &m->car.os);
Chris@19 142 } else {
Chris@19 143 /* default */
Chris@19 144 m->car.os = m->car.is;
Chris@19 145 }
Chris@19 146 } else {
Chris@19 147 m->car.is = 0;
Chris@19 148 m->car.os = 0;
Chris@19 149 }
Chris@19 150
Chris@19 151 if (*s == 'f' || *s == 'F') {
Chris@19 152 m->k = R2R_R2HC;
Chris@19 153 ++s;
Chris@19 154 }
Chris@19 155 else if (*s == 'b' || *s == 'B') {
Chris@19 156 m->k = R2R_HC2R;
Chris@19 157 ++s;
Chris@19 158 }
Chris@19 159 else if (*s == 'h' || *s == 'H') {
Chris@19 160 m->k = R2R_DHT;
Chris@19 161 ++s;
Chris@19 162 }
Chris@19 163 else if (*s == 'e' || *s == 'E' || *s == 'o' || *s == 'O') {
Chris@19 164 char c = *(s++);
Chris@19 165 int ab;
Chris@19 166
Chris@19 167 s = parseint(s, &ab);
Chris@19 168
Chris@19 169 if (c == 'e' || c == 'E') {
Chris@19 170 if (ab == 0)
Chris@19 171 m->k = R2R_REDFT00;
Chris@19 172 else if (ab == 1)
Chris@19 173 m->k = R2R_REDFT01;
Chris@19 174 else if (ab == 10)
Chris@19 175 m->k = R2R_REDFT10;
Chris@19 176 else if (ab == 11)
Chris@19 177 m->k = R2R_REDFT11;
Chris@19 178 else
Chris@19 179 BENCH_ASSERT(0);
Chris@19 180 }
Chris@19 181 else {
Chris@19 182 if (ab == 0)
Chris@19 183 m->k = R2R_RODFT00;
Chris@19 184 else if (ab == 1)
Chris@19 185 m->k = R2R_RODFT01;
Chris@19 186 else if (ab == 10)
Chris@19 187 m->k = R2R_RODFT10;
Chris@19 188 else if (ab == 11)
Chris@19 189 m->k = R2R_RODFT11;
Chris@19 190 else
Chris@19 191 BENCH_ASSERT(0);
Chris@19 192 }
Chris@19 193 }
Chris@19 194 else
Chris@19 195 m->k = R2R_R2HC;
Chris@19 196
Chris@19 197 if (*s == 'x' || *s == 'X') {
Chris@19 198 ++s;
Chris@19 199 goto L1;
Chris@19 200 }
Chris@19 201
Chris@19 202 /* now we have a dimlist. Build bench_tensor, etc. */
Chris@19 203
Chris@19 204 if (k && rnk > 0) {
Chris@19 205 int i;
Chris@19 206 *k = (r2r_kind_t *) bench_malloc(sizeof(r2r_kind_t) * rnk);
Chris@19 207 for (m = l, i = rnk - 1; i >= 0; --i, m = m->cdr) {
Chris@19 208 BENCH_ASSERT(m);
Chris@19 209 (*k)[i] = m->k;
Chris@19 210 }
Chris@19 211 }
Chris@19 212
Chris@19 213 t = mktensor(rnk);
Chris@19 214 while (--rnk >= 0) {
Chris@19 215 bench_iodim *d = t->dims + rnk;
Chris@19 216 BENCH_ASSERT(l);
Chris@19 217 m = l; l = m->cdr;
Chris@19 218 d->n = m->car.n;
Chris@19 219 d->is = m->car.is;
Chris@19 220 d->os = m->car.os;
Chris@19 221 bench_free(m);
Chris@19 222 }
Chris@19 223
Chris@19 224 *tp = t;
Chris@19 225 return s;
Chris@19 226 }
Chris@19 227
Chris@19 228 /* parse a problem description, return a problem */
Chris@19 229 bench_problem *problem_parse(const char *s)
Chris@19 230 {
Chris@19 231 bench_problem *p;
Chris@19 232 bench_iodim last_iodim0 = {1,1,1}, *last_iodim = &last_iodim0;
Chris@19 233 bench_iodim *sz_last_iodim;
Chris@19 234 bench_tensor *sz;
Chris@19 235 n_transform nti = SAME, nto = SAME;
Chris@19 236 int transpose = 0;
Chris@19 237
Chris@19 238 p = (bench_problem *) bench_malloc(sizeof(bench_problem));
Chris@19 239 p->kind = PROBLEM_COMPLEX;
Chris@19 240 p->k = 0;
Chris@19 241 p->sign = -1;
Chris@19 242 p->in = p->out = 0;
Chris@19 243 p->inphys = p->outphys = 0;
Chris@19 244 p->iphyssz = p->ophyssz = 0;
Chris@19 245 p->in_place = 0;
Chris@19 246 p->destroy_input = 0;
Chris@19 247 p->split = 0;
Chris@19 248 p->userinfo = 0;
Chris@19 249 p->scrambled_in = p->scrambled_out = 0;
Chris@19 250 p->sz = p->vecsz = 0;
Chris@19 251 p->ini = p->outi = 0;
Chris@19 252 p->pstring = (char *) bench_malloc(sizeof(char) * (strlen(s) + 1));
Chris@19 253 strcpy(p->pstring, s);
Chris@19 254
Chris@19 255 L1:
Chris@19 256 switch (tolower(*s)) {
Chris@19 257 case 'i': p->in_place = 1; ++s; goto L1;
Chris@19 258 case 'o': p->in_place = 0; ++s; goto L1;
Chris@19 259 case 'd': p->destroy_input = 1; ++s; goto L1;
Chris@19 260 case '/': p->split = 1; ++s; goto L1;
Chris@19 261 case 'f':
Chris@19 262 case '-': p->sign = -1; ++s; goto L1;
Chris@19 263 case 'b':
Chris@19 264 case '+': p->sign = 1; ++s; goto L1;
Chris@19 265 case 'r': p->kind = PROBLEM_REAL; ++s; goto L1;
Chris@19 266 case 'c': p->kind = PROBLEM_COMPLEX; ++s; goto L1;
Chris@19 267 case 'k': p->kind = PROBLEM_R2R; ++s; goto L1;
Chris@19 268 case 't': transpose = 1; ++s; goto L1;
Chris@19 269
Chris@19 270 /* hack for MPI: */
Chris@19 271 case '[': p->scrambled_in = 1; ++s; goto L1;
Chris@19 272 case ']': p->scrambled_out = 1; ++s; goto L1;
Chris@19 273
Chris@19 274 default : ;
Chris@19 275 }
Chris@19 276
Chris@19 277 s = parsetensor(s, &sz, p->kind == PROBLEM_R2R ? &p->k : 0);
Chris@19 278
Chris@19 279 if (p->kind == PROBLEM_REAL) {
Chris@19 280 if (p->sign < 0) {
Chris@19 281 nti = p->in_place || always_pad_real ? PADDED : SAME;
Chris@19 282 nto = HALFISH;
Chris@19 283 }
Chris@19 284 else {
Chris@19 285 nti = HALFISH;
Chris@19 286 nto = p->in_place || always_pad_real ? PADDED : SAME;
Chris@19 287 }
Chris@19 288 }
Chris@19 289
Chris@19 290 sz_last_iodim = sz->dims + sz->rnk - 1;
Chris@19 291 if (*s == '*') { /* "external" vector */
Chris@19 292 ++s;
Chris@19 293 p->sz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim);
Chris@19 294 s = parsetensor(s, &sz, 0);
Chris@19 295 p->vecsz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim);
Chris@19 296 } else if (*s == 'v' || *s == 'V') { /* "internal" vector */
Chris@19 297 bench_tensor *vecsz;
Chris@19 298 ++s;
Chris@19 299 s = parsetensor(s, &vecsz, 0);
Chris@19 300 p->vecsz = dwim(vecsz, &last_iodim, nti, nto, sz_last_iodim);
Chris@19 301 p->sz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim);
Chris@19 302 } else {
Chris@19 303 p->sz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim);
Chris@19 304 p->vecsz = mktensor(0);
Chris@19 305 }
Chris@19 306
Chris@19 307 if (transpose) {
Chris@19 308 transpose_tensor(p->sz);
Chris@19 309 transpose_tensor(p->vecsz);
Chris@19 310 }
Chris@19 311
Chris@19 312 if (!p->in_place)
Chris@19 313 p->out = ((bench_real *) p->in) + (1 << 20); /* whatever */
Chris@19 314
Chris@19 315 BENCH_ASSERT(p->sz && p->vecsz);
Chris@19 316 BENCH_ASSERT(!*s);
Chris@19 317 return p;
Chris@19 318 }
Chris@19 319
Chris@19 320 void problem_destroy(bench_problem *p)
Chris@19 321 {
Chris@19 322 BENCH_ASSERT(p);
Chris@19 323 problem_free(p);
Chris@19 324 bench_free0(p->k);
Chris@19 325 bench_free0(p->pstring);
Chris@19 326 bench_free(p);
Chris@19 327 }
Chris@19 328