annotate src/fftw-3.3.5/libbench2/problem.c @ 169:223a55898ab9 tip default

Add null config files
author Chris Cannam <cannam@all-day-breakfast.com>
date Mon, 02 Mar 2020 14:03:47 +0000
parents 7867fa7e1b6b
children
rev   line source
cannam@127 1 /*
cannam@127 2 * Copyright (c) 2001 Matteo Frigo
cannam@127 3 * Copyright (c) 2001 Massachusetts Institute of Technology
cannam@127 4 *
cannam@127 5 * This program is free software; you can redistribute it and/or modify
cannam@127 6 * it under the terms of the GNU General Public License as published by
cannam@127 7 * the Free Software Foundation; either version 2 of the License, or
cannam@127 8 * (at your option) any later version.
cannam@127 9 *
cannam@127 10 * This program is distributed in the hope that it will be useful,
cannam@127 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
cannam@127 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
cannam@127 13 * GNU General Public License for more details.
cannam@127 14 *
cannam@127 15 * You should have received a copy of the GNU General Public License
cannam@127 16 * along with this program; if not, write to the Free Software
cannam@127 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
cannam@127 18 *
cannam@127 19 */
cannam@127 20
cannam@127 21
cannam@127 22 #include "config.h"
cannam@127 23 #include "bench.h"
cannam@127 24 #include <stdio.h>
cannam@127 25 #include <stdlib.h>
cannam@127 26 #include <string.h>
cannam@127 27 #include <ctype.h>
cannam@127 28
/*
 * Padding policy switch consulted by problem_parse() for PROBLEM_REAL
 * problems.  Zero (the default) pads the real side only for in-place
 * problems; any nonzero value pads it for out-of-place problems too.
 */
int always_pad_real = 0;
cannam@127 30
/* How transform_n() maps a dimension length n when strides are derived. */
typedef enum {
     SAME,     /* n is used unchanged */
     PADDED,   /* 2 * (n/2 + 1) */
     HALFISH   /* n/2 + 1 */
} n_transform;
cannam@127 34
cannam@127 35 /* funny transformations for last dimension of PROBLEM_REAL */
cannam@127 36 static int transform_n(int n, n_transform nt)
cannam@127 37 {
cannam@127 38 switch (nt) {
cannam@127 39 case SAME: return n;
cannam@127 40 case PADDED: return 2*(n/2+1);
cannam@127 41 case HALFISH: return (n/2+1);
cannam@127 42 default: BENCH_ASSERT(0); return 0;
cannam@127 43 }
cannam@127 44 }
cannam@127 45
cannam@127 46 /* do what I mean */
cannam@127 47 static bench_tensor *dwim(bench_tensor *t, bench_iodim **last_iodim,
cannam@127 48 n_transform nti, n_transform nto,
cannam@127 49 bench_iodim *dt)
cannam@127 50 {
cannam@127 51 int i;
cannam@127 52 bench_iodim *d, *d1;
cannam@127 53
cannam@127 54 if (!BENCH_FINITE_RNK(t->rnk) || t->rnk < 1)
cannam@127 55 return t;
cannam@127 56
cannam@127 57 i = t->rnk;
cannam@127 58 d1 = *last_iodim;
cannam@127 59
cannam@127 60 while (--i >= 0) {
cannam@127 61 d = t->dims + i;
cannam@127 62 if (!d->is)
cannam@127 63 d->is = d1->is * transform_n(d1->n, d1==dt ? nti : SAME);
cannam@127 64 if (!d->os)
cannam@127 65 d->os = d1->os * transform_n(d1->n, d1==dt ? nto : SAME);
cannam@127 66 d1 = d;
cannam@127 67 }
cannam@127 68
cannam@127 69 *last_iodim = d1;
cannam@127 70 return t;
cannam@127 71 }
cannam@127 72
cannam@127 73 static void transpose_tensor(bench_tensor *t)
cannam@127 74 {
cannam@127 75 if (!BENCH_FINITE_RNK(t->rnk) || t->rnk < 2)
cannam@127 76 return;
cannam@127 77
cannam@127 78 t->dims[0].os = t->dims[1].os;
cannam@127 79 t->dims[1].os = t->dims[0].os * t->dims[0].n;
cannam@127 80 }
cannam@127 81
/*
 * Parse a decimal integer at s and store it in *n.
 *
 * Accepted form: an optional '+' or '-', one or more decimal digits,
 * then an optional 'k'/'K' suffix (value multiplied by 1024) and an
 * optional 'm'/'M' suffix (value multiplied by 1024*1024).  The two
 * suffix tests are independent, so "k" directly followed by "m" applies
 * both multipliers.
 *
 * At least one digit is required; this is enforced with BENCH_ASSERT.
 * No overflow checking is performed.
 *
 * Returns a pointer to the first character that was not consumed.
 */
static const char *parseint(const char *s, int *n)
{
     int sign = 1;

     *n = 0;

     if (*s == '-') {
          sign = -1;
          ++s;
     } else if (*s == '+') {
          ++s;
     }

     /*
      * The <ctype.h> classifiers are only defined for arguments that are
      * representable as unsigned char (or EOF); a plain char may be
      * negative, so convert before calling isdigit().
      */
     BENCH_ASSERT(isdigit((unsigned char) *s));
     while (isdigit((unsigned char) *s)) {
          *n = *n * 10 + (*s - '0');
          ++s;
     }

     *n *= sign;

     if (*s == 'k' || *s == 'K') {
          *n *= 1024;
          ++s;
     }

     if (*s == 'm' || *s == 'M') {
          *n *= 1024 * 1024;
          ++s;
     }

     return s;
}
cannam@127 116
cannam@127 117 struct dimlist { bench_iodim car; r2r_kind_t k; struct dimlist *cdr; };
cannam@127 118
cannam@127 119 static const char *parsetensor(const char *s, bench_tensor **tp,
cannam@127 120 r2r_kind_t **k)
cannam@127 121 {
cannam@127 122 struct dimlist *l = 0, *m;
cannam@127 123 bench_tensor *t;
cannam@127 124 int rnk = 0;
cannam@127 125
cannam@127 126 L1:
cannam@127 127 m = (struct dimlist *)bench_malloc(sizeof(struct dimlist));
cannam@127 128 /* nconc onto l */
cannam@127 129 m->cdr = l; l = m;
cannam@127 130 ++rnk;
cannam@127 131
cannam@127 132 s = parseint(s, &m->car.n);
cannam@127 133
cannam@127 134 if (*s == ':') {
cannam@127 135 /* read input stride */
cannam@127 136 ++s;
cannam@127 137 s = parseint(s, &m->car.is);
cannam@127 138 if (*s == ':') {
cannam@127 139 /* read output stride */
cannam@127 140 ++s;
cannam@127 141 s = parseint(s, &m->car.os);
cannam@127 142 } else {
cannam@127 143 /* default */
cannam@127 144 m->car.os = m->car.is;
cannam@127 145 }
cannam@127 146 } else {
cannam@127 147 m->car.is = 0;
cannam@127 148 m->car.os = 0;
cannam@127 149 }
cannam@127 150
cannam@127 151 if (*s == 'f' || *s == 'F') {
cannam@127 152 m->k = R2R_R2HC;
cannam@127 153 ++s;
cannam@127 154 }
cannam@127 155 else if (*s == 'b' || *s == 'B') {
cannam@127 156 m->k = R2R_HC2R;
cannam@127 157 ++s;
cannam@127 158 }
cannam@127 159 else if (*s == 'h' || *s == 'H') {
cannam@127 160 m->k = R2R_DHT;
cannam@127 161 ++s;
cannam@127 162 }
cannam@127 163 else if (*s == 'e' || *s == 'E' || *s == 'o' || *s == 'O') {
cannam@127 164 char c = *(s++);
cannam@127 165 int ab;
cannam@127 166
cannam@127 167 s = parseint(s, &ab);
cannam@127 168
cannam@127 169 if (c == 'e' || c == 'E') {
cannam@127 170 if (ab == 0)
cannam@127 171 m->k = R2R_REDFT00;
cannam@127 172 else if (ab == 1)
cannam@127 173 m->k = R2R_REDFT01;
cannam@127 174 else if (ab == 10)
cannam@127 175 m->k = R2R_REDFT10;
cannam@127 176 else if (ab == 11)
cannam@127 177 m->k = R2R_REDFT11;
cannam@127 178 else
cannam@127 179 BENCH_ASSERT(0);
cannam@127 180 }
cannam@127 181 else {
cannam@127 182 if (ab == 0)
cannam@127 183 m->k = R2R_RODFT00;
cannam@127 184 else if (ab == 1)
cannam@127 185 m->k = R2R_RODFT01;
cannam@127 186 else if (ab == 10)
cannam@127 187 m->k = R2R_RODFT10;
cannam@127 188 else if (ab == 11)
cannam@127 189 m->k = R2R_RODFT11;
cannam@127 190 else
cannam@127 191 BENCH_ASSERT(0);
cannam@127 192 }
cannam@127 193 }
cannam@127 194 else
cannam@127 195 m->k = R2R_R2HC;
cannam@127 196
cannam@127 197 if (*s == 'x' || *s == 'X') {
cannam@127 198 ++s;
cannam@127 199 goto L1;
cannam@127 200 }
cannam@127 201
cannam@127 202 /* now we have a dimlist. Build bench_tensor, etc. */
cannam@127 203
cannam@127 204 if (k && rnk > 0) {
cannam@127 205 int i;
cannam@127 206 *k = (r2r_kind_t *) bench_malloc(sizeof(r2r_kind_t) * rnk);
cannam@127 207 for (m = l, i = rnk - 1; i >= 0; --i, m = m->cdr) {
cannam@127 208 BENCH_ASSERT(m);
cannam@127 209 (*k)[i] = m->k;
cannam@127 210 }
cannam@127 211 }
cannam@127 212
cannam@127 213 t = mktensor(rnk);
cannam@127 214 while (--rnk >= 0) {
cannam@127 215 bench_iodim *d = t->dims + rnk;
cannam@127 216 BENCH_ASSERT(l);
cannam@127 217 m = l; l = m->cdr;
cannam@127 218 d->n = m->car.n;
cannam@127 219 d->is = m->car.is;
cannam@127 220 d->os = m->car.os;
cannam@127 221 bench_free(m);
cannam@127 222 }
cannam@127 223
cannam@127 224 *tp = t;
cannam@127 225 return s;
cannam@127 226 }
cannam@127 227
cannam@127 228 /* parse a problem description, return a problem */
cannam@127 229 bench_problem *problem_parse(const char *s)
cannam@127 230 {
cannam@127 231 bench_problem *p;
cannam@127 232 bench_iodim last_iodim0 = {1,1,1}, *last_iodim = &last_iodim0;
cannam@127 233 bench_iodim *sz_last_iodim;
cannam@127 234 bench_tensor *sz;
cannam@127 235 n_transform nti = SAME, nto = SAME;
cannam@127 236 int transpose = 0;
cannam@127 237
cannam@127 238 p = (bench_problem *) bench_malloc(sizeof(bench_problem));
cannam@127 239 p->kind = PROBLEM_COMPLEX;
cannam@127 240 p->k = 0;
cannam@127 241 p->sign = -1;
cannam@127 242 p->in = p->out = 0;
cannam@127 243 p->inphys = p->outphys = 0;
cannam@127 244 p->iphyssz = p->ophyssz = 0;
cannam@127 245 p->in_place = 0;
cannam@127 246 p->destroy_input = 0;
cannam@127 247 p->split = 0;
cannam@127 248 p->userinfo = 0;
cannam@127 249 p->scrambled_in = p->scrambled_out = 0;
cannam@127 250 p->sz = p->vecsz = 0;
cannam@127 251 p->ini = p->outi = 0;
cannam@127 252 p->pstring = (char *) bench_malloc(sizeof(char) * (strlen(s) + 1));
cannam@127 253 strcpy(p->pstring, s);
cannam@127 254
cannam@127 255 L1:
cannam@127 256 switch (tolower(*s)) {
cannam@127 257 case 'i': p->in_place = 1; ++s; goto L1;
cannam@127 258 case 'o': p->in_place = 0; ++s; goto L1;
cannam@127 259 case 'd': p->destroy_input = 1; ++s; goto L1;
cannam@127 260 case '/': p->split = 1; ++s; goto L1;
cannam@127 261 case 'f':
cannam@127 262 case '-': p->sign = -1; ++s; goto L1;
cannam@127 263 case 'b':
cannam@127 264 case '+': p->sign = 1; ++s; goto L1;
cannam@127 265 case 'r': p->kind = PROBLEM_REAL; ++s; goto L1;
cannam@127 266 case 'c': p->kind = PROBLEM_COMPLEX; ++s; goto L1;
cannam@127 267 case 'k': p->kind = PROBLEM_R2R; ++s; goto L1;
cannam@127 268 case 't': transpose = 1; ++s; goto L1;
cannam@127 269
cannam@127 270 /* hack for MPI: */
cannam@127 271 case '[': p->scrambled_in = 1; ++s; goto L1;
cannam@127 272 case ']': p->scrambled_out = 1; ++s; goto L1;
cannam@127 273
cannam@127 274 default : ;
cannam@127 275 }
cannam@127 276
cannam@127 277 s = parsetensor(s, &sz, p->kind == PROBLEM_R2R ? &p->k : 0);
cannam@127 278
cannam@127 279 if (p->kind == PROBLEM_REAL) {
cannam@127 280 if (p->sign < 0) {
cannam@127 281 nti = p->in_place || always_pad_real ? PADDED : SAME;
cannam@127 282 nto = HALFISH;
cannam@127 283 }
cannam@127 284 else {
cannam@127 285 nti = HALFISH;
cannam@127 286 nto = p->in_place || always_pad_real ? PADDED : SAME;
cannam@127 287 }
cannam@127 288 }
cannam@127 289
cannam@127 290 sz_last_iodim = sz->dims + sz->rnk - 1;
cannam@127 291 if (*s == '*') { /* "external" vector */
cannam@127 292 ++s;
cannam@127 293 p->sz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim);
cannam@127 294 s = parsetensor(s, &sz, 0);
cannam@127 295 p->vecsz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim);
cannam@127 296 } else if (*s == 'v' || *s == 'V') { /* "internal" vector */
cannam@127 297 bench_tensor *vecsz;
cannam@127 298 ++s;
cannam@127 299 s = parsetensor(s, &vecsz, 0);
cannam@127 300 p->vecsz = dwim(vecsz, &last_iodim, nti, nto, sz_last_iodim);
cannam@127 301 p->sz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim);
cannam@127 302 } else {
cannam@127 303 p->sz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim);
cannam@127 304 p->vecsz = mktensor(0);
cannam@127 305 }
cannam@127 306
cannam@127 307 if (transpose) {
cannam@127 308 transpose_tensor(p->sz);
cannam@127 309 transpose_tensor(p->vecsz);
cannam@127 310 }
cannam@127 311
cannam@127 312 if (!p->in_place)
cannam@127 313 p->out = ((bench_real *) p->in) + (1 << 20); /* whatever */
cannam@127 314
cannam@127 315 BENCH_ASSERT(p->sz && p->vecsz);
cannam@127 316 BENCH_ASSERT(!*s);
cannam@127 317 return p;
cannam@127 318 }
cannam@127 319
cannam@127 320 void problem_destroy(bench_problem *p)
cannam@127 321 {
cannam@127 322 BENCH_ASSERT(p);
cannam@127 323 problem_free(p);
cannam@127 324 bench_free0(p->k);
cannam@127 325 bench_free0(p->pstring);
cannam@127 326 bench_free(p);
cannam@127 327 }
cannam@127 328