cannam@167: /* cannam@167: * Copyright (c) 2001 Matteo Frigo cannam@167: * Copyright (c) 2001 Massachusetts Institute of Technology cannam@167: * cannam@167: * This program is free software; you can redistribute it and/or modify cannam@167: * it under the terms of the GNU General Public License as published by cannam@167: * the Free Software Foundation; either version 2 of the License, or cannam@167: * (at your option) any later version. cannam@167: * cannam@167: * This program is distributed in the hope that it will be useful, cannam@167: * but WITHOUT ANY WARRANTY; without even the implied warranty of cannam@167: * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the cannam@167: * GNU General Public License for more details. cannam@167: * cannam@167: * You should have received a copy of the GNU General Public License cannam@167: * along with this program; if not, write to the Free Software cannam@167: * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA cannam@167: * cannam@167: */ cannam@167: cannam@167: cannam@167: #include "config.h" cannam@167: #include "libbench2/bench.h" cannam@167: #include cannam@167: #include cannam@167: #include cannam@167: #include cannam@167: cannam@167: int always_pad_real = 0; /* by default, only pad in-place case */ cannam@167: cannam@167: typedef enum { cannam@167: SAME, PADDED, HALFISH cannam@167: } n_transform; cannam@167: cannam@167: /* funny transformations for last dimension of PROBLEM_REAL */ cannam@167: static int transform_n(int n, n_transform nt) cannam@167: { cannam@167: switch (nt) { cannam@167: case SAME: return n; cannam@167: case PADDED: return 2*(n/2+1); cannam@167: case HALFISH: return (n/2+1); cannam@167: default: BENCH_ASSERT(0); return 0; cannam@167: } cannam@167: } cannam@167: cannam@167: /* do what I mean */ cannam@167: static bench_tensor *dwim(bench_tensor *t, bench_iodim **last_iodim, cannam@167: n_transform nti, n_transform nto, cannam@167: bench_iodim *dt) cannam@167: { cannam@167: int i; cannam@167: bench_iodim *d, *d1; cannam@167: cannam@167: if (!BENCH_FINITE_RNK(t->rnk) || t->rnk < 1) cannam@167: return t; cannam@167: cannam@167: i = t->rnk; cannam@167: d1 = *last_iodim; cannam@167: cannam@167: while (--i >= 0) { cannam@167: d = t->dims + i; cannam@167: if (!d->is) cannam@167: d->is = d1->is * transform_n(d1->n, d1==dt ? nti : SAME); cannam@167: if (!d->os) cannam@167: d->os = d1->os * transform_n(d1->n, d1==dt ? nto : SAME); cannam@167: d1 = d; cannam@167: } cannam@167: cannam@167: *last_iodim = d1; cannam@167: return t; cannam@167: } cannam@167: cannam@167: static void transpose_tensor(bench_tensor *t) cannam@167: { cannam@167: if (!BENCH_FINITE_RNK(t->rnk) || t->rnk < 2) cannam@167: return; cannam@167: cannam@167: t->dims[0].os = t->dims[1].os; cannam@167: t->dims[1].os = t->dims[0].os * t->dims[0].n; cannam@167: } cannam@167: cannam@167: static const char *parseint(const char *s, int *n) cannam@167: { cannam@167: int sign = 1; cannam@167: cannam@167: *n = 0; cannam@167: cannam@167: if (*s == '-') { cannam@167: sign = -1; cannam@167: ++s; cannam@167: } else if (*s == '+') { cannam@167: sign = +1; cannam@167: ++s; cannam@167: } cannam@167: cannam@167: BENCH_ASSERT(isdigit(*s)); cannam@167: while (isdigit(*s)) { cannam@167: *n = *n * 10 + (*s - '0'); cannam@167: ++s; cannam@167: } cannam@167: cannam@167: *n *= sign; cannam@167: cannam@167: if (*s == 'k' || *s == 'K') { cannam@167: *n *= 1024; cannam@167: ++s; cannam@167: } cannam@167: cannam@167: if (*s == 'm' || *s == 'M') { cannam@167: *n *= 1024 * 1024; cannam@167: ++s; cannam@167: } cannam@167: cannam@167: return s; cannam@167: } cannam@167: cannam@167: struct dimlist { bench_iodim car; r2r_kind_t k; struct dimlist *cdr; }; cannam@167: cannam@167: static const char *parsetensor(const char *s, bench_tensor **tp, cannam@167: r2r_kind_t **k) cannam@167: { cannam@167: struct dimlist *l = 0, *m; cannam@167: bench_tensor *t; cannam@167: int rnk = 0; cannam@167: cannam@167: L1: cannam@167: m = (struct dimlist *)bench_malloc(sizeof(struct dimlist)); cannam@167: /* nconc onto l */ cannam@167: m->cdr = l; l = m; cannam@167: ++rnk; cannam@167: cannam@167: s = parseint(s, &m->car.n); cannam@167: cannam@167: if (*s == ':') { cannam@167: /* read input stride */ cannam@167: ++s; cannam@167: s = parseint(s, &m->car.is); cannam@167: if (*s == ':') { cannam@167: /* read output stride */ cannam@167: ++s; cannam@167: s = parseint(s, &m->car.os); cannam@167: } else { cannam@167: /* default */ cannam@167: m->car.os = m->car.is; cannam@167: } cannam@167: } else { cannam@167: m->car.is = 0; cannam@167: m->car.os = 0; cannam@167: } cannam@167: cannam@167: if (*s == 'f' || *s == 'F') { cannam@167: m->k = R2R_R2HC; cannam@167: ++s; cannam@167: } cannam@167: else if (*s == 'b' || *s == 'B') { cannam@167: m->k = R2R_HC2R; cannam@167: ++s; cannam@167: } cannam@167: else if (*s == 'h' || *s == 'H') { cannam@167: m->k = R2R_DHT; cannam@167: ++s; cannam@167: } cannam@167: else if (*s == 'e' || *s == 'E' || *s == 'o' || *s == 'O') { cannam@167: char c = *(s++); cannam@167: int ab; cannam@167: cannam@167: s = parseint(s, &ab); cannam@167: cannam@167: if (c == 'e' || c == 'E') { cannam@167: if (ab == 0) cannam@167: m->k = R2R_REDFT00; cannam@167: else if (ab == 1) cannam@167: m->k = R2R_REDFT01; cannam@167: else if (ab == 10) cannam@167: m->k = R2R_REDFT10; cannam@167: else if (ab == 11) cannam@167: m->k = R2R_REDFT11; cannam@167: else cannam@167: BENCH_ASSERT(0); cannam@167: } cannam@167: else { cannam@167: if (ab == 0) cannam@167: m->k = R2R_RODFT00; cannam@167: else if (ab == 1) cannam@167: m->k = R2R_RODFT01; cannam@167: else if (ab == 10) cannam@167: m->k = R2R_RODFT10; cannam@167: else if (ab == 11) cannam@167: m->k = R2R_RODFT11; cannam@167: else cannam@167: BENCH_ASSERT(0); cannam@167: } cannam@167: } cannam@167: else cannam@167: m->k = R2R_R2HC; cannam@167: cannam@167: if (*s == 'x' || *s == 'X') { cannam@167: ++s; cannam@167: goto L1; cannam@167: } cannam@167: cannam@167: /* now we have a dimlist. Build bench_tensor, etc. */ cannam@167: cannam@167: if (k && rnk > 0) { cannam@167: int i; cannam@167: *k = (r2r_kind_t *) bench_malloc(sizeof(r2r_kind_t) * rnk); cannam@167: for (m = l, i = rnk - 1; i >= 0; --i, m = m->cdr) { cannam@167: BENCH_ASSERT(m); cannam@167: (*k)[i] = m->k; cannam@167: } cannam@167: } cannam@167: cannam@167: t = mktensor(rnk); cannam@167: while (--rnk >= 0) { cannam@167: bench_iodim *d = t->dims + rnk; cannam@167: BENCH_ASSERT(l); cannam@167: m = l; l = m->cdr; cannam@167: d->n = m->car.n; cannam@167: d->is = m->car.is; cannam@167: d->os = m->car.os; cannam@167: bench_free(m); cannam@167: } cannam@167: cannam@167: *tp = t; cannam@167: return s; cannam@167: } cannam@167: cannam@167: /* parse a problem description, return a problem */ cannam@167: bench_problem *problem_parse(const char *s) cannam@167: { cannam@167: bench_problem *p; cannam@167: bench_iodim last_iodim0 = {1,1,1}, *last_iodim = &last_iodim0; cannam@167: bench_iodim *sz_last_iodim; cannam@167: bench_tensor *sz; cannam@167: n_transform nti = SAME, nto = SAME; cannam@167: int transpose = 0; cannam@167: cannam@167: p = (bench_problem *) bench_malloc(sizeof(bench_problem)); cannam@167: p->kind = PROBLEM_COMPLEX; cannam@167: p->k = 0; cannam@167: p->sign = -1; cannam@167: p->in = p->out = 0; cannam@167: p->inphys = p->outphys = 0; cannam@167: p->iphyssz = p->ophyssz = 0; cannam@167: p->in_place = 0; cannam@167: p->destroy_input = 0; cannam@167: p->split = 0; cannam@167: p->userinfo = 0; cannam@167: p->scrambled_in = p->scrambled_out = 0; cannam@167: p->sz = p->vecsz = 0; cannam@167: p->ini = p->outi = 0; cannam@167: p->pstring = (char *) bench_malloc(sizeof(char) * (strlen(s) + 1)); cannam@167: strcpy(p->pstring, s); cannam@167: cannam@167: L1: cannam@167: switch (tolower(*s)) { cannam@167: case 'i': p->in_place = 1; ++s; goto L1; cannam@167: case 'o': p->in_place = 0; ++s; goto L1; cannam@167: case 'd': p->destroy_input = 1; ++s; goto L1; cannam@167: case '/': p->split = 1; ++s; goto L1; cannam@167: case 'f': cannam@167: case '-': p->sign = -1; ++s; goto L1; cannam@167: case 'b': cannam@167: case '+': p->sign = 1; ++s; goto L1; cannam@167: case 'r': p->kind = PROBLEM_REAL; ++s; goto L1; cannam@167: case 'c': p->kind = PROBLEM_COMPLEX; ++s; goto L1; cannam@167: case 'k': p->kind = PROBLEM_R2R; ++s; goto L1; cannam@167: case 't': transpose = 1; ++s; goto L1; cannam@167: cannam@167: /* hack for MPI: */ cannam@167: case '[': p->scrambled_in = 1; ++s; goto L1; cannam@167: case ']': p->scrambled_out = 1; ++s; goto L1; cannam@167: cannam@167: default : ; cannam@167: } cannam@167: cannam@167: s = parsetensor(s, &sz, p->kind == PROBLEM_R2R ? &p->k : 0); cannam@167: cannam@167: if (p->kind == PROBLEM_REAL) { cannam@167: if (p->sign < 0) { cannam@167: nti = p->in_place || always_pad_real ? PADDED : SAME; cannam@167: nto = HALFISH; cannam@167: } cannam@167: else { cannam@167: nti = HALFISH; cannam@167: nto = p->in_place || always_pad_real ? PADDED : SAME; cannam@167: } cannam@167: } cannam@167: cannam@167: sz_last_iodim = sz->dims + sz->rnk - 1; cannam@167: if (*s == '*') { /* "external" vector */ cannam@167: ++s; cannam@167: p->sz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim); cannam@167: s = parsetensor(s, &sz, 0); cannam@167: p->vecsz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim); cannam@167: } else if (*s == 'v' || *s == 'V') { /* "internal" vector */ cannam@167: bench_tensor *vecsz; cannam@167: ++s; cannam@167: s = parsetensor(s, &vecsz, 0); cannam@167: p->vecsz = dwim(vecsz, &last_iodim, nti, nto, sz_last_iodim); cannam@167: p->sz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim); cannam@167: } else { cannam@167: p->sz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim); cannam@167: p->vecsz = mktensor(0); cannam@167: } cannam@167: cannam@167: if (transpose) { cannam@167: transpose_tensor(p->sz); cannam@167: transpose_tensor(p->vecsz); cannam@167: } cannam@167: cannam@167: if (!p->in_place) cannam@167: p->out = ((bench_real *) p->in) + (1 << 20); /* whatever */ cannam@167: cannam@167: BENCH_ASSERT(p->sz && p->vecsz); cannam@167: BENCH_ASSERT(!*s); cannam@167: return p; cannam@167: } cannam@167: cannam@167: void problem_destroy(bench_problem *p) cannam@167: { cannam@167: BENCH_ASSERT(p); cannam@167: problem_free(p); cannam@167: bench_free0(p->k); cannam@167: bench_free0(p->pstring); cannam@167: bench_free(p); cannam@167: } cannam@167: