annotate src/fftw-3.3.8/libbench2/bench-user.h @ 168:ceec0dd9ec9c

Replace these with versions built using an older toolset (so as to avoid ABI incompatibilities when linking on Ubuntu 14.04 for packaging purposes)
author Chris Cannam <cannam@all-day-breakfast.com>
date Fri, 07 Feb 2020 11:51:13 +0000
parents bd3cc4d1df30
children
rev   line source
cannam@167 1 /*
cannam@167 2 * Copyright (c) 2001 Matteo Frigo
cannam@167 3 * Copyright (c) 2001 Massachusetts Institute of Technology
cannam@167 4 *
cannam@167 5 * This program is free software; you can redistribute it and/or modify
cannam@167 6 * it under the terms of the GNU General Public License as published by
cannam@167 7 * the Free Software Foundation; either version 2 of the License, or
cannam@167 8 * (at your option) any later version.
cannam@167 9 *
cannam@167 10 * This program is distributed in the hope that it will be useful,
cannam@167 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
cannam@167 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
cannam@167 13 * GNU General Public License for more details.
cannam@167 14 *
cannam@167 15 * You should have received a copy of the GNU General Public License
cannam@167 16 * along with this program; if not, write to the Free Software
cannam@167 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
cannam@167 18 *
cannam@167 19 */
cannam@167 20
cannam@167 21 #ifndef __BENCH_USER_H__
cannam@167 22 #define __BENCH_USER_H__
cannam@167 23
cannam@167 24 #ifdef __cplusplus
cannam@167 25 extern "C" {
cannam@167 26 #endif /* __cplusplus */
cannam@167 27
cannam@167 28 /* benchmark program definitions for user code */
cannam@167 29 #include "config.h"
cannam@167 30 #include <limits.h>
cannam@167 31
cannam@167 32 #if HAVE_STDDEF_H
cannam@167 33 #include <stddef.h>
cannam@167 34 #endif
cannam@167 35
cannam@167 36 #if HAVE_STDLIB_H
cannam@167 37 #include <stdlib.h>
cannam@167 38 #endif
cannam@167 39
cannam@167 40 #if defined(BENCHFFT_SINGLE) /* bench_real: the first BENCHFFT_* precision macro that is defined wins */
cannam@167 41 typedef float bench_real;
cannam@167 42 #elif defined(BENCHFFT_LDOUBLE)
cannam@167 43 typedef long double bench_real;
cannam@167 44 #elif defined(BENCHFFT_QUAD)
cannam@167 45 typedef __float128 bench_real; /* __float128 is a compiler extension, not standard C */
cannam@167 46 #else
cannam@167 47 typedef double bench_real; /* default when no BENCHFFT_* precision macro is defined */
cannam@167 48 #endif
cannam@167 49
cannam@167 50 typedef bench_real bench_complex[2]; /* complex value stored as a two-element bench_real array */
cannam@167 51
cannam@167 52 #define c_re(c) ((c)[0]) /* element 0 of a bench_complex: real part */
cannam@167 53 #define c_im(c) ((c)[1]) /* element 1 of a bench_complex: imaginary part */
cannam@167 54
cannam@167 55 #undef DOUBLE_PRECISION
cannam@167 56 #define DOUBLE_PRECISION (sizeof(bench_real) == sizeof(double)) /* sizeof-based: usable in C expressions, not in #if */
cannam@167 57 #undef SINGLE_PRECISION
cannam@167 58 #define SINGLE_PRECISION (!DOUBLE_PRECISION && sizeof(bench_real) == sizeof(float))
cannam@167 59 #undef LDOUBLE_PRECISION
cannam@167 60 #define LDOUBLE_PRECISION (!DOUBLE_PRECISION && sizeof(bench_real) == sizeof(long double)) /* the !DOUBLE_PRECISION guard makes this 0 whenever bench_real has the size of double */
cannam@167 61
cannam@167 62 #undef QUAD_PRECISION
cannam@167 63 #ifdef BENCHFFT_QUAD
cannam@167 64 #define QUAD_PRECISION (!LDOUBLE_PRECISION && sizeof(bench_real) == sizeof(__float128)) /* NOTE(review): evaluates to 0 where sizeof(long double) == sizeof(__float128), since LDOUBLE_PRECISION is then nonzero -- confirm intended */
cannam@167 65 #else
cannam@167 66 #define QUAD_PRECISION 0 /* __float128 is only named when BENCHFFT_QUAD is defined */
cannam@167 67 #endif
cannam@167 68
cannam@167 69 typedef enum { PROBLEM_COMPLEX, PROBLEM_REAL, PROBLEM_R2R } problem_kind_t; /* type of bench_problem.kind */
cannam@167 70
cannam@167 71 typedef enum {
cannam@167 72 R2R_R2HC, R2R_HC2R, R2R_DHT,
cannam@167 73 R2R_REDFT00, R2R_REDFT01, R2R_REDFT10, R2R_REDFT11,
cannam@167 74 R2R_RODFT00, R2R_RODFT01, R2R_RODFT10, R2R_RODFT11
cannam@167 75 } r2r_kind_t; /* element type of bench_problem.k; names presumably mirror the library's real-to-real transform kinds -- confirm */
cannam@167 76
cannam@167 77 typedef struct {
cannam@167 78 int n; /* presumably the extent of this dimension -- confirm */
cannam@167 79 int is; /* input stride */
cannam@167 80 int os; /* output stride */
cannam@167 81 } bench_iodim;
cannam@167 82
cannam@167 83 typedef struct {
cannam@167 84 int rnk; /* rank; presumably may hold BENCH_RNK_MINFTY (test with BENCH_FINITE_RNK) -- confirm */
cannam@167 85 bench_iodim *dims; /* presumably rnk entries -- confirm against mktensor */
cannam@167 86 } bench_tensor;
cannam@167 87
cannam@167 88 bench_tensor *mktensor(int rnk); /* NOTE(review): ownership of returned tensors is not stated here; presumably released with tensor_destroy -- confirm */
cannam@167 89 void tensor_destroy(bench_tensor *sz);
cannam@167 90 size_t tensor_sz(const bench_tensor *sz);
cannam@167 91 bench_tensor *tensor_compress(const bench_tensor *sz);
cannam@167 92 int tensor_unitstridep(bench_tensor *t); /* the trailing 'p' presumably marks a predicate (nonzero = true) -- confirm */
cannam@167 93 int tensor_rowmajorp(bench_tensor *t);
cannam@167 94 int tensor_real_rowmajorp(bench_tensor *t, int sign, int in_place);
cannam@167 95 bench_tensor *tensor_append(const bench_tensor *a, const bench_tensor *b);
cannam@167 96 bench_tensor *tensor_copy(const bench_tensor *sz);
cannam@167 97 bench_tensor *tensor_copy_sub(const bench_tensor *sz, int start_dim, int rnk);
cannam@167 98 bench_tensor *tensor_copy_swapio(const bench_tensor *sz);
cannam@167 99 void tensor_ibounds(bench_tensor *t, int *lbp, int *ubp); /* presumably stores lower/upper input bounds through lbp/ubp -- confirm */
cannam@167 100 void tensor_obounds(bench_tensor *t, int *lbp, int *ubp); /* output-side counterpart of tensor_ibounds, judging by the name -- confirm */
cannam@167 101
cannam@167 102 /*
cannam@167 103 Definition of rank -infinity, which is encoded as INT_MAX.
cannam@167 104 This definition has the property that if you want rank 0 or 1,
cannam@167 105 you can simply test for rank <= 1 (INT_MAX fails that test). This is a common case.
cannam@167 106
cannam@167 107 A tensor of rank -infinity has size 0.
cannam@167 108 */
cannam@167 109 #define BENCH_RNK_MINFTY INT_MAX
cannam@167 110 #define BENCH_FINITE_RNK(rnk) ((rnk) != BENCH_RNK_MINFTY) /* nonzero unless rnk is the -infinity sentinel */
cannam@167 111
cannam@167 112 typedef struct {
cannam@167 113 problem_kind_t kind; /* PROBLEM_COMPLEX, PROBLEM_REAL or PROBLEM_R2R */
cannam@167 114 r2r_kind_t *k; /* presumably the per-dimension kinds of a PROBLEM_R2R problem -- confirm */
cannam@167 115 bench_tensor *sz; /* presumably the transform dimensions -- confirm */
cannam@167 116 bench_tensor *vecsz; /* presumably the vector (batch) dimensions -- confirm */
cannam@167 117 int sign; /* presumably the transform direction -- confirm */
cannam@167 118 int in_place;
cannam@167 119 int destroy_input;
cannam@167 120 int split; /* presumably selects separate real/imaginary arrays -- confirm */
cannam@167 121 void *in, *out;
cannam@167 122 void *inphys, *outphys; /* NOTE(review): relation to in/out is not visible here; check problem_alloc */
cannam@167 123 int iphyssz, ophyssz; /* sizes paired with inphys/outphys by name; units not visible here */
cannam@167 124 char *pstring; /* presumably the textual problem description -- confirm */
cannam@167 125 void *userinfo; /* user can store whatever */
cannam@167 126 int scrambled_in, scrambled_out; /* hack for MPI */
cannam@167 127
cannam@167 128 /* internal hack so that we can use verifier in FFTW test program */
cannam@167 129 void *ini, *outi; /* if nonzero, point to imag. parts for dft */
cannam@167 130
cannam@167 131 /* another internal hack to avoid passing around too many parameters */
cannam@167 132 double setup_time;
cannam@167 133 } bench_problem;
cannam@167 134
cannam@167 135 extern int verbose; /* declaration only; the definition lives in another translation unit */
cannam@167 136
cannam@167 137 extern int no_speed_allocation; /* declaration only */
cannam@167 138
cannam@167 139 extern int always_pad_real; /* declaration only */
cannam@167 140
cannam@167 141 #define LIBBENCH_TIMER 0 /* timer index; presumably reserved for the benchmark library itself -- confirm */
cannam@167 142 #define USER_TIMER 1 /* timer index; presumably available to user code -- confirm */
cannam@167 143 #define BENCH_NTIMERS 2 /* one more than the highest timer index defined above */
cannam@167 144 extern void timer_start(int which_timer); /* which_timer is presumably LIBBENCH_TIMER or USER_TIMER -- confirm */
cannam@167 145 extern double timer_stop(int which_timer); /* presumably returns the time elapsed since the matching timer_start; units not visible here */
cannam@167 146
cannam@167 147 extern int can_do(bench_problem *p); /* NOTE(review): this group looks like the hooks a benchmark program supplies -- confirm which side defines each */
cannam@167 148 extern void setup(bench_problem *p);
cannam@167 149 extern void doit(int iter, bench_problem *p); /* iter is presumably the number of repetitions to run -- confirm */
cannam@167 150 extern void done(bench_problem *p);
cannam@167 151 extern void main_init(int *argc, char ***argv); /* takes pointers, so it can presumably rewrite argc/argv -- confirm */
cannam@167 152 extern void cleanup(void);
cannam@167 153 extern void verify(const char *param, int rounds, double tol);
cannam@167 154 extern void useropt(const char *arg);
cannam@167 155
cannam@167 156 extern void verify_problem(bench_problem *p, int rounds, double tol); /* takes an already-built bench_problem, unlike verify(), which takes a string */
cannam@167 157
cannam@167 158 extern void problem_alloc(bench_problem *p); /* presumably allocates the buffers referenced by p -- confirm */
cannam@167 159 extern void problem_free(bench_problem *p); /* presumably releases what problem_alloc obtained -- confirm */
cannam@167 160 extern void problem_zero(bench_problem *p);
cannam@167 161 extern void problem_destroy(bench_problem *p); /* NOTE(review): how this differs from problem_free is not visible here */
cannam@167 162
cannam@167 163 extern int power_of_two(int n); /* presumably nonzero when n is a power of two -- confirm */
cannam@167 164 extern int log_2(int n); /* NOTE(review): behavior for n that is not a power of two is not visible here */
cannam@167 165
cannam@167 166
cannam@167 167 #define CASSIGN(out, in) (c_re(out) = c_re(in), c_im(out) = c_im(in)) /* copies both parts; out and in are each evaluated twice, so avoid side effects in the arguments */
cannam@167 168
cannam@167 169 bench_tensor *verify_pack(const bench_tensor *sz, int s);
cannam@167 170
cannam@167 171 typedef struct { /* error figures filled in through the errors* parameter of verify_dft / verify_rdft2 / verify_r2r */
cannam@167 172 double l; /* NOTE(review): meaning of l/i/s is not visible here (possibly linearity / impulse / shift tests) -- confirm against the verifier */
cannam@167 173 double i;
cannam@167 174 double s;
cannam@167 175 } errors;
cannam@167 176
cannam@167 177 void verify_dft(bench_problem *p, int rounds, double tol, errors *e); /* presumably used for PROBLEM_COMPLEX -- confirm */
cannam@167 178 void verify_rdft2(bench_problem *p, int rounds, double tol, errors *e); /* presumably used for PROBLEM_REAL -- confirm */
cannam@167 179 void verify_r2r(bench_problem *p, int rounds, double tol, errors *e); /* presumably used for PROBLEM_R2R -- confirm */
cannam@167 180
cannam@167 181 /**************************************************************/
cannam@167 182 /* routines to override */
cannam@167 183
cannam@167 184 extern void after_problem_ccopy_from(bench_problem *p, bench_real *ri, bench_real *ii); /* ri/ii: presumably separate real and imaginary input arrays -- confirm */
cannam@167 185 extern void after_problem_ccopy_to(bench_problem *p, bench_real *ro, bench_real *io); /* ro/io: presumably separate real and imaginary output arrays -- confirm */
cannam@167 186 extern void after_problem_hccopy_from(bench_problem *p, bench_real *ri, bench_real *ii);
cannam@167 187 extern void after_problem_hccopy_to(bench_problem *p, bench_real *ro, bench_real *io);
cannam@167 188 extern void after_problem_rcopy_from(bench_problem *p, bench_real *ri); /* real-data variant: a single array, no imaginary part */
cannam@167 189 extern void after_problem_rcopy_to(bench_problem *p, bench_real *ro);
cannam@167 190 extern void bench_exit(int status);
cannam@167 191 extern double bench_cost_postprocess(double cost); /* maps a cost value to a cost value; the transformation is defined by the overrider */
cannam@167 192
cannam@167 193 /**************************************************************
cannam@167 194 * malloc
cannam@167 195 **************************************************************/
cannam@167 196 extern void *bench_malloc(size_t size); /* NOTE(review): failure behavior (NULL return vs. abort) is not visible here */
cannam@167 197 extern void bench_free(void *ptr); /* presumably pairs with bench_malloc -- confirm */
cannam@167 198 extern void bench_free0(void *ptr); /* presumably a variant of bench_free that accepts a null pointer -- confirm */
cannam@167 199
cannam@167 200 /**************************************************************
cannam@167 201 * alloca
cannam@167 202 **************************************************************/
cannam@167 203 #ifdef HAVE_ALLOCA_H
cannam@167 204 #include <alloca.h>
cannam@167 205 #endif
cannam@167 206
cannam@167 207 /**************************************************************
cannam@167 208 * assert
cannam@167 209 **************************************************************/
cannam@167 210 extern void bench_assertion_failed(const char *s, int line, const char *file); /* receives the stringified expression, __LINE__ and __FILE__ from BENCH_ASSERT */
cannam@167 211 #define BENCH_ASSERT(ex) \
cannam@167 212 (void)((ex) || (bench_assertion_failed(#ex, __LINE__, __FILE__), 0)) /* expression form; short-circuit || calls the failure handler only when ex is false; not gated on NDEBUG here */
cannam@167 213
cannam@167 214 #define UNUSED(x) (void)(x) /* marks x as deliberately unused; the argument is parenthesized so the cast applies to the whole expression */
cannam@167 215
cannam@167 216 /***************************************
cannam@167 217 * Documentation strings
cannam@167 218 ***************************************/
cannam@167 219 struct bench_doc { /* one key/value documentation entry; built by BENCH_DOC or BENCH_DOCF */
cannam@167 220 const char *key;
cannam@167 221 const char *val; /* literal value; 0 in entries built by BENCH_DOCF */
cannam@167 222 const char *(*f)(void); /* function supplying the value; 0 in entries built by BENCH_DOC */
cannam@167 223 };
cannam@167 224
cannam@167 225 extern struct bench_doc bench_doc[]; /* defined via BEGIN_BENCH_DOC ... END_BENCH_DOC; the last entry is all zeros */
cannam@167 226
cannam@167 227 #ifdef CC /* each *_DOC macro: prefer the plain name, then the BENCH_-prefixed one, else contribute no entry */
cannam@167 228 #define CC_DOC BENCH_DOC("cc", CC)
cannam@167 229 #elif defined(BENCH_CC)
cannam@167 230 #define CC_DOC BENCH_DOC("cc", BENCH_CC)
cannam@167 231 #else
cannam@167 232 #define CC_DOC /* none */
cannam@167 233 #endif
cannam@167 234
cannam@167 235 #ifdef CXX
cannam@167 236 #define CXX_DOC BENCH_DOC("cxx", CXX)
cannam@167 237 #elif defined(BENCH_CXX)
cannam@167 238 #define CXX_DOC BENCH_DOC("cxx", BENCH_CXX)
cannam@167 239 #else
cannam@167 240 #define CXX_DOC /* none */
cannam@167 241 #endif
cannam@167 242
cannam@167 243 #ifdef F77
cannam@167 244 #define F77_DOC BENCH_DOC("f77", F77)
cannam@167 245 #elif defined(BENCH_F77)
cannam@167 246 #define F77_DOC BENCH_DOC("f77", BENCH_F77)
cannam@167 247 #else
cannam@167 248 #define F77_DOC /* none */
cannam@167 249 #endif
cannam@167 250
cannam@167 251 #ifdef F90
cannam@167 252 #define F90_DOC BENCH_DOC("f90", F90)
cannam@167 253 #elif defined(BENCH_F90)
cannam@167 254 #define F90_DOC BENCH_DOC("f90", BENCH_F90)
cannam@167 255 #else
cannam@167 256 #define F90_DOC /* none */
cannam@167 257 #endif
cannam@167 258
cannam@167 259 #define BEGIN_BENCH_DOC \
cannam@167 260 struct bench_doc bench_doc[] = { \
cannam@167 261 CC_DOC \
cannam@167 262 CXX_DOC \
cannam@167 263 F77_DOC \
cannam@167 264 F90_DOC /* opens the bench_doc[] definition; each *_DOC expands to one entry with a trailing comma, or to nothing */
cannam@167 265
cannam@167 266 #define BENCH_DOC(key, val) { key, val, 0 }, /* entry with a literal value; the trailing comma is part of the expansion */
cannam@167 267 #define BENCH_DOCF(key, f) { key, 0, f }, /* entry whose value comes from function f */
cannam@167 268
cannam@167 269 #define END_BENCH_DOC \
cannam@167 270 {0, 0, 0}}; /* all-zero terminating entry, closing brace and semicolon: no ';' is needed after END_BENCH_DOC */
cannam@167 271
cannam@167 272 #ifdef __cplusplus
cannam@167 273 } /* extern "C" */
cannam@167 274 #endif /* __cplusplus */
cannam@167 275
cannam@167 276 #endif /* __BENCH_USER_H__ */