annotate src/fftw-3.3.8/tests/fftw-bench.c @ 169:223a55898ab9 tip default

Add null config files
author Chris Cannam <cannam@all-day-breakfast.com>
date Mon, 02 Mar 2020 14:03:47 +0000
parents bd3cc4d1df30
children
rev   line source
cannam@167 1 /* See bench.c. We keep a few common subroutines in this file so
cannam@167 2 that they can be re-used in the MPI test program. */
cannam@167 3
#include <limits.h>
#include <math.h>
#include <stdio.h>
#include <string.h>
#include "tests/fftw-bench.h"
cannam@167 8
cannam@167 9 /* define to enable code that traps floating-point exceptions.
cannam@167 10 Disabled by default because I don't want to worry about the
cannam@167 11 portability of such code. feenableexcept() seems to be a GNU
cannam@167 12 thing */
cannam@167 13 #undef TRAP_FP_EXCEPTIONS
cannam@167 14
cannam@167 15 #ifdef TRAP_FP_EXCEPTIONS
cannam@167 16 # include <signal.h>
cannam@167 17 # include <fenv.h>
cannam@167 18 #endif
cannam@167 19
cannam@167 20 #ifdef _OPENMP
cannam@167 21 # include <omp.h>
cannam@167 22 #endif
cannam@167 23
cannam@167 24 #ifdef HAVE_SMP
cannam@167 25 int threads_ok = 1;
cannam@167 26 #endif
cannam@167 27
cannam@167 28 FFTW(plan) the_plan = 0;
cannam@167 29
cannam@167 30 static const char *wisdat = "wis.dat";
cannam@167 31 unsigned the_flags = 0;
cannam@167 32 int paranoid = 0;
cannam@167 33 int usewisdom = 0;
cannam@167 34 int havewisdom = 0;
cannam@167 35 int nthreads = 1;
cannam@167 36 int amnesia = 0;
cannam@167 37
cannam@167 38 extern void install_hook(void); /* in hook.c */
cannam@167 39 extern void uninstall_hook(void); /* in hook.c */
cannam@167 40
cannam@167 41 #ifdef FFTW_RANDOM_ESTIMATOR
cannam@167 42 extern unsigned FFTW(random_estimate_seed);
cannam@167 43 #endif
cannam@167 44
cannam@167 45 #ifdef TRAP_FP_EXCEPTIONS
cannam@167 46 static void sigfpe_handler(int sig, siginfo_t *info, void *context)
cannam@167 47 {
cannam@167 48 /* fftw code is not supposed to generate FP exceptions */
cannam@167 49 UNUSED(sig); UNUSED(info); UNUSED(context);
cannam@167 50 fprintf(stderr, "caught FPE, aborting\n");
cannam@167 51 abort();
cannam@167 52 }
cannam@167 53
cannam@167 54 static void setup_sigfpe_handler(void)
cannam@167 55 {
cannam@167 56 struct sigaction a;
cannam@167 57 feenableexcept(FE_DIVBYZERO | FE_INVALID | FE_OVERFLOW | FE_UNDERFLOW);
cannam@167 58 memset(&a, 0, sizeof(a));
cannam@167 59 a.sa_sigaction = sigfpe_handler;
cannam@167 60 a.sa_flags = SA_SIGINFO;
cannam@167 61 if (sigaction(SIGFPE, &a, NULL) == -1) {
cannam@167 62 fprintf(stderr, "cannot install sigfpe handler\n");
cannam@167 63 exit(1);
cannam@167 64 }
cannam@167 65 }
cannam@167 66 #else
/* TRAP_FP_EXCEPTIONS is not defined: there is nothing to set up. */
static void setup_sigfpe_handler(void)
{
     /* intentionally empty */
}
cannam@167 70 #endif
cannam@167 71
cannam@167 72 void useropt(const char *arg)
cannam@167 73 {
cannam@167 74 int x;
cannam@167 75 double y;
cannam@167 76
cannam@167 77 if (!strcmp(arg, "patient")) the_flags |= FFTW_PATIENT;
cannam@167 78 else if (!strcmp(arg, "estimate")) the_flags |= FFTW_ESTIMATE;
cannam@167 79 else if (!strcmp(arg, "estimatepat")) the_flags |= FFTW_ESTIMATE_PATIENT;
cannam@167 80 else if (!strcmp(arg, "exhaustive")) the_flags |= FFTW_EXHAUSTIVE;
cannam@167 81 else if (!strcmp(arg, "unaligned")) the_flags |= FFTW_UNALIGNED;
cannam@167 82 else if (!strcmp(arg, "nosimd")) the_flags |= FFTW_NO_SIMD;
cannam@167 83 else if (!strcmp(arg, "noindirectop")) the_flags |= FFTW_NO_INDIRECT_OP;
cannam@167 84 else if (!strcmp(arg, "wisdom-only")) the_flags |= FFTW_WISDOM_ONLY;
cannam@167 85 else if (sscanf(arg, "flag=%d", &x) == 1) the_flags |= x;
cannam@167 86 else if (sscanf(arg, "bflag=%d", &x) == 1) the_flags |= 1U << x;
cannam@167 87 else if (!strcmp(arg, "paranoid")) paranoid = 1;
cannam@167 88 else if (!strcmp(arg, "wisdom")) usewisdom = 1;
cannam@167 89 else if (!strcmp(arg, "amnesia")) amnesia = 1;
cannam@167 90 else if (sscanf(arg, "nthreads=%d", &x) == 1) nthreads = x;
cannam@167 91 #ifdef FFTW_RANDOM_ESTIMATOR
cannam@167 92 else if (sscanf(arg, "eseed=%d", &x) == 1) FFTW(random_estimate_seed) = x;
cannam@167 93 #endif
cannam@167 94 else if (sscanf(arg, "timelimit=%lg", &y) == 1) {
cannam@167 95 FFTW(set_timelimit)(y);
cannam@167 96 }
cannam@167 97
cannam@167 98 else fprintf(stderr, "unknown user option: %s. Ignoring.\n", arg);
cannam@167 99 }
cannam@167 100
cannam@167 101 void rdwisdom(void)
cannam@167 102 {
cannam@167 103 FILE *f;
cannam@167 104 double tim;
cannam@167 105 int success = 0;
cannam@167 106
cannam@167 107 if (havewisdom) return;
cannam@167 108
cannam@167 109 #ifdef HAVE_SMP
cannam@167 110 if (threads_ok) {
cannam@167 111 BENCH_ASSERT(FFTW(init_threads)());
cannam@167 112 FFTW(plan_with_nthreads)(nthreads);
cannam@167 113 FFTW(make_planner_thread_safe)();
cannam@167 114 #ifdef _OPENMP
cannam@167 115 omp_set_num_threads(nthreads);
cannam@167 116 #endif
cannam@167 117 }
cannam@167 118 else if (nthreads > 1 && verbose > 1) {
cannam@167 119 fprintf(stderr, "bench: WARNING - nthreads = %d, but threads not supported\n", nthreads);
cannam@167 120 nthreads = 1;
cannam@167 121 }
cannam@167 122 #endif
cannam@167 123
cannam@167 124 if (!usewisdom) return;
cannam@167 125
cannam@167 126 timer_start(USER_TIMER);
cannam@167 127 if ((f = fopen(wisdat, "r"))) {
cannam@167 128 if (!import_wisdom(f))
cannam@167 129 fprintf(stderr, "bench: ERROR reading wisdom\n");
cannam@167 130 else
cannam@167 131 success = 1;
cannam@167 132 fclose(f);
cannam@167 133 }
cannam@167 134 tim = timer_stop(USER_TIMER);
cannam@167 135
cannam@167 136 if (success) {
cannam@167 137 if (verbose > 1) printf("READ WISDOM (%g seconds): ", tim);
cannam@167 138
cannam@167 139 if (verbose > 3)
cannam@167 140 export_wisdom(stdout);
cannam@167 141 if (verbose > 1)
cannam@167 142 printf("\n");
cannam@167 143 }
cannam@167 144 havewisdom = 1;
cannam@167 145 }
cannam@167 146
cannam@167 147 void wrwisdom(void)
cannam@167 148 {
cannam@167 149 FILE *f;
cannam@167 150 double tim;
cannam@167 151 if (!havewisdom) return;
cannam@167 152
cannam@167 153 timer_start(USER_TIMER);
cannam@167 154 if ((f = fopen(wisdat, "w"))) {
cannam@167 155 export_wisdom(f);
cannam@167 156 fclose(f);
cannam@167 157 }
cannam@167 158 tim = timer_stop(USER_TIMER);
cannam@167 159 if (verbose > 1) printf("write wisdom took %g seconds\n", tim);
cannam@167 160 }
cannam@167 161
cannam@167 162 static unsigned preserve_input_flags(bench_problem *p)
cannam@167 163 {
cannam@167 164 /*
cannam@167 165 * fftw3 cannot preserve input for multidimensional c2r transforms.
cannam@167 166 * Enforce FFTW_DESTROY_INPUT
cannam@167 167 */
cannam@167 168 if (p->kind == PROBLEM_REAL &&
cannam@167 169 p->sign > 0 &&
cannam@167 170 !p->in_place &&
cannam@167 171 p->sz->rnk > 1)
cannam@167 172 p->destroy_input = 1;
cannam@167 173
cannam@167 174 if (p->destroy_input)
cannam@167 175 return FFTW_DESTROY_INPUT;
cannam@167 176 else
cannam@167 177 return FFTW_PRESERVE_INPUT;
cannam@167 178 }
cannam@167 179
cannam@167 180 int can_do(bench_problem *p)
cannam@167 181 {
cannam@167 182 double tim;
cannam@167 183
cannam@167 184 if (verbose > 2 && p->pstring)
cannam@167 185 printf("Planning %s...\n", p->pstring);
cannam@167 186 rdwisdom();
cannam@167 187
cannam@167 188 timer_start(USER_TIMER);
cannam@167 189 the_plan = mkplan(p, preserve_input_flags(p) | the_flags | FFTW_ESTIMATE);
cannam@167 190 tim = timer_stop(USER_TIMER);
cannam@167 191 if (verbose > 2) printf("estimate-planner time: %g s\n", tim);
cannam@167 192
cannam@167 193 if (the_plan) {
cannam@167 194 FFTW(destroy_plan)(the_plan);
cannam@167 195 return 1;
cannam@167 196 }
cannam@167 197 return 0;
cannam@167 198 }
cannam@167 199
cannam@167 200 void setup(bench_problem *p)
cannam@167 201 {
cannam@167 202 double tim;
cannam@167 203
cannam@167 204 setup_sigfpe_handler();
cannam@167 205
cannam@167 206 if (amnesia) {
cannam@167 207 FFTW(forget_wisdom)();
cannam@167 208 havewisdom = 0;
cannam@167 209 }
cannam@167 210
cannam@167 211 /* Regression test: check that fftw_malloc exists and links
cannam@167 212 * properly */
cannam@167 213 {
cannam@167 214 void *ptr = FFTW(malloc(42));
cannam@167 215 BENCH_ASSERT(FFTW(alignment_of)(ptr) == 0);
cannam@167 216 FFTW(free(ptr));
cannam@167 217 }
cannam@167 218
cannam@167 219 rdwisdom();
cannam@167 220 install_hook();
cannam@167 221
cannam@167 222 #ifdef HAVE_SMP
cannam@167 223 if (verbose > 1 && nthreads > 1) printf("NTHREADS = %d\n", nthreads);
cannam@167 224 #endif
cannam@167 225
cannam@167 226 timer_start(USER_TIMER);
cannam@167 227 the_plan = mkplan(p, preserve_input_flags(p) | the_flags);
cannam@167 228 tim = timer_stop(USER_TIMER);
cannam@167 229 if (verbose > 1) printf("planner time: %g s\n", tim);
cannam@167 230
cannam@167 231 BENCH_ASSERT(the_plan);
cannam@167 232
cannam@167 233 {
cannam@167 234 double add, mul, nfma, cost, pcost;
cannam@167 235 FFTW(flops)(the_plan, &add, &mul, &nfma);
cannam@167 236 cost = FFTW(estimate_cost)(the_plan);
cannam@167 237 pcost = FFTW(cost)(the_plan);
cannam@167 238 if (verbose > 1) {
cannam@167 239 FFTW(print_plan)(the_plan);
cannam@167 240 printf("\n");
cannam@167 241 printf("flops: %0.0f add, %0.0f mul, %0.0f fma\n",
cannam@167 242 add, mul, nfma);
cannam@167 243 printf("estimated cost: %f, pcost = %f\n", cost, pcost);
cannam@167 244 }
cannam@167 245 }
cannam@167 246 }
cannam@167 247
cannam@167 248
cannam@167 249 void doit(int iter, bench_problem *p)
cannam@167 250 {
cannam@167 251 int i;
cannam@167 252 FFTW(plan) q = the_plan;
cannam@167 253
cannam@167 254 UNUSED(p);
cannam@167 255 for (i = 0; i < iter; ++i)
cannam@167 256 FFTW(execute)(q);
cannam@167 257 }
cannam@167 258
cannam@167 259 void done(bench_problem *p)
cannam@167 260 {
cannam@167 261 UNUSED(p);
cannam@167 262
cannam@167 263 FFTW(destroy_plan)(the_plan);
cannam@167 264 uninstall_hook();
cannam@167 265 }
cannam@167 266
cannam@167 267 void cleanup(void)
cannam@167 268 {
cannam@167 269 initial_cleanup();
cannam@167 270
cannam@167 271 wrwisdom();
cannam@167 272 #ifdef HAVE_SMP
cannam@167 273 FFTW(cleanup_threads)();
cannam@167 274 #else
cannam@167 275 FFTW(cleanup)();
cannam@167 276 #endif
cannam@167 277
cannam@167 278 # ifdef FFTW_DEBUG_MALLOC
cannam@167 279 {
cannam@167 280 /* undocumented memory checker */
cannam@167 281 FFTW_EXTERN void FFTW(malloc_print_minfo)(int v);
cannam@167 282 FFTW(malloc_print_minfo)(verbose);
cannam@167 283 }
cannam@167 284 # endif
cannam@167 285
cannam@167 286 final_cleanup();
cannam@167 287 }