Chris@19: /* See bench.c. We keep a few common subroutines in this file so Chris@19: that they can be re-used in the MPI test program. */ Chris@19: Chris@19: #include Chris@19: #include Chris@19: #include Chris@19: #include "fftw-bench.h" Chris@19: Chris@19: #ifdef _OPENMP Chris@19: # include Chris@19: #endif Chris@19: Chris@19: #ifdef HAVE_SMP Chris@19: int threads_ok = 1; Chris@19: #endif Chris@19: Chris@19: FFTW(plan) the_plan = 0; Chris@19: Chris@19: static const char *wisdat = "wis.dat"; Chris@19: unsigned the_flags = 0; Chris@19: int paranoid = 0; Chris@19: int usewisdom = 0; Chris@19: int havewisdom = 0; Chris@19: int nthreads = 1; Chris@19: int amnesia = 0; Chris@19: Chris@19: extern void install_hook(void); /* in hook.c */ Chris@19: extern void uninstall_hook(void); /* in hook.c */ Chris@19: Chris@19: #ifdef FFTW_RANDOM_ESTIMATOR Chris@19: extern unsigned FFTW(random_estimate_seed); Chris@19: #endif Chris@19: Chris@19: void useropt(const char *arg) Chris@19: { Chris@19: int x; Chris@19: double y; Chris@19: Chris@19: if (!strcmp(arg, "patient")) the_flags |= FFTW_PATIENT; Chris@19: else if (!strcmp(arg, "estimate")) the_flags |= FFTW_ESTIMATE; Chris@19: else if (!strcmp(arg, "estimatepat")) the_flags |= FFTW_ESTIMATE_PATIENT; Chris@19: else if (!strcmp(arg, "exhaustive")) the_flags |= FFTW_EXHAUSTIVE; Chris@19: else if (!strcmp(arg, "unaligned")) the_flags |= FFTW_UNALIGNED; Chris@19: else if (!strcmp(arg, "nosimd")) the_flags |= FFTW_NO_SIMD; Chris@19: else if (!strcmp(arg, "noindirectop")) the_flags |= FFTW_NO_INDIRECT_OP; Chris@19: else if (!strcmp(arg, "wisdom-only")) the_flags |= FFTW_WISDOM_ONLY; Chris@19: else if (sscanf(arg, "flag=%d", &x) == 1) the_flags |= x; Chris@19: else if (sscanf(arg, "bflag=%d", &x) == 1) the_flags |= 1U << x; Chris@19: else if (!strcmp(arg, "paranoid")) paranoid = 1; Chris@19: else if (!strcmp(arg, "wisdom")) usewisdom = 1; Chris@19: else if (!strcmp(arg, "amnesia")) amnesia = 1; Chris@19: else if (sscanf(arg, "nthreads=%d", &x) == 1) nthreads = x; Chris@19: #ifdef FFTW_RANDOM_ESTIMATOR Chris@19: else if (sscanf(arg, "eseed=%d", &x) == 1) FFTW(random_estimate_seed) = x; Chris@19: #endif Chris@19: else if (sscanf(arg, "timelimit=%lg", &y) == 1) { Chris@19: FFTW(set_timelimit)(y); Chris@19: } Chris@19: Chris@19: else fprintf(stderr, "unknown user option: %s. Ignoring.\n", arg); Chris@19: } Chris@19: Chris@19: void rdwisdom(void) Chris@19: { Chris@19: FILE *f; Chris@19: double tim; Chris@19: int success = 0; Chris@19: Chris@19: if (havewisdom) return; Chris@19: Chris@19: #ifdef HAVE_SMP Chris@19: if (threads_ok) { Chris@19: BENCH_ASSERT(FFTW(init_threads)()); Chris@19: FFTW(plan_with_nthreads)(nthreads); Chris@19: #ifdef _OPENMP Chris@19: omp_set_num_threads(nthreads); Chris@19: #endif Chris@19: } Chris@19: else if (nthreads > 1 && verbose > 1) { Chris@19: fprintf(stderr, "bench: WARNING - nthreads = %d, but threads not supported\n", nthreads); Chris@19: nthreads = 1; Chris@19: } Chris@19: #endif Chris@19: Chris@19: if (!usewisdom) return; Chris@19: Chris@19: timer_start(USER_TIMER); Chris@19: if ((f = fopen(wisdat, "r"))) { Chris@19: if (!import_wisdom(f)) Chris@19: fprintf(stderr, "bench: ERROR reading wisdom\n"); Chris@19: else Chris@19: success = 1; Chris@19: fclose(f); Chris@19: } Chris@19: tim = timer_stop(USER_TIMER); Chris@19: Chris@19: if (success) { Chris@19: if (verbose > 1) printf("READ WISDOM (%g seconds): ", tim); Chris@19: Chris@19: if (verbose > 3) Chris@19: export_wisdom(stdout); Chris@19: if (verbose > 1) Chris@19: printf("\n"); Chris@19: } Chris@19: havewisdom = 1; Chris@19: } Chris@19: Chris@19: void wrwisdom(void) Chris@19: { Chris@19: FILE *f; Chris@19: double tim; Chris@19: if (!havewisdom) return; Chris@19: Chris@19: timer_start(USER_TIMER); Chris@19: if ((f = fopen(wisdat, "w"))) { Chris@19: export_wisdom(f); Chris@19: fclose(f); Chris@19: } Chris@19: tim = timer_stop(USER_TIMER); Chris@19: if (verbose > 1) printf("write wisdom took %g seconds\n", tim); Chris@19: } Chris@19: Chris@19: static unsigned preserve_input_flags(bench_problem *p) Chris@19: { Chris@19: /* Chris@19: * fftw3 cannot preserve input for multidimensional c2r transforms. Chris@19: * Enforce FFTW_DESTROY_INPUT Chris@19: */ Chris@19: if (p->kind == PROBLEM_REAL && Chris@19: p->sign > 0 && Chris@19: !p->in_place && Chris@19: p->sz->rnk > 1) Chris@19: p->destroy_input = 1; Chris@19: Chris@19: if (p->destroy_input) Chris@19: return FFTW_DESTROY_INPUT; Chris@19: else Chris@19: return FFTW_PRESERVE_INPUT; Chris@19: } Chris@19: Chris@19: int can_do(bench_problem *p) Chris@19: { Chris@19: double tim; Chris@19: Chris@19: if (verbose > 2 && p->pstring) Chris@19: printf("Planning %s...\n", p->pstring); Chris@19: rdwisdom(); Chris@19: Chris@19: timer_start(USER_TIMER); Chris@19: the_plan = mkplan(p, preserve_input_flags(p) | the_flags | FFTW_ESTIMATE); Chris@19: tim = timer_stop(USER_TIMER); Chris@19: if (verbose > 2) printf("estimate-planner time: %g s\n", tim); Chris@19: Chris@19: if (the_plan) { Chris@19: FFTW(destroy_plan)(the_plan); Chris@19: return 1; Chris@19: } Chris@19: return 0; Chris@19: } Chris@19: Chris@19: void setup(bench_problem *p) Chris@19: { Chris@19: double tim; Chris@19: Chris@19: if (amnesia) { Chris@19: FFTW(forget_wisdom)(); Chris@19: havewisdom = 0; Chris@19: } Chris@19: Chris@19: /* Regression test: check that fftw_malloc exists and links Chris@19: * properly */ Chris@19: FFTW(free(FFTW(malloc(42)))); Chris@19: Chris@19: rdwisdom(); Chris@19: install_hook(); Chris@19: Chris@19: #ifdef HAVE_SMP Chris@19: if (verbose > 1 && nthreads > 1) printf("NTHREADS = %d\n", nthreads); Chris@19: #endif Chris@19: Chris@19: timer_start(USER_TIMER); Chris@19: the_plan = mkplan(p, preserve_input_flags(p) | the_flags); Chris@19: tim = timer_stop(USER_TIMER); Chris@19: if (verbose > 1) printf("planner time: %g s\n", tim); Chris@19: Chris@19: BENCH_ASSERT(the_plan); Chris@19: Chris@19: { Chris@19: double add, mul, nfma, cost, pcost; Chris@19: FFTW(flops)(the_plan, &add, &mul, &nfma); Chris@19: cost = FFTW(estimate_cost)(the_plan); Chris@19: pcost = FFTW(cost)(the_plan); Chris@19: if (verbose > 1) { Chris@19: FFTW(print_plan)(the_plan); Chris@19: printf("\n"); Chris@19: printf("flops: %0.0f add, %0.0f mul, %0.0f fma\n", Chris@19: add, mul, nfma); Chris@19: printf("estimated cost: %f, pcost = %f\n", cost, pcost); Chris@19: } Chris@19: } Chris@19: } Chris@19: Chris@19: Chris@19: void doit(int iter, bench_problem *p) Chris@19: { Chris@19: int i; Chris@19: FFTW(plan) q = the_plan; Chris@19: Chris@19: UNUSED(p); Chris@19: for (i = 0; i < iter; ++i) Chris@19: FFTW(execute)(q); Chris@19: } Chris@19: Chris@19: void done(bench_problem *p) Chris@19: { Chris@19: UNUSED(p); Chris@19: Chris@19: FFTW(destroy_plan)(the_plan); Chris@19: uninstall_hook(); Chris@19: } Chris@19: Chris@19: void cleanup(void) Chris@19: { Chris@19: initial_cleanup(); Chris@19: Chris@19: wrwisdom(); Chris@19: #ifdef HAVE_SMP Chris@19: FFTW(cleanup_threads)(); Chris@19: #else Chris@19: FFTW(cleanup)(); Chris@19: #endif Chris@19: Chris@19: # ifdef FFTW_DEBUG_MALLOC Chris@19: { Chris@19: /* undocumented memory checker */ Chris@19: FFTW_EXTERN void FFTW(malloc_print_minfo)(int v); Chris@19: FFTW(malloc_print_minfo)(verbose); Chris@19: } Chris@19: # endif Chris@19: Chris@19: final_cleanup(); Chris@19: }