Chris@10: /* Chris@10: * Copyright (c) 2003, 2007-11 Matteo Frigo Chris@10: * Copyright (c) 2003, 2007-11 Massachusetts Institute of Technology Chris@10: * Chris@10: * This program is free software; you can redistribute it and/or modify Chris@10: * it under the terms of the GNU General Public License as published by Chris@10: * the Free Software Foundation; either version 2 of the License, or Chris@10: * (at your option) any later version. Chris@10: * Chris@10: * This program is distributed in the hope that it will be useful, Chris@10: * but WITHOUT ANY WARRANTY; without even the implied warranty of Chris@10: * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the Chris@10: * GNU General Public License for more details. Chris@10: * Chris@10: * You should have received a copy of the GNU General Public License Chris@10: * along with this program; if not, write to the Free Software Chris@10: * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA Chris@10: * Chris@10: */ Chris@10: Chris@10: Chris@10: #include "verify.h" Chris@10: Chris@10: static void recur(int rnk, const bench_iodim *dims0, const bench_iodim *dims1, Chris@10: dotens2_closure *k, Chris@10: int indx0, int ondx0, int indx1, int ondx1) Chris@10: { Chris@10: if (rnk == 0) Chris@10: k->apply(k, indx0, ondx0, indx1, ondx1); Chris@10: else { Chris@10: int i, n = dims0[0].n; Chris@10: int is0 = dims0[0].is; Chris@10: int os0 = dims0[0].os; Chris@10: int is1 = dims1[0].is; Chris@10: int os1 = dims1[0].os; Chris@10: Chris@10: BENCH_ASSERT(n == dims1[0].n); Chris@10: Chris@10: for (i = 0; i < n; ++i) { Chris@10: recur(rnk - 1, dims0 + 1, dims1 + 1, k, Chris@10: indx0, ondx0, indx1, ondx1); Chris@10: indx0 += is0; ondx0 += os0; Chris@10: indx1 += is1; ondx1 += os1; Chris@10: } Chris@10: } Chris@10: } Chris@10: Chris@10: void bench_dotens2(const bench_tensor *sz0, const bench_tensor *sz1, dotens2_closure *k) Chris@10: { Chris@10: BENCH_ASSERT(sz0->rnk == sz1->rnk); Chris@10: if (sz0->rnk == RNK_MINFTY) Chris@10: return; Chris@10: recur(sz0->rnk, sz0->dims, sz1->dims, k, 0, 0, 0, 0); Chris@10: }