cannam@95
|
1 /*
|
cannam@95
|
2 * Copyright (c) 2003, 2007-11 Matteo Frigo
|
cannam@95
|
3 * Copyright (c) 2003, 2007-11 Massachusetts Institute of Technology
|
cannam@95
|
4 *
|
cannam@95
|
5 * This program is free software; you can redistribute it and/or modify
|
cannam@95
|
6 * it under the terms of the GNU General Public License as published by
|
cannam@95
|
7 * the Free Software Foundation; either version 2 of the License, or
|
cannam@95
|
8 * (at your option) any later version.
|
cannam@95
|
9 *
|
cannam@95
|
10 * This program is distributed in the hope that it will be useful,
|
cannam@95
|
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
|
cannam@95
|
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
cannam@95
|
13 * GNU General Public License for more details.
|
cannam@95
|
14 *
|
cannam@95
|
15 * You should have received a copy of the GNU General Public License
|
cannam@95
|
16 * along with this program; if not, write to the Free Software
|
cannam@95
|
17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
cannam@95
|
18 *
|
cannam@95
|
19 */
|
cannam@95
|
20
|
cannam@95
|
21 #include "ifftw-mpi.h"
|
cannam@95
|
22
|
cannam@95
|
23 /* common functions for rearrangements of the data for the *-rank1-bigvec
|
cannam@95
|
24 solvers */
|
cannam@95
|
25
|
cannam@95
|
26 static int div_mult(INT b, INT a) {
|
cannam@95
|
27 return (a > b && a % b == 0);
|
cannam@95
|
28 }
|
cannam@95
|
29 static int div_mult2(INT b, INT a, INT n) {
|
cannam@95
|
30 return (div_mult(b, a) && div_mult(n, b));
|
cannam@95
|
31 }
|
cannam@95
|
32
|
cannam@95
|
33 int XM(rearrange_applicable)(rearrangement rearrange,
|
cannam@95
|
34 ddim dim0, INT vn, int n_pes)
|
cannam@95
|
35 {
|
cannam@95
|
36 /* note: it is important that cases other than CONTIG be
|
cannam@95
|
37 applicable only when the resulting transpose dimension
|
cannam@95
|
38 is divisible by n_pes; otherwise, the allocation size
|
cannam@95
|
39 returned by the API will be incorrect */
|
cannam@95
|
40 return ((rearrange != DISCONTIG || div_mult(n_pes, vn))
|
cannam@95
|
41 && (rearrange != SQUARE_BEFORE
|
cannam@95
|
42 || div_mult2(dim0.b[IB], vn, n_pes))
|
cannam@95
|
43 && (rearrange != SQUARE_AFTER
|
cannam@95
|
44 || (dim0.b[IB] != dim0.b[OB]
|
cannam@95
|
45 && div_mult2(dim0.b[OB], vn, n_pes)))
|
cannam@95
|
46 && (rearrange != SQUARE_MIDDLE
|
cannam@95
|
47 || div_mult(dim0.n * n_pes, vn)));
|
cannam@95
|
48 }
|
cannam@95
|
49
|
cannam@95
|
50 INT XM(rearrange_ny)(rearrangement rearrange, ddim dim0, INT vn, int n_pes)
|
cannam@95
|
51 {
|
cannam@95
|
52 switch (rearrange) {
|
cannam@95
|
53 case CONTIG:
|
cannam@95
|
54 return vn;
|
cannam@95
|
55 case DISCONTIG:
|
cannam@95
|
56 return n_pes;
|
cannam@95
|
57 case SQUARE_BEFORE:
|
cannam@95
|
58 return dim0.b[IB];
|
cannam@95
|
59 case SQUARE_AFTER:
|
cannam@95
|
60 return dim0.b[OB];
|
cannam@95
|
61 case SQUARE_MIDDLE:
|
cannam@95
|
62 return dim0.n * n_pes;
|
cannam@95
|
63 }
|
cannam@95
|
64 return 0;
|
cannam@95
|
65 }
|