annotate src/fftw-3.3.8/mpi/mpi-transpose.h @ 167:bd3cc4d1df30

Add FFTW 3.3.8 source, and a Linux build
author Chris Cannam <cannam@all-day-breakfast.com>
date Tue, 19 Nov 2019 14:52:55 +0000
parents
children
rev   line source
cannam@167 1 /*
cannam@167 2 * Copyright (c) 2003, 2007-14 Matteo Frigo
cannam@167 3 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
cannam@167 4 *
cannam@167 5 * This program is free software; you can redistribute it and/or modify
cannam@167 6 * it under the terms of the GNU General Public License as published by
cannam@167 7 * the Free Software Foundation; either version 2 of the License, or
cannam@167 8 * (at your option) any later version.
cannam@167 9 *
cannam@167 10 * This program is distributed in the hope that it will be useful,
cannam@167 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
cannam@167 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
cannam@167 13 * GNU General Public License for more details.
cannam@167 14 *
cannam@167 15 * You should have received a copy of the GNU General Public License
cannam@167 16 * along with this program; if not, write to the Free Software
cannam@167 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
cannam@167 18 *
cannam@167 19 */
cannam@167 20
cannam@167 21 #include "ifftw-mpi.h"
cannam@167 22
cannam@167 23 /* tproblem.c: */
cannam@167 24 typedef struct { /* describes one MPI transpose problem: an nx x ny array of length-vn vectors, plus its buffers, flags, block sizes and communicator */
cannam@167 25 problem super; /* embedded base problem as first member (presumably so a problem * can refer to this struct -- confirm) */
cannam@167 26 INT vn; /* vector length (vector stride 1) */
cannam@167 27 INT nx, ny; /* nx x ny transposed to ny x nx */
cannam@167 28 R *I, *O; /* contiguous real arrays (both same size!); presumably I is the input and O the output -- confirm */
cannam@167 29
cannam@167 30 unsigned flags; /* TRANSPOSED_IN: input is *locally* transposed
cannam@167 31 TRANSPOSED_OUT: output is *locally* transposed */
cannam@167 32
cannam@167 33 INT block, tblock; /* block size, slab decomposition;
cannam@167 34 tblock is for transposed blocks on output */
cannam@167 35
cannam@167 36 MPI_Comm comm; /* MPI communicator associated with this problem (presumably the processes sharing the transpose -- confirm) */
cannam@167 37 } problem_mpi_transpose;
cannam@167 38
cannam@167 39 problem *XM(mkproblem_transpose)(INT nx, INT ny, INT vn, /* returns a problem *; presumably builds a problem_mpi_transpose from these arguments (definition not shown here) -- nx, ny, vn: dimensions and vector length, named as in the struct */
cannam@167 40 R *I, R *O, /* real arrays, named as the struct's I and O members */
cannam@167 41 INT block, INT tblock, /* block sizes, named as the struct's block and tblock members */
cannam@167 42 MPI_Comm comm, /* MPI communicator, named as the struct's comm member */
cannam@167 43 unsigned flags); /* named as the struct's flags member (TRANSPOSED_IN / TRANSPOSED_OUT) */
cannam@167 44
cannam@167 45 /* tsolve.c: solve entry point; takes the plan and the problem as read-only base-type pointers (presumably a plan_mpi_transpose and a problem_mpi_transpose underneath -- confirm) */
cannam@167 46 void XM(transpose_solve)(const plan *ego_, const problem *p_);
cannam@167 47
cannam@167 48 /* plans have same operands as rdft plans, so just re-use plan_rdft; MKPLAN_MPI_TRANSPOSE calls X(mkplan_rdft) with sizeof(type) and casts the result to type *, and the expansion is wrapped in parentheses so the cast stays attached to the call when the macro is followed by a postfix operator such as -> */
cannam@167 49 typedef plan_rdft plan_mpi_transpose;
cannam@167 50 #define MKPLAN_MPI_TRANSPOSE(type, adt, apply) \
cannam@167 51 ((type *)X(mkplan_rdft)(sizeof(type), adt, apply))
cannam@167 52
cannam@167 53 /* transpose-pairwise.c: helper exported through this header; its implementation and the meaning of its int return value are not visible here */
cannam@167 54 int XM(mkplans_posttranspose)(const problem_mpi_transpose *p, planner *plnr, /* p: transpose problem (read-only); plnr: planner */
cannam@167 55 R *I, R *O, int my_pe, /* I, O: real arrays; my_pe: presumably this process's rank -- confirm */
cannam@167 56 plan **cld2, plan **cld2rest, plan **cld3, /* pointers to plan pointers; presumably filled in with created child plans -- confirm */
cannam@167 57 INT *rest_Ioff, INT *rest_Ooff); /* presumably receive input/output offsets used with cld2rest -- confirm */
cannam@167 58 /* various solvers: each function below takes the planner; going by the names, each presumably registers one transpose solver variant (pairwise, alltoall, recurse) with it -- confirm */
cannam@167 59 void XM(transpose_pairwise_register)(planner *p);
cannam@167 60 void XM(transpose_alltoall_register)(planner *p);
cannam@167 61 void XM(transpose_recurse_register)(planner *p);