Chris@10: /* Chris@10: * Copyright (c) 2003, 2007-11 Matteo Frigo Chris@10: * Copyright (c) 2003, 2007-11 Massachusetts Institute of Technology Chris@10: * Chris@10: * This program is free software; you can redistribute it and/or modify Chris@10: * it under the terms of the GNU General Public License as published by Chris@10: * the Free Software Foundation; either version 2 of the License, or Chris@10: * (at your option) any later version. Chris@10: * Chris@10: * This program is distributed in the hope that it will be useful, Chris@10: * but WITHOUT ANY WARRANTY; without even the implied warranty of Chris@10: * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the Chris@10: * GNU General Public License for more details. Chris@10: * Chris@10: * You should have received a copy of the GNU General Public License Chris@10: * along with this program; if not, write to the Free Software Chris@10: * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA Chris@10: * Chris@10: */ Chris@10: Chris@10: #include "ifftw-mpi.h" Chris@10: Chris@10: /* tproblem.c: */ Chris@10: typedef struct { Chris@10: problem super; Chris@10: INT vn; /* vector length (vector stride 1) */ Chris@10: INT nx, ny; /* nx x ny transposed to ny x nx */ Chris@10: R *I, *O; /* contiguous real arrays (both same size!) */ Chris@10: Chris@10: unsigned flags; /* TRANSPOSED_IN: input is *locally* transposed Chris@10: TRANSPOSED_OUT: output is *locally* transposed */ Chris@10: Chris@10: INT block, tblock; /* block size, slab decomposition; Chris@10: tblock is for transposed blocks on output */ Chris@10: Chris@10: MPI_Comm comm; Chris@10: } problem_mpi_transpose; Chris@10: Chris@10: problem *XM(mkproblem_transpose)(INT nx, INT ny, INT vn, Chris@10: R *I, R *O, Chris@10: INT block, INT tblock, Chris@10: MPI_Comm comm, Chris@10: unsigned flags); Chris@10: Chris@10: /* tsolve.c: */ Chris@10: void XM(transpose_solve)(const plan *ego_, const problem *p_); Chris@10: Chris@10: /* plans have same operands as rdft plans, so just re-use */ Chris@10: typedef plan_rdft plan_mpi_transpose; Chris@10: #define MKPLAN_MPI_TRANSPOSE(type, adt, apply) \ Chris@10: (type *)X(mkplan_rdft)(sizeof(type), adt, apply) Chris@10: Chris@10: /* transpose-pairwise.c: */ Chris@10: int XM(mkplans_posttranspose)(const problem_mpi_transpose *p, planner *plnr, Chris@10: R *I, R *O, int my_pe, Chris@10: plan **cld2, plan **cld2rest, plan **cld3, Chris@10: INT *rest_Ioff, INT *rest_Ooff); Chris@10: /* various solvers */ Chris@10: void XM(transpose_pairwise_register)(planner *p); Chris@10: void XM(transpose_alltoall_register)(planner *p); Chris@10: void XM(transpose_recurse_register)(planner *p);