/*
 * Copyright (c) 2003, 2007-14 Matteo Frigo
 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 *
 */

/* detection of alignment.  This is complicated because a machine may
   support multiple SIMD extensions (e.g. SSE2 and AVX) but only one
   set of alignment constraints.  So this alignment stuff cannot be
   defined in the SIMD header files.  Rather than defining a separate
   set of "machine" header files, we just do this ugly ifdef here.

   Every feature macro below is tested with defined(), so a feature
   macro that is defined with an empty value is still recognized. */
#if defined(HAVE_AVX512)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 64   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 64   /* Alignment for the LDA/STA macros */
#  endif
#elif defined(HAVE_SSE2) || defined(HAVE_AVX) || defined(HAVE_AVX2) || defined(HAVE_AVX_128_FMA)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  endif
#elif defined(HAVE_ALTIVEC)
#  define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#  define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#elif defined(HAVE_NEON) || defined(HAVE_VSX)
#  define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#  define ALIGNMENTA 8    /* Alignment for the LDA/STA macros */
#elif defined(HAVE_KCVI)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#  endif
#  define ALIGNMENTA 64   /* Alignment for the LDA/STA macros */
#elif defined(HAVE_GENERIC_SIMD256)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 32   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 32   /* Alignment for the LDA/STA macros */
#  endif
#elif defined(HAVE_GENERIC_SIMD128)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  endif
#endif

/* sanity check: whenever HAVE_SIMD is nonzero, one of the branches
   above must have supplied both alignment constants.  HAVE_SIMD is
   tested by value (not with defined()) on purpose, so that a
   definition of 0 disables the check. */
#if HAVE_SIMD
#  ifndef ALIGNMENT
#    error "ALIGNMENT not defined"
#  endif
#  ifndef ALIGNMENTA
#    error "ALIGNMENTA not defined"
#  endif
#endif

/* rename for precision and for SIMD extensions.  X, CONCAT,
   STRINGIZE and SIMD_SUFFIX are expected to be defined elsewhere. */
#define XSIMD0(name, suffix) CONCAT(name, suffix)
#define XSIMD(name) XSIMD0(X(name), SIMD_SUFFIX)
#define XSIMD_STRING(x) x STRINGIZE(SIMD_SUFFIX)

/* TAINT_BIT is set if pointers are not guaranteed to be multiples of
   ALIGNMENT */
#define TAINT_BIT 1

/* TAINT_BITA is set if pointers are not guaranteed to be multiples of
   ALIGNMENTA */
#define TAINT_BITA 2

/* the pointer P converted to an unsigned integer (uintptr_t) */
#define PTRINT(p) ((uintptr_t)(p))

/* nonzero iff UNTAINT(p) is a multiple of ALIGNMENT and TAINT_BIT is
   clear in P.  UNTAINT is expected to be defined elsewhere.  Note
   that P is evaluated twice. */
#define ALIGNED(p) \
     (((PTRINT(UNTAINT(p)) % ALIGNMENT) == 0) && !(PTRINT(p) & TAINT_BIT))

/* same as ALIGNED, but with respect to ALIGNMENTA and TAINT_BITA */
#define ALIGNEDA(p) \
     (((PTRINT(UNTAINT(p)) % ALIGNMENTA) == 0) && !(PTRINT(p) & TAINT_BITA))

/* nonzero iff X elements of type R occupy a whole multiple of
   ALIGNMENT (resp. ALIGNMENTA) bytes.  R is expected to be defined
   elsewhere. */
#define SIMD_STRIDE_OK(x) (!(((x) * sizeof(R)) % ALIGNMENT))
#define SIMD_STRIDE_OKA(x) (!(((x) * sizeof(R)) % ALIGNMENTA))
#define SIMD_VSTRIDE_OK SIMD_STRIDE_OK