/*
 * Copyright (c) 2003, 2007-14 Matteo Frigo
 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 *
 */

/* detection of alignment.  This is complicated because a machine may
   support multiple SIMD extensions (e.g. SSE2 and AVX) but only one
   set of alignment constraints.  So this alignment stuff cannot be
   defined in the SIMD header files.  Rather than defining a separate
   set of "machine" header files, we just do this ugly ifdef here.

   The first matching branch wins, so the order of the tests below
   matters.  Every HAVE_<extension> flag is tested with defined() so
   that the flags behave the same whatever value they expand to.
*/
#if defined(HAVE_AVX512)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 64   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 64   /* Alignment for the LDA/STA macros */
#  endif
#elif defined(HAVE_SSE2) || defined(HAVE_AVX) || defined(HAVE_AVX2) || defined(HAVE_AVX_128_FMA)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  endif
#elif defined(HAVE_ALTIVEC)
#  define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#  define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#elif defined(HAVE_NEON) || defined(HAVE_VSX)
#  define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#  define ALIGNMENTA 8    /* Alignment for the LDA/STA macros */
#elif defined(HAVE_KCVI)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#  endif
#  define ALIGNMENTA 64   /* Alignment for the LDA/STA macros */
#elif defined(HAVE_GENERIC_SIMD256)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 32   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 32   /* Alignment for the LDA/STA macros */
#  endif
#elif defined(HAVE_GENERIC_SIMD128)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  endif
#endif

/* If SIMD is enabled, one of the branches above must have supplied
   both alignment constants; fail the build early otherwise. */
#if HAVE_SIMD
#  ifndef ALIGNMENT
#    error "ALIGNMENT not defined"
#  endif
#  ifndef ALIGNMENTA
#    error "ALIGNMENTA not defined"
#  endif
#endif

/* rename for precision and for SIMD extensions.
   CONCAT, X, STRINGIZE and SIMD_SUFFIX are not defined here; they must
   be visible wherever these macros are expanded. */
#define XSIMD0(name, suffix) CONCAT(name, suffix)
#define XSIMD(name) XSIMD0(X(name), SIMD_SUFFIX)
#define XSIMD_STRING(x) x STRINGIZE(SIMD_SUFFIX)

/* TAINT_BIT is set if pointers are not guaranteed to be multiples of
   ALIGNMENT */
#define TAINT_BIT 1

/* TAINT_BITA is set if pointers are not guaranteed to be multiples of
   ALIGNMENTA */
#define TAINT_BITA 2

/* Integer value of pointer P (requires uintptr_t to be declared). */
#define PTRINT(p) ((uintptr_t)(p))

/* Nonzero iff P, after UNTAINT (defined elsewhere), is a multiple of
   ALIGNMENT and P does not carry TAINT_BIT.  P is evaluated twice. */
#define ALIGNED(p) \
     (((PTRINT(UNTAINT(p)) % ALIGNMENT) == 0) && !(PTRINT(p) & TAINT_BIT))

/* Same as ALIGNED, but checks against ALIGNMENTA and TAINT_BITA. */
#define ALIGNEDA(p) \
     (((PTRINT(UNTAINT(p)) % ALIGNMENTA) == 0) && !(PTRINT(p) & TAINT_BITA))

/* Nonzero iff a stride of X elements of type R (declared elsewhere) is
   a whole multiple of ALIGNMENT / ALIGNMENTA bytes, respectively. */
#define SIMD_STRIDE_OK(x) (!(((x) * sizeof(R)) % ALIGNMENT))
#define SIMD_STRIDE_OKA(x) (!(((x) * sizeof(R)) % ALIGNMENTA))
#define SIMD_VSTRIDE_OK SIMD_STRIDE_OK