/*
 * Copyright (c) 2003, 2007-14 Matteo Frigo
 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 *
 */

/* detection of alignment.  This is complicated because a machine may
   support multiple SIMD extensions (e.g. SSE2 and AVX) but only one
   set of alignment constraints.  So this alignment stuff cannot be
   defined in the SIMD header files.  Rather than defining a separate
   set of "machine" header files, we just do this ugly ifdef here.

   Two values are selected per configuration:
     ALIGNMENT   byte alignment for the LD/ST macros
     ALIGNMENTA  byte alignment for the LDA/STA macros
   The first matching branch wins, so the order of the tests matters.
   Every HAVE_* flag in the chain is tested with defined(), so a flag
   that is defined with an empty value (e.g. a bare `#define HAVE_X`)
   is handled the same way as one defined to 1. */
#if defined(HAVE_AVX512)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 64   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 64   /* Alignment for the LDA/STA macros */
#  endif
#elif defined(HAVE_SSE2) || defined(HAVE_AVX) || defined(HAVE_AVX2) || defined(HAVE_AVX_128_FMA)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  endif
#elif defined(HAVE_ALTIVEC)
#  define ALIGNMENT 8       /* Alignment for the LD/ST macros */
#  define ALIGNMENTA 16     /* Alignment for the LDA/STA macros */
#elif defined(HAVE_NEON) || defined(HAVE_VSX)
#  define ALIGNMENT 8       /* Alignment for the LD/ST macros */
#  define ALIGNMENTA 8      /* Alignment for the LDA/STA macros */
#elif defined(HAVE_KCVI)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#  endif
#  define ALIGNMENTA 64     /* Alignment for the LDA/STA macros */
#elif defined(HAVE_GENERIC_SIMD256)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8
#    define ALIGNMENTA 32
#  else
#    define ALIGNMENT 16
#    define ALIGNMENTA 32
#  endif
#elif defined(HAVE_GENERIC_SIMD128)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8
#    define ALIGNMENTA 16
#  else
#    define ALIGNMENT 16
#    define ALIGNMENTA 16
#  endif
#endif

/* If SIMD support is enabled, one of the branches above must have
   matched; otherwise fail the build right here instead of at the
   first use of ALIGNMENT/ALIGNMENTA.  HAVE_SIMD is tested by value
   (not with defined()), so it is expected to expand to an integer. */
#if HAVE_SIMD
#  ifndef ALIGNMENT
#    error "ALIGNMENT not defined"
#  endif
#  ifndef ALIGNMENTA
#    error "ALIGNMENTA not defined"
#  endif
#endif

/* rename for precision and for SIMD extensions.
   X, CONCAT, STRINGIZE and SIMD_SUFFIX are not defined in this file
   and must be provided by the including code. */
#define XSIMD0(name, suffix) CONCAT(name, suffix)
#define XSIMD(name) XSIMD0(X(name), SIMD_SUFFIX)
/* presumably x is a string literal, so that the stringized suffix is
   appended to it by literal concatenation -- verify against callers */
#define XSIMD_STRING(x) x STRINGIZE(SIMD_SUFFIX)

/* TAINT_BIT is set if pointers are not guaranteed to be multiples of
   ALIGNMENT */
#define TAINT_BIT 1

/* TAINT_BITA is set if pointers are not guaranteed to be multiples of
   ALIGNMENTA */
#define TAINT_BITA 2

/* integer view of a pointer, used for the modulo and bit tests below */
#define PTRINT(p) ((uintptr_t)(p))

/* A pointer counts as aligned only if its untainted address is a
   multiple of the alignment AND the matching taint bit is clear.
   UNTAINT is not defined in this file.  Both macros evaluate p more
   than once, so the argument must be free of side effects. */
#define ALIGNED(p) \
     (((PTRINT(UNTAINT(p)) % ALIGNMENT) == 0) && !(PTRINT(p) & TAINT_BIT))

#define ALIGNEDA(p) \
     (((PTRINT(UNTAINT(p)) % ALIGNMENTA) == 0) && !(PTRINT(p) & TAINT_BITA))

/* A stride of x elements of type R (declared elsewhere) is acceptable
   when its size in bytes is a multiple of the alignment. */
#define SIMD_STRIDE_OK(x) (!(((x) * sizeof(R)) % ALIGNMENT))
#define SIMD_STRIDE_OKA(x) (!(((x) * sizeof(R)) % ALIGNMENTA))
#define SIMD_VSTRIDE_OK SIMD_STRIDE_OK