99 lines
		
	
	
		
			3.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			99 lines
		
	
	
		
			3.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * Copyright (c) 2003, 2007-14 Matteo Frigo
 | |
|  * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
 | |
|  *
 | |
|  * This program is free software; you can redistribute it and/or modify
 | |
|  * it under the terms of the GNU General Public License as published by
 | |
|  * the Free Software Foundation; either version 2 of the License, or
 | |
|  * (at your option) any later version.
 | |
|  *
 | |
|  * This program is distributed in the hope that it will be useful,
 | |
|  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
|  * GNU General Public License for more details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU General Public License
 | |
|  * along with this program; if not, write to the Free Software
 | |
|  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 | |
|  *
 | |
|  */
 | |
| 
 | |
| /* detection of alignment.  This is complicated because a machine may
 | |
|    support multiple SIMD extensions (e.g. SSE2 and AVX) but only one
 | |
|    set of alignment constraints.  So this alignment stuff cannot be
 | |
|    defined in the SIMD header files.  Rather than defining a separate
 | |
|    set of "machine" header files, we just do this ugly ifdef here. */
 | |
/* Select ALIGNMENT (used by the LD/ST macros) and ALIGNMENTA (used by
   the LDA/STA macros) according to the SIMD extension that was
   configured.  Branches are tried in order and the first match wins.
   If none of the HAVE_* macros tested below is defined, neither symbol
   is defined by this chain. */
#if defined(HAVE_SSE2) || defined(HAVE_AVX) || defined(HAVE_AVX2) \
    || defined(HAVE_AVX_128_FMA) || defined(HAVE_AVX512)
   /* SSE2 / AVX variants: only the LD/ST value depends on precision */
#  ifdef FFTW_SINGLE
#    define ALIGNMENT 8
#  else
#    define ALIGNMENT 16
#  endif
#  define ALIGNMENTA 16
#elif defined(HAVE_ALTIVEC)
#  define ALIGNMENT 8
#  define ALIGNMENTA 16
#elif defined(HAVE_NEON) || defined(HAVE_VSX)
#  define ALIGNMENT 8
#  define ALIGNMENTA 8
#elif defined(HAVE_KCVI)
#  ifdef FFTW_SINGLE
#    define ALIGNMENT 8
#  else
#    define ALIGNMENT 16
#  endif
#  define ALIGNMENTA 64
#elif defined(HAVE_GENERIC_SIMD256)
#  ifdef FFTW_SINGLE
#    define ALIGNMENT 8
#  else
#    define ALIGNMENT 16
#  endif
#  define ALIGNMENTA 32
#elif defined(HAVE_GENERIC_SIMD128)
#  ifdef FFTW_SINGLE
#    define ALIGNMENT 8
#  else
#    define ALIGNMENT 16
#  endif
#  define ALIGNMENTA 16
#endif
 | |
| 
 | |
/* When HAVE_SIMD evaluates to nonzero, both alignment macros are
   mandatory: stop the build with a clear message if either one was
   left undefined. */
#if HAVE_SIMD
#  if !defined(ALIGNMENT)
#    error "ALIGNMENT not defined"
#  endif
#  if !defined(ALIGNMENTA)
#    error "ALIGNMENTA not defined"
#  endif
#endif
 | |
| 
 | |
/* Name decoration for precision and for the SIMD extension in use. */

/* Helper: forwards both (already expanded) arguments to CONCAT. */
#define XSIMD0(base, ext) CONCAT(base, ext)

/* X(name) with SIMD_SUFFIX appended. */
#define XSIMD(ident) XSIMD0(X(ident), SIMD_SUFFIX)

/* Places the stringized SIMD_SUFFIX right after x; when x is a string
   literal the two adjacent literals form a single string. */
#define XSIMD_STRING(str) str STRINGIZE(SIMD_SUFFIX)
 | |
| 
 | |
/* Taint flags.  ALIGNED and ALIGNEDA test these bits against the
   integer value of a pointer. */

/* Set when the pointer is not guaranteed to be a multiple of
   ALIGNMENT. */
#define TAINT_BIT 1

/* Set when the pointer is not guaranteed to be a multiple of
   ALIGNMENTA. */
#define TAINT_BITA 2
 | |
| 
 | |
/* Integer value of a pointer, as a uintptr_t. */
#define PTRINT(ptr) ((uintptr_t)(ptr))

/* Nonzero iff the untainted pointer is a multiple of ALIGNMENT and the
   pointer does not carry TAINT_BIT.  The argument is expanded twice. */
#define ALIGNED(ptr) \
  ((PTRINT(UNTAINT(ptr)) % ALIGNMENT) == 0 && (PTRINT(ptr) & TAINT_BIT) == 0)

/* Same test against ALIGNMENTA and TAINT_BITA. */
#define ALIGNEDA(ptr) \
  ((PTRINT(UNTAINT(ptr)) % ALIGNMENTA) == 0 && (PTRINT(ptr) & TAINT_BITA) == 0)
 | |
| 
 | |
/* Stride checks: a stride counted in elements of type R is acceptable
   when its size in bytes is a multiple of the relevant alignment. */
#define SIMD_STRIDE_OK(stride) ((((stride) * sizeof(R)) % ALIGNMENT) == 0)
#define SIMD_STRIDE_OKA(stride) ((((stride) * sizeof(R)) % ALIGNMENTA) == 0)

/* Vector strides use the same rule as SIMD_STRIDE_OK. */
#define SIMD_VSTRIDE_OK SIMD_STRIDE_OK
 | |
| 
 | 
