99 lines
		
	
	
		
			3.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
		
		
			
		
	
	
			99 lines
		
	
	
		
			3.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/*
 * Copyright (c) 2003, 2007-14 Matteo Frigo
 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 *
 */
|  | 
 | ||
/* Detection of alignment.  This is complicated because a machine may
   support multiple SIMD extensions (e.g. SSE2 and AVX) but only one
   set of alignment constraints.  So this alignment stuff cannot be
   defined in the SIMD header files.  Rather than defining a separate
   set of "machine" header files, we just do this ugly ifdef here.

   Two macros are selected by the chain below:
     ALIGNMENT   alignment for the LD/ST macros
     ALIGNMENTA  alignment for the LDA/STA macros
   The first matching HAVE_* branch wins.  If none of the HAVE_* macros
   tested here is defined, neither ALIGNMENT nor ALIGNMENTA is defined
   by this chain. */
#if defined(HAVE_SSE2) || defined(HAVE_AVX) || defined(HAVE_AVX2) || defined(HAVE_AVX_128_FMA) || defined(HAVE_AVX512)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  endif
#elif defined(HAVE_ALTIVEC)
#  define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#  define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#elif defined(HAVE_NEON) || defined(HAVE_VSX)
#  define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#  define ALIGNMENTA 8    /* Alignment for the LDA/STA macros */
#elif defined(HAVE_KCVI)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#  endif
   /* ALIGNMENTA is the same for both precisions in this branch */
#  define ALIGNMENTA 64   /* Alignment for the LDA/STA macros */
#elif defined(HAVE_GENERIC_SIMD256)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 32   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 32   /* Alignment for the LDA/STA macros */
#  endif
#elif defined(HAVE_GENERIC_SIMD128)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  endif
#endif
|  | 
 | ||
/* Sanity check: when HAVE_SIMD evaluates to nonzero, both alignment
   macros must have been defined before this point; otherwise stop the
   build with an explicit message.  (An undefined HAVE_SIMD evaluates
   to 0 in #if, so the check is skipped in that case.) */
#if HAVE_SIMD
#  ifndef ALIGNMENT
#  error "ALIGNMENT not defined"
#  endif
#  ifndef ALIGNMENTA
#  error "ALIGNMENTA not defined"
#  endif
#endif
|  | 
 | ||
/* rename for precision and for SIMD extensions.

   XSIMD0(name, suffix)  forwards both arguments to CONCAT.
   XSIMD(name)           wraps name in X() and appends SIMD_SUFFIX
                         through XSIMD0.
   XSIMD_STRING(x)       places x next to the stringized SIMD_SUFFIX;
                         presumably x is a string literal so that the
                         two adjacent literals concatenate.

   CONCAT, STRINGIZE, X and SIMD_SUFFIX are not defined here and must
   be provided by whoever expands these macros. */
#define XSIMD0(name, suffix) CONCAT(name, suffix)
#define XSIMD(name) XSIMD0(X(name), SIMD_SUFFIX)
#define XSIMD_STRING(x) x STRINGIZE(SIMD_SUFFIX)
|  | 
 | ||
/* TAINT_BIT is set if pointers are not guaranteed to be multiples of
   ALIGNMENT.  It is the lowest bit (value 1) of the pointer's integer
   representation. */
#define TAINT_BIT 1
|  | 
 | ||
/* TAINT_BITA is set if pointers are not guaranteed to be multiples of
   ALIGNMENTA.  It is the second-lowest bit (value 2) of the pointer's
   integer representation. */
#define TAINT_BITA 2
|  | 
 | ||
/* PTRINT(p): convert the pointer p to its uintptr_t integer value so
   that it can be used in arithmetic and bit tests.  Requires uintptr_t
   to be in scope at the point of expansion. */
#define PTRINT(p) ((uintptr_t)(p))
|  | 
 | ||
/* ALIGNED(p): nonzero iff p, with its taint bits removed by UNTAINT,
   is a multiple of ALIGNMENT and p does not carry TAINT_BIT.
   Note that p is evaluated twice, so it must have no side effects.
   Relies on PTRINT, UNTAINT, ALIGNMENT and TAINT_BIT being defined
   at the point of expansion. */
#define ALIGNED(p) \
  (((PTRINT(UNTAINT(p)) % ALIGNMENT) == 0) && !(PTRINT(p) & TAINT_BIT))
|  | 
 | ||
/* ALIGNEDA(p): nonzero iff p, with its taint bits removed by UNTAINT,
   is a multiple of ALIGNMENTA and p does not carry TAINT_BITA.
   Note that p is evaluated twice, so it must have no side effects.
   Relies on PTRINT, UNTAINT, ALIGNMENTA and TAINT_BITA being defined
   at the point of expansion. */
#define ALIGNEDA(p) \
  (((PTRINT(UNTAINT(p)) % ALIGNMENTA) == 0) && !(PTRINT(p) & TAINT_BITA))
|  | 
 | ||
/* Stride checks.  x is a stride counted in elements of type R; it is
   converted to bytes with sizeof(R) before testing.
     SIMD_STRIDE_OK(x)   nonzero iff the byte stride is a multiple of
                         ALIGNMENT
     SIMD_STRIDE_OKA(x)  nonzero iff the byte stride is a multiple of
                         ALIGNMENTA
     SIMD_VSTRIDE_OK     alias for SIMD_STRIDE_OK
   R, ALIGNMENT and ALIGNMENTA must be defined at the point of
   expansion. */
#define SIMD_STRIDE_OK(x) (!(((x) * sizeof(R)) % ALIGNMENT))
#define SIMD_STRIDE_OKA(x) (!(((x) * sizeof(R)) % ALIGNMENTA))
#define SIMD_VSTRIDE_OK SIMD_STRIDE_OK
|  | 
 |