99 lines
		
	
	
		
			3.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			99 lines
		
	
	
		
			3.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/*
 | 
						|
 * Copyright (c) 2003, 2007-14 Matteo Frigo
 | 
						|
 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
 | 
						|
 *
 | 
						|
 * This program is free software; you can redistribute it and/or modify
 | 
						|
 * it under the terms of the GNU General Public License as published by
 | 
						|
 * the Free Software Foundation; either version 2 of the License, or
 | 
						|
 * (at your option) any later version.
 | 
						|
 *
 | 
						|
 * This program is distributed in the hope that it will be useful,
 | 
						|
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
						|
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
						|
 * GNU General Public License for more details.
 | 
						|
 *
 | 
						|
 * You should have received a copy of the GNU General Public License
 | 
						|
 * along with this program; if not, write to the Free Software
 | 
						|
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 | 
						|
 *
 | 
						|
 */
 | 
						|
 | 
						|
/* detection of alignment.  This is complicated because a machine may
 | 
						|
   support multiple SIMD extensions (e.g. SSE2 and AVX) but only one
 | 
						|
   set of alignment constraints.  So this alignment stuff cannot be
 | 
						|
   defined in the SIMD header files.  Rather than defining a separate
 | 
						|
   set of "machine" header files, we just do this ugly ifdef here. */
 | 
						|
/* Select ALIGNMENT (used by the LD/ST macros) and ALIGNMENTA (used by the
   LDA/STA macros) from the HAVE_* SIMD configuration macros.  The first
   matching branch wins; if no branch matches, neither macro is defined. */
#if defined(HAVE_SSE2) || defined(HAVE_AVX) || defined(HAVE_AVX2) \
    || defined(HAVE_AVX_128_FMA) || defined(HAVE_AVX512)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  endif
#elif defined(HAVE_ALTIVEC)
#  define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#  define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#elif defined(HAVE_NEON) || defined(HAVE_VSX)
#  define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#  define ALIGNMENTA 8    /* Alignment for the LDA/STA macros */
#elif defined(HAVE_KCVI)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#  endif
#  define ALIGNMENTA 64   /* Alignment for the LDA/STA macros */
#elif defined(HAVE_GENERIC_SIMD256)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 32   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 32   /* Alignment for the LDA/STA macros */
#  endif
#elif defined(HAVE_GENERIC_SIMD128)
#  if defined(FFTW_SINGLE)
#    define ALIGNMENT 8     /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  else
#    define ALIGNMENT 16    /* Alignment for the LD/ST macros */
#    define ALIGNMENTA 16   /* Alignment for the LDA/STA macros */
#  endif
#endif
 | 
						|
 | 
						|
/* Build-time sanity check: when HAVE_SIMD is nonzero, both alignment
   macros must already be defined; otherwise compilation stops with an
   explicit diagnostic. */
#if HAVE_SIMD
#  ifndef ALIGNMENT
#    error "ALIGNMENT not defined"
#  endif
#  ifndef ALIGNMENTA
#    error "ALIGNMENTA not defined"
#  endif
#endif
 | 
						|
 | 
						|
/* rename for precision and for SIMD extensions */
 | 
						|
/* Indirection layer: forwards both arguments to CONCAT (defined elsewhere)
   so that they are macro-expanded before CONCAT sees them. */
#define XSIMD0(base, sfx) CONCAT(base, sfx)
 | 
						|
/* Builds an identifier from X(sym) followed by SIMD_SUFFIX, joined through
   XSIMD0.  X and SIMD_SUFFIX are supplied elsewhere. */
#define XSIMD(sym) XSIMD0(X(sym), SIMD_SUFFIX)
 | 
						|
/* Expands to `prefix` immediately followed by STRINGIZE(SIMD_SUFFIX).  The
   argument is intentionally left unparenthesized; presumably it is a string
   literal meant to concatenate with the stringized suffix (verify against
   callers). */
#define XSIMD_STRING(prefix) prefix STRINGIZE(SIMD_SUFFIX)
 | 
						|
 | 
						|
/* TAINT_BIT is set if pointers are not guaranteed to be multiples of
 | 
						|
   ALIGNMENT */
 | 
						|
#define TAINT_BIT 0x1   /* mask tested against the integer value of a pointer */
 | 
						|
 | 
						|
/* TAINT_BITA is set if pointers are not guaranteed to be multiples of
 | 
						|
   ALIGNMENTA */
 | 
						|
#define TAINT_BITA 0x2  /* mask tested against the integer value of a pointer */
 | 
						|
 | 
						|
/* Converts a pointer to its uintptr_t integer representation so that it can
   be used in arithmetic and bit tests. */
#define PTRINT(ptr) ((uintptr_t) (ptr))
 | 
						|
 | 
						|
/* Nonzero iff UNTAINT(p) is a multiple of ALIGNMENT and the raw value of p
   does not have TAINT_BIT set.  UNTAINT is defined elsewhere.  Note that p
   is evaluated twice, so it must not have side effects. */
#define ALIGNED(p) \
  (((PTRINT(UNTAINT(p)) % ALIGNMENT) == 0) && !(PTRINT(p) & TAINT_BIT))
 | 
						|
 | 
						|
/* Nonzero iff UNTAINT(p) is a multiple of ALIGNMENTA and the raw value of p
   does not have TAINT_BITA set.  UNTAINT is defined elsewhere.  Note that p
   is evaluated twice, so it must not have side effects. */
#define ALIGNEDA(p) \
  (((PTRINT(UNTAINT(p)) % ALIGNMENTA) == 0) && !(PTRINT(p) & TAINT_BITA))
 | 
						|
 | 
						|
/* Nonzero iff a stride of `n` elements of type R spans a whole multiple of
   ALIGNMENT bytes. */
#define SIMD_STRIDE_OK(n) ((((n) * sizeof(R)) % ALIGNMENT) == 0)
 | 
						|
/* Nonzero iff a stride of `n` elements of type R spans a whole multiple of
   ALIGNMENTA bytes. */
#define SIMD_STRIDE_OKA(n) ((((n) * sizeof(R)) % ALIGNMENTA) == 0)
 | 
						|
/* Object-like alias: SIMD_VSTRIDE_OK(x) expands to SIMD_STRIDE_OK(x). */
#define SIMD_VSTRIDE_OK SIMD_STRIDE_OK
 | 
						|
 |