90 lines
		
	
	
		
			2.1 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
		
		
			
		
	
	
			90 lines
		
	
	
		
			2.1 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/*
 * Copyright (c) 2003, 2007-14 Matteo Frigo
 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 *
 */
|  | 
 | ||
|  | 
 | ||
|  | #include "kernel/ifftw.h"
 | ||
|  | 
 | ||
/*
 * DS(d,s): pick one of two alternatives at preprocessing time.
 * Expands to `d` in the default (double-precision) build and to `s`
 * when FFTW_SINGLE is defined.
 *
 * The expansion is intentionally NOT parenthesized: in this file the
 * arguments are instruction mnemonics, string literals and bit numbers,
 * so the selected token sequence must be pasted in verbatim.
 */
#ifndef FFTW_SINGLE
#  define DS(d,s) d /* double-precision option */
#else
#  define DS(d,s) s /* single-precision option */
#endif
|  | 
 | ||
|  | #if HAVE_SSE2
 | ||
|  | 
 | ||
|  | # if defined(__x86_64__) || defined(_M_X64) || defined(_M_AMD64)
 | ||
|  | 
 | ||
|  |   int X(have_simd_sse2)(void) | ||
|  |   { | ||
|  |        return 1; | ||
|  |   } | ||
|  | 
 | ||
|  | # else /* !x86_64 */
 | ||
|  | 
 | ||
|  | # include <signal.h>
 | ||
|  | # include <setjmp.h>
 | ||
|  | # include "x86-cpuid.h"
 | ||
|  | 
 | ||
|  |   static jmp_buf jb; | ||
|  | 
 | ||
|  |   static void sighandler(int x) | ||
|  |   { | ||
|  |        UNUSED(x); | ||
|  |        longjmp(jb, 1); | ||
|  |   } | ||
|  | 
 | ||
|  |   static int sse2_works(void) | ||
|  |   { | ||
|  |        void (*oldsig)(int); | ||
|  |        oldsig = signal(SIGILL, sighandler); | ||
|  |        if (setjmp(jb)) { | ||
|  | 	    signal(SIGILL, oldsig); | ||
|  | 	    return 0; | ||
|  |        } else { | ||
|  | #         ifdef _MSC_VER
 | ||
|  | 	    _asm { DS(xorpd,xorps) xmm0,xmm0 } | ||
|  | #         else
 | ||
|  | 	    /* asm volatile ("xorpd/s %xmm0, %xmm0"); */ | ||
|  | 	    asm volatile(DS(".byte 0x66; .byte 0x0f; .byte 0x57; .byte 0xc0", | ||
|  | 			                ".byte 0x0f; .byte 0x57; .byte 0xc0")); | ||
|  | #         endif
 | ||
|  | 	    signal(SIGILL, oldsig); | ||
|  | 	    return 1; | ||
|  |        } | ||
|  |   } | ||
|  | 
 | ||
|  |   int X(have_simd_sse2)(void) | ||
|  |   { | ||
|  |        static int init = 0, res; | ||
|  | 
 | ||
|  |        if (!init) { | ||
|  | 	    res =   !is_386()  | ||
|  | 		 && has_cpuid() | ||
|  | 		 && (cpuid_edx(1) & (1 << DS(26,25))) | ||
|  | 		 && sse2_works(); | ||
|  | 	    init = 1; | ||
|  |        } | ||
|  |        return res; | ||
|  |   } | ||
|  | 
 | ||
|  | # endif
 | ||
|  | 
 | ||
|  | #endif
 |