90 lines
		
	
	
		
			2.1 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			90 lines
		
	
	
		
			2.1 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * Copyright (c) 2003, 2007-14 Matteo Frigo
 | |
|  * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
 | |
|  *
 | |
|  * This program is free software; you can redistribute it and/or modify
 | |
|  * it under the terms of the GNU General Public License as published by
 | |
|  * the Free Software Foundation; either version 2 of the License, or
 | |
|  * (at your option) any later version.
 | |
|  *
 | |
|  * This program is distributed in the hope that it will be useful,
 | |
|  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
|  * GNU General Public License for more details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU General Public License
 | |
|  * along with this program; if not, write to the Free Software
 | |
|  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 | |
|  *
 | |
|  */
 | |
| 
 | |
| 
 | |
| #include "kernel/ifftw.h"
 | |
| 
 | |
/*
 * DS(d, s): precision selector.  Expands to its first argument in a
 * double-precision build and to its second argument when FFTW_SINGLE
 * is defined.
 *
 * The arguments are deliberately NOT parenthesised: callers pass
 * instruction mnemonics and string literals that are spliced into
 * inline assembly, where extra parentheses would be a syntax error.
 */
#ifndef FFTW_SINGLE
#  define DS(d,s) d /* double-precision option */
#else
#  define DS(d,s) s /* single-precision option */
#endif
 | |
| 
 | |
| #if HAVE_SSE2
 | |
| 
 | |
| # if defined(__x86_64__) || defined(_M_X64) || defined(_M_AMD64)
 | |
| 
 | |
|   int X(have_simd_sse2)(void)
 | |
|   {
 | |
|        return 1;
 | |
|   }
 | |
| 
 | |
| # else /* !x86_64 */
 | |
| 
 | |
| # include <signal.h>
 | |
| # include <setjmp.h>
 | |
| # include "x86-cpuid.h"
 | |
| 
 | |
/* Jump target armed by sse2_works() before it runs the probe instruction. */
static jmp_buf jb;

/*
 * SIGILL handler installed while probing for SSE/SSE2 support.
 * It does not return normally: control is transferred back to the
 * setjmp(jb) call site, which then observes a non-zero return value.
 *
 * signo: signal number delivered by the runtime (ignored).
 */
static void sighandler(int signo)
{
     UNUSED(signo);
     longjmp(jb, 1);
}
 | |
| 
 | |
|   static int sse2_works(void)
 | |
|   {
 | |
|        void (*oldsig)(int);
 | |
|        oldsig = signal(SIGILL, sighandler);
 | |
|        if (setjmp(jb)) {
 | |
| 	    signal(SIGILL, oldsig);
 | |
| 	    return 0;
 | |
|        } else {
 | |
| #         ifdef _MSC_VER
 | |
| 	    _asm { DS(xorpd,xorps) xmm0,xmm0 }
 | |
| #         else
 | |
| 	    /* asm volatile ("xorpd/s %xmm0, %xmm0"); */
 | |
| 	    asm volatile(DS(".byte 0x66; .byte 0x0f; .byte 0x57; .byte 0xc0",
 | |
| 			                ".byte 0x0f; .byte 0x57; .byte 0xc0"));
 | |
| #         endif
 | |
| 	    signal(SIGILL, oldsig);
 | |
| 	    return 1;
 | |
|        }
 | |
|   }
 | |
| 
 | |
|   int X(have_simd_sse2)(void)
 | |
|   {
 | |
|        static int init = 0, res;
 | |
| 
 | |
|        if (!init) {
 | |
| 	    res =   !is_386() 
 | |
| 		 && has_cpuid()
 | |
| 		 && (cpuid_edx(1) & (1 << DS(26,25)))
 | |
| 		 && sse2_works();
 | |
| 	    init = 1;
 | |
|        }
 | |
|        return res;
 | |
|   }
 | |
| 
 | |
| # endif
 | |
| 
 | |
| #endif
 | 
