/*
 * Copyright (c) 2003, 2007-14 Matteo Frigo
 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 *
 */
 | |
| 
 | |
| 
 | |
/*
 * This header file must include every file or define every
 * type or macro which is required to compile a codelet.
 */
 | |
| 
 | |
| #ifndef __DFT_CODELET_H__
 | |
| #define __DFT_CODELET_H__
 | |
| 
 | |
| #include "kernel/ifftw.h"
 | |
| 
 | |
| /**************************************************************
 | |
|  * types of codelets
 | |
|  **************************************************************/
 | |
| 
 | |
| /* DFT codelets */
 | |
| typedef struct kdft_desc_s kdft_desc;
 | |
| 
 | |
| typedef struct {
 | |
|      int (*okp)(
 | |
| 	  const kdft_desc *desc,
 | |
| 	  const R *ri, const R *ii, const R *ro, const R *io,
 | |
| 	  INT is, INT os, INT vl, INT ivs, INT ovs,
 | |
| 	  const planner *plnr);
 | |
|      INT vl;
 | |
| } kdft_genus;
 | |
| 
 | |
| struct kdft_desc_s {
 | |
|      INT sz;    /* size of transform computed */
 | |
|      const char *nam;
 | |
|      opcnt ops;
 | |
|      const kdft_genus *genus;
 | |
|      INT is;
 | |
|      INT os;
 | |
|      INT ivs;
 | |
|      INT ovs;
 | |
| };
 | |
| 
 | |
| typedef void (*kdft) (const R *ri, const R *ii, R *ro, R *io,
 | |
|                       stride is, stride os, INT vl, INT ivs, INT ovs);
 | |
| void X(kdft_register)(planner *p, kdft codelet, const kdft_desc *desc);
 | |
| 
 | |
| 
 | |
| typedef struct ct_desc_s ct_desc;
 | |
| 
 | |
| typedef struct {
 | |
|      int (*okp)(
 | |
| 	  const struct ct_desc_s *desc,
 | |
| 	  const R *rio, const R *iio, 
 | |
| 	  INT rs, INT vs, INT m, INT mb, INT me, INT ms,
 | |
| 	  const planner *plnr);
 | |
|      INT vl;
 | |
| } ct_genus;
 | |
| 
 | |
| struct ct_desc_s {
 | |
|      INT radix;
 | |
|      const char *nam;
 | |
|      const tw_instr *tw;
 | |
|      const ct_genus *genus;
 | |
|      opcnt ops;
 | |
|      INT rs;
 | |
|      INT vs;
 | |
|      INT ms;
 | |
| };
 | |
| 
 | |
| typedef void (*kdftw) (R *rioarray, R *iioarray, const R *W,
 | |
| 		       stride ios, INT mb, INT me, INT ms);
 | |
| void X(kdft_dit_register)(planner *p, kdftw codelet, const ct_desc *desc);
 | |
| void X(kdft_dif_register)(planner *p, kdftw codelet, const ct_desc *desc);
 | |
| 
 | |
| 
 | |
| typedef void (*kdftwsq) (R *rioarray, R *iioarray,
 | |
| 			 const R *W, stride is, stride vs,
 | |
| 			 INT mb, INT me, INT ms);
 | |
| void X(kdft_difsq_register)(planner *p, kdftwsq codelet, const ct_desc *desc);
 | |
| 
 | |
| 
 | |
| extern const solvtab X(solvtab_dft_standard);
 | |
| extern const solvtab X(solvtab_dft_sse2);
 | |
| extern const solvtab X(solvtab_dft_avx);
 | |
| extern const solvtab X(solvtab_dft_avx_128_fma);
 | |
| extern const solvtab X(solvtab_dft_avx2);
 | |
| extern const solvtab X(solvtab_dft_avx2_128);
 | |
| extern const solvtab X(solvtab_dft_avx512);
 | |
| extern const solvtab X(solvtab_dft_kcvi);
 | |
| extern const solvtab X(solvtab_dft_altivec);
 | |
| extern const solvtab X(solvtab_dft_vsx);
 | |
| extern const solvtab X(solvtab_dft_neon);
 | |
| extern const solvtab X(solvtab_dft_generic_simd128);
 | |
| extern const solvtab X(solvtab_dft_generic_simd256);
 | |
| 
 | |
| #endif				/* __DFT_CODELET_H__ */
 | 
