/* * Copyright (c) 2003, 2007-14 Matteo Frigo * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA * */ /* * This header file must include every file or define every * type or macro which is required to compile a codelet. */ #ifndef __DFT_CODELET_H__ #define __DFT_CODELET_H__ #include "kernel/ifftw.h" /************************************************************** * types of codelets **************************************************************/ /* DFT codelets */ typedef struct kdft_desc_s kdft_desc; typedef struct { int (*okp)( const kdft_desc *desc, const R *ri, const R *ii, const R *ro, const R *io, INT is, INT os, INT vl, INT ivs, INT ovs, const planner *plnr); INT vl; } kdft_genus; struct kdft_desc_s { INT sz; /* size of transform computed */ const char *nam; opcnt ops; const kdft_genus *genus; INT is; INT os; INT ivs; INT ovs; }; typedef void (*kdft) (const R *ri, const R *ii, R *ro, R *io, stride is, stride os, INT vl, INT ivs, INT ovs); void X(kdft_register)(planner *p, kdft codelet, const kdft_desc *desc); typedef struct ct_desc_s ct_desc; typedef struct { int (*okp)( const struct ct_desc_s *desc, const R *rio, const R *iio, INT rs, INT vs, INT m, INT mb, INT me, INT ms, const planner *plnr); INT vl; } ct_genus; struct ct_desc_s { INT radix; const char *nam; const tw_instr *tw; const ct_genus *genus; opcnt ops; INT rs; INT vs; INT ms; }; typedef void (*kdftw) (R *rioarray, R *iioarray, const R *W, stride ios, INT mb, INT me, INT ms); void X(kdft_dit_register)(planner *p, kdftw codelet, const ct_desc *desc); void X(kdft_dif_register)(planner *p, kdftw codelet, const ct_desc *desc); typedef void (*kdftwsq) (R *rioarray, R *iioarray, const R *W, stride is, stride vs, INT mb, INT me, INT ms); void X(kdft_difsq_register)(planner *p, kdftwsq codelet, const ct_desc *desc); extern const solvtab X(solvtab_dft_standard); extern const solvtab X(solvtab_dft_sse2); extern const solvtab X(solvtab_dft_avx); extern const solvtab X(solvtab_dft_avx_128_fma); extern const solvtab X(solvtab_dft_avx2); extern const solvtab X(solvtab_dft_avx2_128); extern const solvtab X(solvtab_dft_avx512); extern const solvtab X(solvtab_dft_kcvi); extern const solvtab X(solvtab_dft_altivec); extern const solvtab X(solvtab_dft_vsx); extern const solvtab X(solvtab_dft_neon); extern const solvtab X(solvtab_dft_generic_simd128); extern const solvtab X(solvtab_dft_generic_simd256); #endif /* __DFT_CODELET_H__ */