#ifndef _LIBFFTSS_H
#define _LIBFFTSS_H
#ifdef HAVE_CONFIG_H
#include "config.h"
#elif defined(_WIN32)
#include "win32config.h"
#endif
#include <math.h>
typedef struct {
void (*kern)(double *, double *, double *, long, long);
long bsize, blocks;
long radix;
} fftss_kern;
typedef struct _fftss_plan_1d_s {
void (*fp)(struct _fftss_plan_1d_s *, double *, double *);
double *in, *out;
double *w;
double *work;
long n, logn2;
long stages;
long flags;
long sign;
long map_id, table_type, kset_id;
double fastest;
fftss_kern *k;
} fftss_plan_1d_s;
typedef fftss_plan_1d_s *fftss_plan_1d;
typedef struct _fftss_plan_s {
void (*fp)(struct _fftss_plan_s *, double *, double *);
double *in, *out;
long nx, ny, nz;
long py, pz;
long flags;
double **b;
double *work;
fftss_plan_1d p1, p2, p3;
} fftss_plan_s;
typedef fftss_plan_s *fftss_plan;
extern void fftss_copyin(double *, double *, long, long);
extern void fftss_copyout(double *, double *, long, long);
#ifndef _OPENMP
#define omp_get_max_threads() 1
#define omp_get_thread_num() 0
#endif
#define FFTSS_FORWARD -1
#define FFTSS_BACKWARD 1
#define FFTSS_MEASURE 0
#define FFTSS_DESTROY_INPUT (1<<0)
#define FFTSS_UNALIGNED (1<<1)
#define FFTSS_CONSERVE_MEMORY (1<<2)
#define FFTSS_EXHAUSTIVE (1<<3)
#define FFTSS_PRESERVE_INPUT (1<<4)
#define FFTSS_PATIENT (1<<5)
#define FFTSS_ESTIMATE (1<<6)
#define FFTSS_NO_SIMD (1<<17)
#define FFTSS_VERBOSE (1<<20)
#define FFTSS_INOUT (1<<21)
#ifndef M_PI
#define M_PI 3.14159265358979323846
#endif
extern int fftss_version(char *);
extern void fftss_execute(fftss_plan);
extern void fftss_execute_dft_1d(fftss_plan_1d, double *, double *);
extern void fftss_execute_inplace_dft_1d(fftss_plan_1d, double *, double *);
extern void *fftss_malloc(long);
extern void fftss_free(void *);
extern fftss_plan fftss_plan_dft_1d(long, double *, double *, long, long);
extern fftss_plan fftss_plan_dft_2d(long, long, long, double *, double *, long, long);
extern fftss_plan fftss_plan_dft_3d(long, long, long, long, long, double *, double *, long, long);
extern void fftss_set(fftss_plan, double *, double *);
extern void fftss_destroy_plan(fftss_plan);
extern double fftss_get_wtime(void);
extern int fftss_test_fma(void);
extern int fftss_verbose;
typedef void (*fftss_kernel)(double*, double*, double*, long, long);
enum{ KSET_NORMAL = 0, KSET_ONE, KSET_UNROLL1, KSET_UNROLL4, KSET_UNROLL8 };
typedef struct {
long table_type;
char *name;
int required, enabled;
fftss_kernel *r4f, *r8f;
fftss_kernel *r4b, *r8b;
} fftss_kset;
typedef struct {
char *name;
void (*gen)(fftss_plan_1d);
} fftss_table_type;
enum { FFTSS_TABLE_NORMAL = 0, FFTSS_TABLE_FMA };
extern fftss_table_type fftss_table_types[];
extern fftss_kset fftss_kset_list[];
extern double *fftss_table_alloc(long, long);
extern void fftss_table_add(long, long, double *);
#define FFTSS_MAP_MAX 4
typedef int (*fftss_map)(fftss_plan_1d, long);
extern fftss_map fftss_map_list[];
extern void fftss_use_kset(fftss_plan_1d, fftss_kernel *, fftss_kernel *);
extern int fftss_cpu;
extern void fftss_check_cpu(void);
#define FFTSS_ANY (0<<0)
#define FFTSS_X86_INTEL (1<<0)
#define FFTSS_X86_AMD (1<<1)
#define FFTSS_X86_MMX (1<<4)
#define FFTSS_X86_SSE (1<<5)
#define FFTSS_X86_SSE2 (1<<6)
#define FFTSS_X86_SSE3 (1<<7)
#define FFTSS_FMA (1<<8)
#define FFTSS_SIMD (FFTSS_X86_SSE2|FFTSS_X86_SSE3)
#define FFTSS_ALIGN (1<<20)
#endif