10 #ifndef EIGEN_CXX11_TENSOR_TENSOR_FFT_H
11 #define EIGEN_CXX11_TENSOR_TENSOR_FFT_H
29 template <
bool NeedUprade>
41 return std::complex<T>(
val, 0);
53 template <
int ResultType>
78 template <
typename FFT,
typename XprType,
int FFTResultType,
int FFTDir>
84 typedef std::conditional_t<FFTResultType == RealPart || FFTResultType == ImagPart, RealScalar, ComplexScalar>
88 typedef typename XprType::Nested
Nested;
89 typedef std::remove_reference_t<Nested>
Nested_;
90 static constexpr
int NumDimensions = XprTraits::NumDimensions;
91 static constexpr
int Layout = XprTraits::Layout;
95 template <
typename FFT,
typename XprType,
int FFTResultType,
int FFTDirection>
100 template <
typename FFT,
typename XprType,
int FFTResultType,
int FFTDirection>
108 template <
typename FFT,
typename XprType,
int FFTResultType,
int FFTDir>
114 typedef std::conditional_t<FFTResultType == RealPart || FFTResultType == ImagPart, RealScalar, ComplexScalar>
133 template <
typename FFT,
typename ArgType,
typename Device,
int FFTResultType,
int FFTDir>
145 typedef std::conditional_t<FFTResultType == RealPart || FFTResultType == ImagPart, RealScalar, ComplexScalar>
158 PreferBlockAccess =
false,
170 for (
int i = 0;
i < NumDims; ++
i) {
172 m_dimensions[
i] = input_dims[
i];
177 for (
int i = 1;
i < NumDims; ++
i) {
178 m_strides[
i] = m_strides[
i - 1] * m_dimensions[
i - 1];
181 m_strides[NumDims - 1] = 1;
182 for (
int i = NumDims - 2;
i >= 0; --
i) {
183 m_strides[
i] = m_strides[
i + 1] * m_dimensions[
i + 1];
186 m_size = m_dimensions.TotalSize();
192 m_impl.evalSubExprsIfNeeded(NULL);
214 template <
int LoadMode>
216 return internal::ploadt<PacketReturnType, LoadMode>(
m_data + index);
231 for (
Index i = 0;
i < m_size; ++
i) {
235 for (
size_t i = 0;
i < m_fft.size(); ++
i) {
238 Index line_len = m_dimensions[dim];
241 const bool is_power_of_two = isPowerOfTwo(line_len);
242 const Index good_composite = is_power_of_two ? 0 : findGoodComposite(line_len);
243 const Index log_len = is_power_of_two ? getLog2(line_len) : getLog2(good_composite);
251 if (!is_power_of_two) {
278 for (
int j = 0;
j < line_len + 1; ++
j) {
285 for (
Index partial_index = 0; partial_index < m_size / line_len; ++partial_index) {
286 const Index base_offset = getBaseOffsetFromIndex(partial_index, dim);
289 const Index stride = m_strides[dim];
293 Index offset = base_offset;
294 for (
int j = 0;
j < line_len; ++
j, offset += stride) {
295 line_buf[
j] = buf[offset];
300 if (is_power_of_two) {
301 processDataLineCooleyTukey(line_buf, line_len, log_len);
303 processDataLineBluestein(line_buf, line_len, good_composite, log_len,
a,
b, pos_j_base_powered);
310 Index offset = base_offset;
312 for (
int j = 0;
j < line_len; ++
j, offset += stride) {
313 buf[offset] = (FFTDir ==
FFT_FORWARD) ? line_buf[
j] : line_buf[
j] * div_factor;
318 if (!is_power_of_two) {
321 m_device.deallocate(pos_j_base_powered);
326 for (
Index i = 0;
i < m_size; ++
i) {
335 return !(
x & (
x - 1));
341 while (
i < 2 *
n - 1)
i *= 2;
347 while (
m >>= 1) log2m++;
355 scramble_FFT(line_buf, line_len);
356 compute_1D_Butterfly<FFTDir>(line_buf, line_len, log_len);
372 a[
i] =
data[
i] * pos_j_base_powered[
i];
381 b[
i] = pos_j_base_powered[
i];
391 b[
i] = pos_j_base_powered[
m -
i];
398 compute_1D_Butterfly<FFT_FORWARD>(
a,
m, log_len);
401 compute_1D_Butterfly<FFT_FORWARD>(
b,
m, log_len);
408 compute_1D_Butterfly<FFT_REVERSE>(
a,
m, log_len);
419 data[
i] =
a[
i] * pos_j_base_powered[
i];
432 while (
m >= 2 &&
j >
m) {
485 tmp_2[0] = tmp_1[0] + tmp_1[2];
486 tmp_2[1] = tmp_1[1] + tmp_1[3];
487 tmp_2[2] = tmp_1[0] - tmp_1[2];
488 tmp_2[3] = tmp_1[1] - tmp_1[3];
489 tmp_2[4] = tmp_1[4] + tmp_1[6];
491 #define SQRT2DIV2 0.7071067811865476
501 data[0] = tmp_2[0] + tmp_2[4];
502 data[1] = tmp_2[1] + tmp_2[5];
503 data[2] = tmp_2[2] + tmp_2[6];
504 data[3] = tmp_2[3] + tmp_2[7];
505 data[4] = tmp_2[0] - tmp_2[4];
506 data[5] = tmp_2[1] - tmp_2[5];
507 data[6] = tmp_2[2] - tmp_2[6];
508 data[7] = tmp_2[3] - tmp_2[7];
516 const RealScalar wtemp = m_sin_PI_div_n_LUT[n_power_of_2];
518 (Dir ==
FFT_FORWARD) ? m_minus_sin_2_PI_div_n_LUT[n_power_of_2] : -m_minus_sin_2_PI_div_n_LUT[n_power_of_2];
538 data[
i + 1] += temp1;
541 data[
i + 2] += temp2;
544 data[
i + 3] += temp3;
552 compute_1D_Butterfly<Dir>(
data,
n / 2, n_power_of_2 - 1);
553 compute_1D_Butterfly<Dir>(
data +
n / 2,
n / 2, n_power_of_2 - 1);
554 butterfly_1D_merge<Dir>(
data,
n, n_power_of_2);
556 butterfly_8<Dir>(
data);
558 butterfly_4<Dir>(
data);
560 butterfly_2<Dir>(
data);
568 for (
int i = NumDims - 1;
i > omitted_dim; --
i) {
569 const Index partial_m_stride = m_strides[
i] / m_dimensions[omitted_dim];
570 const Index idx = index / partial_m_stride;
571 index -= idx * partial_m_stride;
572 result += idx * m_strides[
i];
576 for (
Index i = 0;
i < omitted_dim; ++
i) {
577 const Index partial_m_stride = m_strides[
i] / m_dimensions[omitted_dim];
578 const Index idx = index / partial_m_stride;
579 index -= idx * partial_m_stride;
580 result += idx * m_strides[
i];
589 Index result = base + offset * m_strides[omitted_dim];
AnnoyingScalar conj(const AnnoyingScalar &x)
Definition: AnnoyingScalar.h:133
int i
Definition: BiCGSTAB_step_by_step.cpp:9
const unsigned n
Definition: CG3DPackingUnitTest.cpp:11
#define EIGEN_ALWAYS_INLINE
Definition: Macros.h:845
#define EIGEN_DEVICE_FUNC
Definition: Macros.h:892
#define eigen_assert(x)
Definition: Macros.h:910
#define EIGEN_STRONG_INLINE
Definition: Macros.h:834
#define EIGEN_PI
Definition: MathFunctions.h:16
RowVector3d w
Definition: Matrix_resize_int.cpp:3
#define EIGEN_DEVICE_REF
Definition: TensorMacros.h:34
Scalar * b
Definition: benchVecAdd.cpp:17
SCALAR Scalar
Definition: bench_gemm.cpp:45
NumTraits< Scalar >::Real RealScalar
Definition: bench_gemm.cpp:46
Generic expression where a coefficient-wise binary operator is applied to two expressions.
Definition: CwiseBinaryOp.h:79
The tensor base class.
Definition: TensorBase.h:1026
Definition: TensorFFT.h:109
const FFT m_fft
Definition: TensorFFT.h:129
Eigen::internal::nested< TensorFFTOp >::type Nested
Definition: TensorFFT.h:117
EIGEN_DEVICE_FUNC const FFT & fft() const
Definition: TensorFFT.h:123
OutputScalar CoeffReturnType
Definition: TensorFFT.h:116
Eigen::NumTraits< Scalar >::Real RealScalar
Definition: TensorFFT.h:112
Eigen::internal::traits< TensorFFTOp >::Scalar Scalar
Definition: TensorFFT.h:111
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorFFTOp(const XprType &expr, const FFT &fft)
Definition: TensorFFT.h:121
EIGEN_DEVICE_FUNC const internal::remove_all_t< typename XprType::Nested > & expression() const
Definition: TensorFFT.h:125
Eigen::internal::traits< TensorFFTOp >::StorageKind StorageKind
Definition: TensorFFT.h:118
std::conditional_t< FFTResultType==RealPart||FFTResultType==ImagPart, RealScalar, ComplexScalar > OutputScalar
Definition: TensorFFT.h:115
Eigen::internal::traits< TensorFFTOp >::Index Index
Definition: TensorFFT.h:119
std::complex< RealScalar > ComplexScalar
Definition: TensorFFT.h:113
XprType::Nested m_xpr
Definition: TensorFFT.h:128
Definition: TensorCostModel.h:28
Definition: TensorBlock.h:566
@ ColMajor
Definition: Constants.h:318
EIGEN_BLAS_FUNC() swap(int *n, RealScalar *px, int *incx, RealScalar *py, int *incy)
Definition: level1_impl.h:117
const Scalar * a
Definition: level2_cplx_impl.h:32
int * m
Definition: level2_cplx_impl.h:294
char char * op
Definition: level2_impl.h:374
Eigen::Matrix< Scalar, Dynamic, Dynamic, ColMajor > tmp
Definition: level3_impl.h:365
typename remove_all< T >::type remove_all_t
Definition: Meta.h:142
EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE T cos(const T &x)
Definition: MathFunctions.h:1559
EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE T sin(const T &x)
Definition: MathFunctions.h:1581
Namespace containing all symbols from the Eigen library.
Definition: bench_norm.cpp:70
FFTDirection
Definition: TensorForwardDeclarations.h:170
@ FFT_FORWARD
Definition: TensorForwardDeclarations.h:170
std::array< T, N > array
Definition: EmulateArray.h:231
squared absolute value
Definition: GlobalFunctions.h:87
FFTResultType
Definition: TensorForwardDeclarations.h:168
@ ImagPart
Definition: TensorForwardDeclarations.h:168
@ RealPart
Definition: TensorForwardDeclarations.h:168
EIGEN_DEFAULT_DENSE_INDEX_TYPE Index
The Index type as used for the API.
Definition: Meta.h:83
val
Definition: calibrate.py:119
Definition: Eigen_Colamd.h:49
list x
Definition: plotDoE.py:28
Definition: Constants.h:519
T Real
Definition: NumTraits.h:183
EIGEN_DEVICE_FUNC std::complex< T > operator()(const std::complex< T > &val) const
Definition: TensorFFT.h:48
EIGEN_DEVICE_FUNC std::complex< T > operator()(const T &val) const
Definition: TensorFFT.h:40
Definition: TensorFFT.h:30
EIGEN_DEVICE_FUNC T operator()(const T &val) const
Definition: TensorFFT.h:32
T operator()(const std::complex< T > &val) const
Definition: TensorFFT.h:72
T operator()(const std::complex< T > &val) const
Definition: TensorFFT.h:64
Definition: TensorFFT.h:54
T operator()(const T &val) const
Definition: TensorFFT.h:56
Definition: TensorForwardDeclarations.h:42
internal::TensorBlockNotImplemented TensorBlock
Definition: TensorFFT.h:164
EIGEN_DEVICE_FUNC EvaluatorPointerType data() const
Definition: TensorFFT.h:223
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE void butterfly_8(ComplexScalar *data)
Definition: TensorFFT.h:465
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE void evalToBuf(EvaluatorPointerType data)
Definition: TensorFFT.h:226
const Device EIGEN_DEVICE_REF m_device
Definition: TensorFFT.h:600
EvaluatorPointerType m_data
Definition: TensorFFT.h:599
internal::traits< XprType > XprTraits
Definition: TensorFFT.h:143
Storage::Type EvaluatorPointerType
Definition: TensorFFT.h:151
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE void processDataLineCooleyTukey(ComplexScalar *line_buf, Index line_len, Index log_len)
Definition: TensorFFT.h:352
TensorEvaluator< ArgType, Device > m_impl
Definition: TensorFFT.h:598
TensorFFTOp< FFT, ArgType, FFTResultType, FFTDir > XprType
Definition: TensorFFT.h:135
Dimensions m_dimensions
Definition: TensorFFT.h:596
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE Index getIndexFromOffset(Index base, Index omitted_dim, Index offset) const
Definition: TensorFFT.h:588
EIGEN_STRONG_INLINE TensorEvaluator(const XprType &op, const Device &device)
Definition: TensorFFT.h:167
Index m_size
Definition: TensorFFT.h:594
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE bool isPowerOfTwo(Index x)
Definition: TensorFFT.h:333
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE Index getBaseOffsetFromIndex(Index index, Index omitted_dim) const
Definition: TensorFFT.h:564
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE void processDataLineBluestein(ComplexScalar *line_buf, Index line_len, Index good_composite, Index log_len, ComplexScalar *a, ComplexScalar *b, const ComplexScalar *pos_j_base_powered)
Definition: TensorFFT.h:360
const FFT EIGEN_DEVICE_REF m_fft
Definition: TensorFFT.h:595
EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE CoeffReturnType coeff(Index index) const
Definition: TensorFFT.h:212
PacketType< OutputScalar, Device >::type PacketReturnType
Definition: TensorFFT.h:148
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE void butterfly_1D_merge(ComplexScalar *data, Index n, Index n_power_of_2)
Definition: TensorFFT.h:512
std::complex< RealScalar > ComplexScalar
Definition: TensorFFT.h:141
DSizes< Index, NumDims > Dimensions
Definition: TensorFFT.h:138
Eigen::NumTraits< Scalar >::Real RealScalar
Definition: TensorFFT.h:140
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE Index findGoodComposite(Index n)
Definition: TensorFFT.h:339
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const
Definition: TensorFFT.h:219
EIGEN_STRONG_INLINE void cleanup()
Definition: TensorFFT.h:204
array< Index, NumDims > m_strides
Definition: TensorFFT.h:597
XprTraits::Scalar InputScalar
Definition: TensorFFT.h:144
XprType::Scalar Scalar
Definition: TensorFFT.h:139
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE void scramble_FFT(ComplexScalar *data, Index n)
Definition: TensorFFT.h:424
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Dimensions & dimensions() const
Definition: TensorFFT.h:189
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE void butterfly_4(ComplexScalar *data)
Definition: TensorFFT.h:448
std::conditional_t< FFTResultType==RealPart||FFTResultType==ImagPart, RealScalar, ComplexScalar > OutputScalar
Definition: TensorFFT.h:146
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE void butterfly_2(ComplexScalar *data)
Definition: TensorFFT.h:441
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE void compute_1D_Butterfly(ComplexScalar *data, Index n, Index n_power_of_2)
Definition: TensorFFT.h:549
StorageMemory< CoeffReturnType, Device > Storage
Definition: TensorFFT.h:150
EIGEN_STRONG_INLINE bool evalSubExprsIfNeeded(EvaluatorPointerType data)
Definition: TensorFFT.h:191
TensorEvaluator< ArgType, Device >::Dimensions InputDimensions
Definition: TensorFFT.h:142
EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE PacketReturnType packet(Index index) const
Definition: TensorFFT.h:215
EIGEN_DEVICE_FUNC static EIGEN_STRONG_INLINE Index getLog2(Index m)
Definition: TensorFFT.h:345
OutputScalar CoeffReturnType
Definition: TensorFFT.h:147
XprType::Index Index
Definition: TensorFFT.h:136
A cost model used to limit the number of threads used for evaluating tensor expression.
Definition: TensorEvaluator.h:31
static constexpr int Layout
Definition: TensorEvaluator.h:46
const Device EIGEN_DEVICE_REF m_device
Definition: TensorEvaluator.h:170
Storage::Type EvaluatorPointerType
Definition: TensorEvaluator.h:41
@ PacketAccess
Definition: TensorEvaluator.h:50
@ IsAligned
Definition: TensorEvaluator.h:49
static constexpr int PacketSize
Definition: TensorEvaluator.h:38
EIGEN_DEVICE_FUNC EvaluatorPointerType data() const
Definition: TensorEvaluator.h:165
EvaluatorPointerType m_data
Definition: TensorEvaluator.h:168
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Dimensions & dimensions() const
Definition: TensorEvaluator.h:69
const TensorFFTOp< FFT, XprType, FFTResultType, FFTDirection > & type
Definition: TensorFFT.h:97
Definition: XprHelper.h:427
TensorFFTOp< FFT, XprType, FFTResultType, FFTDirection > type
Definition: TensorFFT.h:103
Definition: TensorTraits.h:152
ref_selector< T >::type type
Definition: TensorTraits.h:153
traits< XprType > XprTraits
Definition: TensorFFT.h:80
std::conditional_t< FFTResultType==RealPart||FFTResultType==ImagPart, RealScalar, ComplexScalar > OutputScalar
Definition: TensorFFT.h:85
XprTraits::Index Index
Definition: TensorFFT.h:87
traits< XprType >::PointerType PointerType
Definition: TensorFFT.h:92
XprTraits::Scalar InputScalar
Definition: TensorFFT.h:83
std::complex< RealScalar > ComplexScalar
Definition: TensorFFT.h:82
XprType::Nested Nested
Definition: TensorFFT.h:88
std::remove_reference_t< Nested > Nested_
Definition: TensorFFT.h:89
XprTraits::StorageKind StorageKind
Definition: TensorFFT.h:86
NumTraits< typename XprTraits::Scalar >::Real RealScalar
Definition: TensorFFT.h:81
Definition: ForwardDeclarations.h:21
Definition: GenericPacketMath.h:134
std::ptrdiff_t j
Definition: tut_arithmetic_redux_minmax.cpp:2