xtensor/include/xtensor/misc/xfft.hpp at 7d469563fbaae1963ace5784b58dddc8f33af4ef · xtensor-stack/xtensor · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
#ifdef XTENSOR_USE_TBB
#include <oneapi/tbb.h>
#endif
#include <stdexcept>

#include <xtl/xcomplex.hpp>

#include "../containers/xarray.hpp"
#include "../core/xmath.hpp"
#include "../core/xnoalias.hpp"
#include "../generators/xbuilder.hpp"
#include "../misc/xcomplex.hpp"
#include "../utils/xutils.hpp"
#include "../views/xaxis_slice_iterator.hpp"
#include "../views/xview.hpp"
#include "./xtl_concepts.hpp"

namespace xt
{
    namespace fft
    {
        namespace detail
        {
            /**
             * @brief Recursive radix-2 FFT of a complex-valued expression.
             *
             * The input is copied into a rank-1 tensor, split into its even- and
             * odd-indexed samples, each half is transformed recursively (in parallel
             * when XTENSOR_USE_TBB is defined) and the two halves are recombined with
             * the factors exp(-2*pi*i*k/N).
             *
             * @param e expression whose value type is complex; its size must be a
             *          power of two
             * @return a rank-1 xtensor of the same length holding the transform
             * @throws std::runtime_error (through XTENSOR_THROW) when the size is zero
             *         or not a power of two
             */
            template <xtl::complex_concept E>
            inline auto radix2(E&& e)
            {
                using namespace xt::placeholders;
                using namespace std::complex_literals;
                using value_type = typename std::decay_t<E>::value_type;
                using precision = typename value_type::value_type;

                const auto N = e.size();
                // A non-zero size is a power of two exactly when it has a single bit set.
                if (N == 0 || (N & (N - 1)) != 0)
                {
                    // TODO: Replace implementation with dft
                    XTENSOR_THROW(std::runtime_error, "FFT Implementation requires power of 2");
                }

                xt::xtensor<value_type, 1> samples = e;
                if (N <= 1)
                {
                    // A single sample is its own transform; this also ends the recursion.
                    return samples;
                }

#ifdef XTENSOR_USE_TBB
                xt::xtensor<value_type, 1> even_part;
                xt::xtensor<value_type, 1> odd_part;
                oneapi::tbb::parallel_invoke(
                    [&]
                    {
                        even_part = radix2(xt::view(samples, xt::range(0, _, 2)));
                    },
                    [&]
                    {
                        odd_part = radix2(xt::view(samples, xt::range(1, _, 2)));
                    }
                );
#else
                auto even_part = radix2(xt::view(samples, xt::range(0, _, 2)));
                auto odd_part = radix2(xt::view(samples, xt::range(1, _, 2)));
#endif

                auto pi = xt::numeric_constants<precision>::PI;
                const auto half = static_cast<size_t>(N / 2);

                // Twiddle factors exp(-2*pi*i*k/N) for k = 0 .. N/2 - 1 (lazy expression).
                auto k = xt::arange<double>(0.5 * static_cast<double>(N));
                auto twiddle = xt::exp(static_cast<value_type>(-2i) * pi * k / static_cast<precision>(N));
                auto odd_term = twiddle * odd_part;

                // TODO: should be a call to stack if performance was improved
                auto result = xt::xtensor<value_type, 1>::from_shape({N});
                xt::view(result, xt::range(0, half)) = even_part + odd_term;
                xt::view(result, xt::range(half, N)) = even_part - odd_term;
                return result;
            }

            template <typename E>
            auto transform_bluestein(E&& data)
            {
                using value_type = typename std::decay_t<E>::value_type;
                using precision = typename value_type::value_type;

                // Find a power-of-2 convolution length m such that m >= n * 2 + 1
                const std::size_t n = data.size();
                auto m = static_cast<size_t>(std::ceil(std::log2(n * 2 + 1)));
                m = 1 << m;

                // Trignometric table
                auto exp_table = xt::xtensor<std::complex<precision>, 1>::from_shape({n});
                xt::xtensor<std::size_t, 1> i = xt::pow(xt::linspace<std::size_t>(0, n - 1, n), 2);
                i %= (n * 2);

                auto angles = xt::eval(
                    static_cast<precision>(3.141592653589793238463) * xt::cast<precision>(i)
                    / static_cast<precision>(n)
                );
                auto j = std::complex<precision>(0, 1);
                exp_table = xt::exp(-angles * j);

                // Temporary vectors and preprocessing
                auto av = xt::empty<std::complex<precision>>({m});
                xt::view(av, xt::range(0, n)) = data * exp_table;


                auto bv = xt::empty<std::complex<precision>>({m});
                xt::view(bv, xt::range(0, n)) = ::xt::conj(exp_table);
                xt::view(bv, xt::range(-n + 1, xt::placeholders::_)) = xt::view(
                    ::xt::conj(xt::flip(exp_table)),
                    xt::range(xt::placeholders::_, -1)
                );

                // Convolution
                auto xv = radix2(av);
                auto yv = radix2(bv);
                auto spectrum_k = xv * yv;
                auto complex_args = xt::conj(spectrum_k);
                auto fft_res = radix2(complex_args);
                auto cv = xt::conj(fft_res) / static_cast<precision>(m);

                return xt::eval(xt::view(cv, xt::range(0, n)) * exp_table);
            }
        }  // namespace detail

        /**
         * @brief 1D FFT of an Nd array along a specified axis
         * @param e an Nd expression to be transformed to the fourier domain
         * @param axis the axis along which to perform the 1D FFT
         * @return a transformed xarray of the specified precision
         */
        template <class E>
        inline auto fft(E&& e, std::ptrdiff_t axis = -1)
        {
            using value_type = typename std::decay<E>::type::value_type;
            if constexpr (xtl::is_complex<typename std::decay<E>::type::value_type>::value)
            {
                using precision = typename value_type::value_type;
                const auto saxis = xt::normalize_axis(e.dimension(), axis);
                const size_t N = e.shape(saxis);
                const bool powerOfTwo = !(N == 0) && !(N & (N - 1));
                xt::xarray<std::complex<precision>> out = xt::eval(e);
                auto begin = xt::axis_slice_begin(out, saxis);
                auto end = xt::axis_slice_end(out, saxis);
                for (auto iter = begin; iter != end; iter++)
                {
                    if (powerOfTwo)
                    {
                        xt::noalias(*iter) = detail::radix2(*iter);
                    }
                    else
                    {
                        xt::noalias(*iter) = detail::transform_bluestein(*iter);
                    }
                }
                return out;
            }
            else
            {
                return fft(xt::cast<std::complex<value_type>>(e), axis);
            }
        }

        /**
         * @brief Unnormalised 1D inverse FFT of an Nd expression along one axis.
         *
         * Computed as conj(fft(conj(e))). No division by the axis length is
         * performed here, so callers that need the true inverse must scale the
         * result by 1/N themselves (as convolve() does). Input whose value type is
         * not complex is first cast to std::complex of that value type.
         *
         * @param e an Nd expression in the fourier domain
         * @param axis the axis along which to perform the transform; negative
         *             values are resolved with xt::normalize_axis
         * @return the container returned by fft(), holding the unscaled inverse
         * @throws std::runtime_error (through XTENSOR_THROW) when the length along
         *         @p axis is zero
         */
        template <class E>
        inline auto ifft(E&& e, std::ptrdiff_t axis = -1)
        {
            if constexpr (xtl::is_complex<typename std::decay<E>::type::value_type>::value)
            {
                // Resolve the axis before indexing the shape: the default axis (-1)
                // must refer to the last dimension, not be reinterpreted as a huge
                // unsigned index.
                const auto saxis = xt::normalize_axis(e.dimension(), axis);

                // check the length of the data on that axis
                const std::size_t n = e.shape(saxis);
                if (n == 0)
                {
                    XTENSOR_THROW(std::runtime_error, "Cannot take the iFFT along an empty dimention");
                }
                auto complex_args = xt::conj(e);
                auto fft_res = xt::fft::fft(complex_args, axis);
                fft_res = xt::conj(fft_res);
                return fft_res;
            }
            else
            {
                using value_type = typename std::decay<E>::type::value_type;
                return ifft(xt::cast<std::complex<value_type>>(e), axis);
            }
        }

        /**
         * @brief performs a circular fft convolution; xvec and yvec must
         *        be the same shape.
         *
         * Both inputs are transformed along @p axis, multiplied slice by slice,
         * transformed back with ifft() and scaled by 1/n, where n is the length
         * along @p axis.
         *
         * @param xvec first array of the convolution
         * @param yvec second array of the convolution
         * @param axis axis along which to perform the convolution
         * @return the convolution result (complex-valued container returned by ifft())
         * @throws std::runtime_error (through XTENSOR_THROW) when the two inputs
         *         differ in number of dimensions or in any extent
         */
        template <typename E1, typename E2>
        auto convolve(E1&& xvec, E2&& yvec, std::ptrdiff_t axis = -1)
        {
            // we could broadcast but that could get complicated???
            if (xvec.dimension() != yvec.dimension())
            {
                XTENSOR_THROW(std::runtime_error, "Mismatched dimentions");
            }

            auto saxis = xt::normalize_axis(xvec.dimension(), axis);
            if (xvec.shape(saxis) != yvec.shape(saxis))
            {
                XTENSOR_THROW(std::runtime_error, "Mismatched lengths along slice axis");
            }

            // The slice-wise product below walks both spectra in lock step, so every
            // other extent has to match as well; otherwise the iterator over yv
            // would run past its end or part of the data would be ignored.
            const std::size_t ndim = xvec.dimension();
            for (std::size_t d = 0; d < ndim; ++d)
            {
                if (xvec.shape(d) != yvec.shape(d))
                {
                    XTENSOR_THROW(std::runtime_error, "Mismatched shapes");
                }
            }

            const std::size_t n = xvec.shape(saxis);

            // Hand the already normalised (non-negative) axis to the transforms so
            // that none of them has to interpret a negative index.
            const auto norm_axis = static_cast<std::ptrdiff_t>(saxis);

            auto xv = fft(xvec, norm_axis);
            auto yv = fft(yvec, norm_axis);

            auto begin_x = xt::axis_slice_begin(xv, saxis);
            auto end_x = xt::axis_slice_end(xv, saxis);
            auto iter_y = xt::axis_slice_begin(yv, saxis);

            // Pointwise product of the spectra, stored back into xv.
            for (auto iter = begin_x; iter != end_x; ++iter)
            {
                (*iter) = (*iter_y++) * (*iter);
            }

            auto outvec = ifft(xv, norm_axis);

            // Scaling (because this FFT implementation omits it)
            using outvec_type = typename decltype(outvec)::value_type::value_type;
            outvec_type scale = static_cast<outvec_type>(1.0) / static_cast<outvec_type>(n);
            outvec *= scale;

            return outvec;
        }

    }
}  // namespace xt::fft