mayhem-firmware/firmware/common/dsp_fft.hpp

/*
 * Copyright (C) 2013 Jared Boone, ShareBrained Technology, Inc.
 *
 * This file is part of PortaPack.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2, or (at your option)
 * any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; see the file COPYING.  If not, write to
 * the Free Software Foundation, Inc., 51 Franklin Street,
 * Boston, MA 02110-1301, USA.
 */

#ifndef __DSP_FFT_H__
#define __DSP_FFT_H__

#include <cstdint>
#include <cstddef>
#include <complex>
#include <cmath>
#include <type_traits>
#include <array>

#include "dsp_types.hpp"
#include "complex.hpp"
#include "hal.h"
#include "utility.hpp"
#include "sine_table_int8.hpp"

namespace std {
	/* https://github.com/AE9RB/fftbench/blob/master/cxlr.hpp
	 * Trick credited to AE9RB (David Turnbull): a plain, non-template
	 * complex<float> product written as the textbook
	 *   (a + jb) * (c + jd) = (ac - bd) + j(ad + bc)
	 * so the compiler can emit simple fused multiply-accumulate code instead
	 * of the NaN-handling path of the library operator.
	 */
	inline complex<float>
	operator*(const complex<float>& v1, const complex<float>& v2) {
		const float a = v1.real();
		const float b = v1.imag();
		const float c = v2.real();
		const float d = v2.imag();

		return complex<float> {
			a * c - b * d,	/* real part */
			a * d + b * c	/* imaginary part */
		};
	}
} /* namespace std */

/* Copy N complex samples from a raw sample buffer into dst in bit-reversed
 * order, converting each component to dst's element value type.
 *
 * src: buffer whose samples are read through src.p[0 .. N-1]. No length
 *      check is made here, so the caller must supply at least N samples.
 * dst: receives sample i at index bit_reverse(i) over log_2(N) bits.
 */
template<typename T, size_t N>
void fft_swap(const buffer_c16_t src, std::array<T, N>& dst) {
	static_assert(power_of_two(N), "only defined for N == power of two");

	using component_t = typename T::value_type;

	/* __RBIT mirrors all 32 bits; shifting right keeps only the log_2(N)
	 * bits that form a valid index. */
	constexpr auto index_shift = 32 - log_2(N);

	for(size_t n = 0; n != N; ++n) {
		const size_t mirrored = __RBIT(n) >> index_shift;
		const auto sample = src.p[n];
		const component_t re = static_cast<component_t>(sample.real());
		const component_t im = static_cast<component_t>(sample.imag());
		dst[mirrored] = { re, im };
	}
}

/* Copy an array of complex16_t samples into dst in bit-reversed order,
 * converting each component to dst's element value type.
 *
 * src: N input samples in natural order.
 * dst: receives sample i at index bit_reverse(i) over log_2(N) bits.
 */
template<typename T, size_t N>
void fft_swap(const std::array<complex16_t, N>& src, std::array<T, N>& dst) {
	static_assert(power_of_two(N), "only defined for N == power of two");

	using component_t = typename T::value_type;

	/* __RBIT mirrors all 32 bits; shifting right keeps only the log_2(N)
	 * bits that form a valid index. */
	constexpr auto index_shift = 32 - log_2(N);

	for(size_t n = 0; n != N; ++n) {
		const size_t mirrored = __RBIT(n) >> index_shift;
		const auto sample = src[n];
		const component_t re = static_cast<component_t>(sample.real());
		const component_t im = static_cast<component_t>(sample.imag());
		dst[mirrored] = { re, im };
	}
}

/* Copy src into dst in bit-reversed order, without any type conversion.
 *
 * src: N input elements in natural order.
 * dst: receives element i at index bit_reverse(i) over log_2(N) bits.
 */
template<typename T, size_t N>
void fft_swap(const std::array<T, N>& src, std::array<T, N>& dst) {
	static_assert(power_of_two(N), "only defined for N == power of two");

	/* __RBIT mirrors all 32 bits; shifting right keeps only the log_2(N)
	 * bits that form a valid index. */
	constexpr auto index_shift = 32 - log_2(N);

	size_t n = 0;
	while( n < N ) {
		const size_t mirrored = __RBIT(n) >> index_shift;
		dst[mirrored] = src[n];
		++n;
	}
}

/* Reorder data into bit-reversed index order, in place.
 *
 * Element i trades places with element bit_reverse(i), where the reversal is
 * taken over log_2(N) bits. Bit reversal is its own inverse, so the indices
 * pair up (or map to themselves) and each pair must be exchanged exactly once.
 *
 * Every index is visited and the exchange happens only when i < i_rev.
 * Visiting just the lower half and swapping unconditionally is not enough:
 * a pair whose members are both below N/2 (e.g. 2 <-> 4 for N = 16) would be
 * swapped twice and end up unchanged, and a pair whose members are both at or
 * above N/2 (e.g. 11 <-> 13 for N = 16) would never be swapped.
 *
 * data: array to permute; N must be a power of two.
 */
template<typename T, size_t N>
void fft_swap_in_place(std::array<T, N>& data) {
	static_assert(power_of_two(N), "only defined for N == power of two");

	for(size_t i=0; i<N; i++) {
		/* __RBIT mirrors all 32 bits; the shift keeps the log_2(N) index bits. */
		const size_t i_rev = __RBIT(i) >> (32 - log_2(N));
		/* Swap only from the lower index of each pair; skip fixed points. */
		if( i < i_rev ) {
			std::swap(data[i], data[i_rev]);
		}
	}
}

/* http://beige.ucs.indiana.edu/B673/node14.html */
/* http://www.drdobbs.com/cpp/a-simple-and-efficient-fft-implementatio/199500857?pgno=3 */

/* In-place radix-2 butterfly passes over data that is already in
 * bit-reversed order (see the fft_swap helpers).
 *
 * data: N complex values, N a power of two with log_2(N) <= 8.
 * from: first butterfly stage to run (stage k joins groups of 2^k values).
 * to:   one past the last stage to run; from = 0, to = log_2(N) runs every
 *       stage.
 *
 * Returns without touching data when either stage bound exceeds log_2(N).
 */
template<typename T, size_t N>
void fft_c_preswapped(std::array<T, N>& data, const size_t from, const size_t to) {
	static_assert(power_of_two(N), "only defined for N == power of two");
	constexpr auto stage_count = log_2(N);
	if( (from > stage_count) || (to > stage_count) ) {
		return;
	}

	constexpr size_t table_stages = 8;
	static_assert(stage_count <= table_stages, "No FFT twiddle factors for K > 8");

	/* Per-stage twiddle increment: entry k is (cos(t) - 1, -sin(t)) with
	 * t = pi / 2^k, so "w += w * step" rotates w by -t. The trailing number
	 * is the butterfly group size (2 * half) of that stage. */
	static constexpr std::array<std::complex<float>, table_stages> twiddle_step { {
		{ -2.0f,                        0.0f                     },	// 2
		{ -1.0f,                       -1.0f                     },	// 4
		{ -0.2928932188134524756f,     -0.7071067811865475244f   },	// 8
		{ -0.076120467488713243872f,   -0.38268343236508977173f  },	// 16
		{ -0.019214719596769550874f,   -0.19509032201612826785f  },	// 32
		{ -0.0048152733278031137552f,  -0.098017140329560601994f },	// 64
		{ -0.0012045437948276072852f,  -0.049067674327418014255f },	// 128
		{ -0.00030118130379577988423f, -0.024541228522912288032f },	// 256
	} };

	/* Provide data to this function, pre-swapped. */
	for(size_t stage = from; stage < to; ++stage) {
		const size_t half = 1 << stage;		/* distance between butterfly partners */
		const size_t group = half * 2;		/* values covered by one butterfly group */
		const auto step = twiddle_step[stage];

		T w { 1.0f, 0.0f };
		for(size_t offset = 0; offset < half; ++offset) {
			/* Apply the current twiddle to the same offset in every group. */
			for(size_t lower = offset; lower < N; lower += group) {
				const size_t upper = lower + half;
				const T temp = w * data[upper];
				data[upper] = data[lower] - temp;
				data[lower] += temp;
			}
			/* Advance the twiddle by recurrence rather than recomputing it. */
			w += w * step;
		}
	}
}

/* 
   ifft(v,N):
   [0] If N==1 then return.
   [1] For k = 0 to N/2-1, let ve[k] = v[2*k]
   [2] Compute ifft(ve, N/2);
   [3] For k = 0 to N/2-1, let vo[k] = v[2*k+1]
   [4] Compute ifft(vo, N/2);
   [5] For m = 0 to N/2-1, do [6] through [9]
   [6]   Let w.real() = cos(2*PI*m/N)
   [7]   Let w.imag() = sin(2*PI*m/N)
   [8]   Let v[m] = ve[m] + w*vo[m]
   [9]   Let v[m+N/2] = ve[m] - w*vo[m]
 */
/* Recursive radix-2 transform following the ifft(v,N) recipe: split v into
 * its even- and odd-indexed halves, transform each half, then recombine with
 * twiddles read from sine_table_i8.
 *
 * v:   n values, overwritten with the result. Also used as scratch space by
 *      the recursive calls.
 * n:   number of values; nothing is done when n <= 1.
 * tmp: scratch space for n values; it must not overlap v.
 *
 * NOTE(review): the halving recursion presumably expects n to be a power of
 * two - confirm against callers.
 */
template<typename T>
void ifft( T *v, int n, T *tmp )
{
	if( n <= 1 ) {
		return;
	}

	const int half = n / 2;
	T* const even = tmp;
	T* const odd = tmp + half;

	/* De-interleave v into the two scratch halves. */
	for(int idx = 0; idx < half; ++idx) {
		even[idx] = v[2 * idx];
		odd[idx] = v[2 * idx + 1];
	}

	ifft( even, half, v );		/* FFT on even-indexed elements of v[] */
	ifft( odd, half, v );		/* FFT on odd-indexed elements of v[] */

	for(int bin = 0; bin < half; ++bin) {
		/* Table index: 0x100 steps span one full turn, and the 0x40
		 * (quarter turn) offset turns the sine lookup into a cosine. */
		T w;
		w.real(sine_table_i8[(static_cast<int>(bin / static_cast<double>(n) * 0x100 + 0x40)) & 0xFF]);
		w.imag(sine_table_i8[(static_cast<int>(bin / static_cast<double>(n) * 0x100)) & 0xFF]);

		const auto w_re = w.real();
		const auto w_im = w.imag();
		const auto odd_re = odd[bin].real();
		const auto odd_im = odd[bin].imag();

		/* z = w * odd[bin]; the division by 127 presumably undoes the
		 * table's peak amplitude - confirm in sine_table_int8.hpp. */
		T z;
		z.real((w_re * odd_re - w_im * odd_im) / 127);	/* Re(w*vo[m]) */
		z.imag((w_re * odd_im + w_im * odd_re) / 127);	/* Im(w*vo[m]) */

		const auto even_re = even[bin].real();
		const auto even_im = even[bin].imag();

		v[bin].real(even_re + z.real());
		v[bin].imag(even_im + z.imag());
		v[bin + half].real(even_re - z.real());
		v[bin + half].imag(even_im - z.imag());
	}
}

#endif/*__DSP_FFT_H__*/
Initial firmware commit. 2015-07-08 08:39:24 -07:00			`/*`
			`* Copyright (C) 2013 Jared Boone, ShareBrained Technology, Inc.`
			`*`
			`* This file is part of PortaPack.`
			`*`
			`* This program is free software; you can redistribute it and/or modify`
			`* it under the terms of the GNU General Public License as published by`
			`* the Free Software Foundation; either version 2, or (at your option)`
			`* any later version.`
			`*`
			`* This program is distributed in the hope that it will be useful,`
			`* but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`* GNU General Public License for more details.`
			`*`
			`* You should have received a copy of the GNU General Public License`
			`* along with this program; see the file COPYING. If not, write to`
			`* the Free Software Foundation, Inc., 51 Franklin Street,`
			`* Boston, MA 02110-1301, USA.`
			`*/`

			`#ifndef __DSP_FFT_H__`
			`#define __DSP_FFT_H__`

			`#include <cstdint>`
			`#include <cstddef>`
			`#include <complex>`
			`#include <cmath>`
			`#include <type_traits>`
			`#include <array>`

Add more fft_swap bit reversal functions. 2015-09-17 17:27:37 -07:00			`#include "dsp_types.hpp"`
Initial firmware commit. 2015-07-08 08:39:24 -07:00			`#include "complex.hpp"`
			`#include "hal.h"`
Extract some constexpr math utilities to utility.hpp ...my dumping ground for so many random bits. 2016-02-10 10:15:42 -08:00			`#include "utility.hpp"`
New app: Spectrum Painter (#988) * added spectrum painter app 2023-05-14 23:09:43 +02:00			`#include "sine_table_int8.hpp"`
Initial firmware commit. 2015-07-08 08:39:24 -07:00
			`namespace std {`
			`/* https://github.com/AE9RB/fftbench/blob/master/cxlr.hpp`
			`* Nice trick from AE9RB (David Turnbull) to get compiler to produce simpler`
			`* fma (fused multiply-accumulate) instead of worrying about NaN handling`
			`*/`
			`inline complex<float>`
			`operator*(const complex<float>& v1, const complex<float>& v2) {`
			`return complex<float> {`
			`v1.real() * v2.real() - v1.imag() * v2.imag(),`
			`v1.real() * v2.imag() + v1.imag() * v2.real()`
			`};`
			`}`
			`} /* namespace std */`

Add more fft_swap bit reversal functions. 2015-09-17 17:27:37 -07:00			`template<typename T, size_t N>`
			`void fft_swap(const buffer_c16_t src, std::array<T, N>& dst) {`
			`static_assert(power_of_two(N), "only defined for N == power of two");`

			`for(size_t i=0; i<N; i++) {`
			`const size_t i_rev = __RBIT(i) >> (32 - log_2(N));`
			`const auto s = src.p[i];`
			`dst[i_rev] = {`
			`static_cast<typename T::value_type>(s.real()),`
			`static_cast<typename T::value_type>(s.imag())`
			`};`
			`}`
			`}`

Initial firmware commit. 2015-07-08 08:39:24 -07:00			`template<typename T, size_t N>`
			`void fft_swap(const std::array<complex16_t, N>& src, std::array<T, N>& dst) {`
			`static_assert(power_of_two(N), "only defined for N == power of two");`

			`for(size_t i=0; i<N; i++) {`
			`const size_t i_rev = __RBIT(i) >> (32 - log_2(N));`
			`const auto s = src[i];`
			`dst[i_rev] = {`
			`static_cast<typename T::value_type>(s.real()),`
			`static_cast<typename T::value_type>(s.imag())`
			`};`
			`}`
			`}`

			`template<typename T, size_t N>`
Add more fft_swap bit reversal functions. 2015-09-17 17:27:37 -07:00			`void fft_swap(const std::array<T, N>& src, std::array<T, N>& dst) {`
Initial firmware commit. 2015-07-08 08:39:24 -07:00			`static_assert(power_of_two(N), "only defined for N == power of two");`

			`for(size_t i=0; i<N; i++) {`
Add more fft_swap bit reversal functions. 2015-09-17 17:27:37 -07:00			`const size_t i_rev = __RBIT(i) >> (32 - log_2(N));`
			`dst[i_rev] = src[i];`
			`}`
			`}`

			`template<typename T, size_t N>`
			`void fft_swap_in_place(std::array<T, N>& data) {`
			`static_assert(power_of_two(N), "only defined for N == power of two");`

			`for(size_t i=0; i<N/2; i++) {`
Initial firmware commit. 2015-07-08 08:39:24 -07:00			`const size_t i_rev = __RBIT(i) >> (32 - log_2(N));`
			`std::swap(data[i], data[i_rev]);`
			`}`
			`}`

			`/* http://beige.ucs.indiana.edu/B673/node14.html */`
			`/* http://www.drdobbs.com/cpp/a-simple-and-efficient-fft-implementatio/199500857?pgno=3 */`

			`template<typename T, size_t N>`
Added an audio FFT view in Wideband FM receive Tried speeding up fill_rectangle for clearing the waveform widget 2018-05-21 18:46:48 +01:00			`void fft_c_preswapped(std::array<T, N>& data, const size_t from, const size_t to) {`
Initial firmware commit. 2015-07-08 08:39:24 -07:00			`static_assert(power_of_two(N), "only defined for N == power of two");`
Hard-code K=8 FFT twiddle constants for now. So low on baseband RAM! This eliminates the sin_f32() function and table, which is only used in the FFT, for the moment. 2016-01-03 20:08:26 -08:00			`constexpr auto K = log_2(N);`
Added an audio FFT view in Wideband FM receive Tried speeding up fill_rectangle for clearing the waveform widget 2018-05-21 18:46:48 +01:00			`if ((to > K) \|\| (from > K)) return;`
Hard-code K=8 FFT twiddle constants for now. So low on baseband RAM! This eliminates the sin_f32() function and table, which is only used in the FFT, for the moment. 2016-01-03 20:08:26 -08:00
FFT twiddles can be used for all K <= table length. Change assert to allow FFTs < 8. 2016-01-03 20:25:31 -08:00			`constexpr size_t K_max = 8;`
			`static_assert(K <= K_max, "No FFT twiddle factors for K > 8");`
			`static constexpr std::array<std::complex<float>, K_max> wp_table { {`
Added an audio FFT view in Wideband FM receive Tried speeding up fill_rectangle for clearing the waveform widget 2018-05-21 18:46:48 +01:00			`{ -2.0f, 0.0f }, // 2`
			`{ -1.0f, -1.0f }, // 4`
			`{ -0.2928932188134524756f, -0.7071067811865475244f }, // 8`
			`{ -0.076120467488713243872f, -0.38268343236508977173f }, // 16`
			`{ -0.019214719596769550874f, -0.19509032201612826785f }, // 32`
			`{ -0.0048152733278031137552f, -0.098017140329560601994f }, // 64`
			`{ -0.0012045437948276072852f, -0.049067674327418014255f }, // 128`
			`{ -0.00030118130379577988423f, -0.024541228522912288032f }, // 256`
Hard-code K=8 FFT twiddle constants for now. So low on baseband RAM! This eliminates the sin_f32() function and table, which is only used in the FFT, for the moment. 2016-01-03 20:08:26 -08:00			`} };`
Initial firmware commit. 2015-07-08 08:39:24 -07:00
			`/* Provide data to this function, pre-swapped. */`
Added an audio FFT view in Wideband FM receive Tried speeding up fill_rectangle for clearing the waveform widget 2018-05-21 18:46:48 +01:00			`for(size_t k = from; k < to; k++) {`
Little FFT loop indexing tweak. 2016-01-03 17:47:08 -08:00			`const size_t mmax = 1 << k;`
Hard-code K=8 FFT twiddle constants for now. So low on baseband RAM! This eliminates the sin_f32() function and table, which is only used in the FFT, for the moment. 2016-01-03 20:08:26 -08:00			`const auto wp = wp_table[k];`
Initial firmware commit. 2015-07-08 08:39:24 -07:00			`T w { 1.0f, 0.0f };`
			`for(size_t m = 0; m < mmax; ++m) {`
			`for(size_t i = m; i < N; i += mmax * 2) {`
			`const size_t j = i + mmax;`
			`const T temp = w * data[j];`
			`data[j] = data[i] - temp;`
			`data[i] += temp;`
			`}`
			`w += w * wp;`
			`}`
			`}`
			`}`

New app: Spectrum Painter (#988) * added spectrum painter app 2023-05-14 23:09:43 +02:00			`/*`
			`ifft(v,N):`
			`[0] If N==1 then return.`
			`[1] For k = 0 to N/2-1, let ve[k] = v[2*k]`
			`[2] Compute ifft(ve, N/2);`
			`[3] For k = 0 to N/2-1, let vo[k] = v[2*k+1]`
			`[4] Compute ifft(vo, N/2);`
			`[5] For m = 0 to N/2-1, do [6] through [9]`
			`[6] Let w.real() = cos(2PIm/N)`
			`[7] Let w.imag() = sin(2PIm/N)`
			`[8] Let v[m] = ve[m] + w*vo[m]`
			`[9] Let v[m+N/2] = ve[m] - w*vo[m]`
			`*/`
			`template<typename T>`
			`void ifft( T v, int n, T tmp )`
			`{`
			`if(n>1) {`
			`int k,m;`
			`T z, w, vo, ve;`
			`ve = tmp; vo = tmp+n/2;`
			`for(k=0; k<n/2; k++) {`
			`ve[k] = v[2*k];`
			`vo[k] = v[2*k+1];`
			`}`
			`ifft( ve, n/2, v ); /* FFT on even-indexed elements of v[] */`
			`ifft( vo, n/2, v ); /* FFT on odd-indexed elements of v[] */`
			`for(m=0; m<n/2; m++) {`
			`w.real(sine_table_i8[((int)(m/(double)n * 0x100 + 0x40)) & 0xFF]);`
			`w.imag(sine_table_i8[((int)(m/(double)n * 0x100)) & 0xFF]);`

			`z.real((w.real()vo[m].real() - w.imag()vo[m].imag())/127); /* Re(wvo[m]) /`
			`z.imag((w.real()vo[m].imag() + w.imag()vo[m].real())/127); /* Im(wvo[m]) /`
			`v[ m ].real(ve[m].real() + z.real());`
			`v[ m ].imag(ve[m].imag() + z.imag());`
			`v[m+n/2].real(ve[m].real() - z.real());`
			`v[m+n/2].imag(ve[m].imag() - z.imag());`
			`}`
			`}`
			`return;`
			`}`

Initial firmware commit. 2015-07-08 08:39:24 -07:00			`#endif/__DSP_FFT_H__/`