sof/src/math/fft/fft_16.c at ca0d3afe2872614aaa32656539e6073ef3fb5479 · thesofproject/sof · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
// SPDX-License-Identifier: BSD-3-Clause
//
// Copyright(c) 2020 Intel Corporation. All rights reserved.
//
// Author: Amery Song <chao.song@intel.com>
//	   Keyon Jie <yang.jie@linux.intel.com>

#include <sof/audio/format.h>
#include <sof/common.h>
#include <sof/math/fft.h>

#ifdef FFT_GENERIC

/*
 * Helpers for 16 bit FFT calculation
 */
static inline void icomplex16_add(const struct icomplex16 *in1, const struct icomplex16 *in2,
				  struct icomplex16 *out)
{
	out->real = in1->real + in2->real;
	out->imag = in1->imag + in2->imag;
}

static inline void icomplex16_sub(const struct icomplex16 *in1, const struct icomplex16 *in2,
				  struct icomplex16 *out)
{
	out->real = in1->real - in2->real;
	out->imag = in1->imag - in2->imag;
}

static inline void icomplex16_mul(const struct icomplex16 *in1, const struct icomplex16 *in2,
				  struct icomplex16 *out)
{
	int32_t real = (int32_t)in1->real * in2->real - (int32_t)in1->imag * in2->imag;
	int32_t imag = (int32_t)in1->real * in2->imag + (int32_t)in1->imag * in2->real;

	out->real = Q_SHIFT_RND(real, 30, 15);
	out->imag = Q_SHIFT_RND(imag, 30, 15);
}

/* complex conjugate */
static inline void icomplex16_conj(struct icomplex16 *comp)
{
	comp->imag = sat_int16(-((int32_t)comp->imag));
}

/* shift a complex n bits, n > 0: left shift, n < 0: right shift */
static inline void icomplex16_shift(const struct icomplex16 *input, int16_t n,
				    struct icomplex16 *output)
{
	int n1, n2;

	if (n >= 0) {
		/* need saturation handling */
		output->real = sat_int16((int32_t)input->real << n);
		output->imag = sat_int16((int32_t)input->imag << n);
	} else {
		n1 = -n;
		n2 = 1 << (n1 - 1);
		output->real = sat_int16(((int32_t)input->real + n2) >> n1);
		output->imag = sat_int16(((int32_t)input->imag  + n2) >> n1);
	}
}

/**
 * \brief Execute the 16-bits Fast Fourier Transform (FFT) or Inverse FFT (IFFT)
 *	  For the configured fft_pan.
 * \param[in] plan - pointer to fft_plan which will be executed.
 * \param[in] ifft - set to 1 for IFFT and 0 for FFT.
 */
void fft_execute_16(struct fft_plan *plan, bool ifft)
{
	struct icomplex16 tmp1;
	struct icomplex16 tmp2;
	struct icomplex16 *inb;
	struct icomplex16 *outb;
	struct icomplex16 *twiddle;
	int depth;
	int top;
	int bottom;
	int index;
	int i;
	int j;
	int k;
	int m;
	int n;

	if (!plan || !plan->bit_reverse_idx)
		return;

	inb = plan->inb16;
	outb = plan->outb16;
	if (!inb || !outb)
		return;

	/* convert to complex conjugate for ifft */
	if (ifft) {
		for (i = 0; i < plan->size; i++)
			icomplex16_conj(&inb[i]);
	}

	/* step 1: re-arrange input in bit reverse order, and shrink the level to avoid overflow */
	for (i = 1; i < plan->size; ++i)
		icomplex16_shift(&inb[i], -(plan->len), &outb[plan->bit_reverse_idx[i]]);

	/* step 2: loop to do FFT transform in smaller size */
	twiddle = plan->twiddle;
	for (depth = 1; depth <= plan->len; ++depth) {
		m = 1 << depth;
		n = m >> 1;
		i = plan->size >> depth;

		/* doing FFT transforms in size m */
		for (k = 0; k < plan->size; k += m) {
			/* doing one FFT transform for size m */
			for (j = 0; j < n; ++j) {
				index = i * j;
				top = k + j;
				bottom = top + n;
				tmp1 = twiddle[index];
				/* calculate the accumulator: twiddle * bottom */
				icomplex16_mul(&tmp1, &outb[bottom], &tmp2);
				tmp1 = outb[top];
				/* calculate the top output: top = top + accumulate */
				icomplex16_add(&tmp1, &tmp2, &outb[top]);
				/* calculate the bottom output: bottom = top - accumulate */
				icomplex16_sub(&tmp1, &tmp2, &outb[bottom]);
			}
		}
	}

	/* shift back for ifft */
	if (ifft) {
		/*
		 * no need to divide N as it is already done in the input side
		 * for Q1.31 format. Instead, we need to multiply N to compensate
		 * the shrink we did in the FFT transform.
		 */
		for (i = 0; i < plan->size; i++)
			icomplex16_shift(&outb[i], plan->len, &outb[i]);
	}
}
#endif