annotate mdct.c @ 7545:2dca9201c400 libavcodec

remove a float->double->float conversion. 1.8x faster imdct_c with fpmath=sse, no change with x87
author lorenm
date Tue, 12 Aug 2008 00:34:08 +0000
parents ee1cb5ab9f99
children 97383e012cb9
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
1 /*
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
2 * MDCT/IMDCT transforms
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
3 * Copyright (c) 2002 Fabrice Bellard.
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
4 *
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
5 * This file is part of FFmpeg.
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
6 *
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
7 * FFmpeg is free software; you can redistribute it and/or
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
8 * modify it under the terms of the GNU Lesser General Public
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
9 * License as published by the Free Software Foundation; either
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
10 * version 2.1 of the License, or (at your option) any later version.
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
11 *
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
12 * FFmpeg is distributed in the hope that it will be useful,
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
15 * Lesser General Public License for more details.
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
16 *
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
17 * You should have received a copy of the GNU Lesser General Public
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
18 * License along with FFmpeg; if not, write to the Free Software
3036
0b546eab515d Update licensing information: The FSF changed postal address.
diego
parents: 2967
diff changeset
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
20 */
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
21 #include "dsputil.h"
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
22
1106
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
23 /**
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
24 * @file mdct.c
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
25 * MDCT/IMDCT transforms.
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
26 */
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
27
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
28 // Generate a Kaiser-Bessel Derived Window.
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
29 #define BESSEL_I0_ITER 50 // default: 50 iterations of Bessel I0 approximation
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
30 void ff_kbd_window_init(float *window, float alpha, int n)
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
31 {
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
32 int i, j;
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
33 double sum = 0.0, bessel, tmp;
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
34 double local_window[n];
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
35 double alpha2 = (alpha * M_PI / n) * (alpha * M_PI / n);
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
36
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
37 for (i = 0; i < n; i++) {
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
38 tmp = i * (n - i) * alpha2;
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
39 bessel = 1.0;
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
40 for (j = BESSEL_I0_ITER; j > 0; j--)
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
41 bessel = bessel * tmp / (j * j) + 1;
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
42 sum += bessel;
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
43 local_window[i] = sum;
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
44 }
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
45
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
46 sum++;
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
47 for (i = 0; i < n; i++)
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
48 window[i] = sqrt(local_window[i] / sum);
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
49 }
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
50
7094
b0820b8bd4dd Add generic ff_sine_window_init function and implement in codecs appropriately
superdump
parents: 6498
diff changeset
51 // Generate a sine window.
b0820b8bd4dd Add generic ff_sine_window_init function and implement in codecs appropriately
superdump
parents: 6498
diff changeset
52 void ff_sine_window_init(float *window, int n) {
b0820b8bd4dd Add generic ff_sine_window_init function and implement in codecs appropriately
superdump
parents: 6498
diff changeset
53 int i;
b0820b8bd4dd Add generic ff_sine_window_init function and implement in codecs appropriately
superdump
parents: 6498
diff changeset
54 for(i = 0; i < n; i++)
b0820b8bd4dd Add generic ff_sine_window_init function and implement in codecs appropriately
superdump
parents: 6498
diff changeset
55 window[i] = sin((i + 0.5) / (2 * n) * M_PI);
b0820b8bd4dd Add generic ff_sine_window_init function and implement in codecs appropriately
superdump
parents: 6498
diff changeset
56 }
b0820b8bd4dd Add generic ff_sine_window_init function and implement in codecs appropriately
superdump
parents: 6498
diff changeset
57
1106
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
58 /**
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
59 * init MDCT or IMDCT computation.
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
60 */
794
670009af4fc2 avoid name clash
bellard
parents: 781
diff changeset
61 int ff_mdct_init(MDCTContext *s, int nbits, int inverse)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
62 {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
63 int n, n4, i;
6498
d9c48a85fd23 improve precision in mdct.c using double for some temporaries
mru
parents: 6142
diff changeset
64 double alpha;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
65
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
66 memset(s, 0, sizeof(*s));
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
67 n = 1 << nbits;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
68 s->nbits = nbits;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
69 s->n = n;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
70 n4 = n >> 2;
970
a521e0ecc5a8 use av_malloc instead of malloc
bellard
parents: 794
diff changeset
71 s->tcos = av_malloc(n4 * sizeof(FFTSample));
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
72 if (!s->tcos)
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
73 goto fail;
970
a521e0ecc5a8 use av_malloc instead of malloc
bellard
parents: 794
diff changeset
74 s->tsin = av_malloc(n4 * sizeof(FFTSample));
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
75 if (!s->tsin)
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
76 goto fail;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
77
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
78 for(i=0;i<n4;i++) {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
79 alpha = 2 * M_PI * (i + 1.0 / 8.0) / n;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
80 s->tcos[i] = -cos(alpha);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
81 s->tsin[i] = -sin(alpha);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
82 }
1879
dd63cb7e5080 fft_*() renamed into ff_fft_*() patch by (Gildas Bazin <gbazin at altern dot org>)
michael
parents: 1106
diff changeset
83 if (ff_fft_init(&s->fft, s->nbits - 2, inverse) < 0)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
84 goto fail;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
85 return 0;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
86 fail:
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
87 av_freep(&s->tcos);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
88 av_freep(&s->tsin);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
89 return -1;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
90 }
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
91
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
/* complex multiplication: p = a * b
 *
 * (pre, pim) receive the real and imaginary part of
 * (are + i*aim) * (bre + i*bim). All four inputs are copied into FFTSample
 * temporaries before anything is stored, so the outputs may name the same
 * objects as the inputs. The do/while(0) wrapper makes the expansion a
 * single statement, so "CMUL(...);" is safe in an unbraced if/else. */
#define CMUL(pre, pim, are, aim, bre, bim) \
do {\
    FFTSample cmul_are = (are);\
    FFTSample cmul_aim = (aim);\
    FFTSample cmul_bre = (bre);\
    FFTSample cmul_bim = (bim);\
    (pre) = cmul_are * cmul_bre - cmul_aim * cmul_bim;\
    (pim) = cmul_are * cmul_bim + cmul_aim * cmul_bre;\
} while (0)
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
102
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
103 /**
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
104 * Compute the middle half of the inverse MDCT of size N = 2^nbits,
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
105 * thus excluding the parts that can be derived by symmetry
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
106 * @param output N/2 samples
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
107 * @param input N/2 samples
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
108 */
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
109 void ff_imdct_half(MDCTContext *s, FFTSample *output, const FFTSample *input)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
110 {
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
111 int k, n8, n4, n2, n, j;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
112 const uint16_t *revtab = s->fft.revtab;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
113 const FFTSample *tcos = s->tcos;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
114 const FFTSample *tsin = s->tsin;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
115 const FFTSample *in1, *in2;
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
116 FFTComplex *z = (FFTComplex *)output;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
117
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
118 n = 1 << s->nbits;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
119 n2 = n >> 1;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
120 n4 = n >> 2;
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
121 n8 = n >> 3;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
122
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
123 /* pre rotation */
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
124 in1 = input;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
125 in2 = input + n2 - 1;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
126 for(k = 0; k < n4; k++) {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
127 j=revtab[k];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
128 CMUL(z[j].re, z[j].im, *in2, *in1, tcos[k], tsin[k]);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
129 in1 += 2;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
130 in2 -= 2;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
131 }
1879
dd63cb7e5080 fft_*() renamed into ff_fft_*() patch by (Gildas Bazin <gbazin at altern dot org>)
michael
parents: 1106
diff changeset
132 ff_fft_calc(&s->fft, z);
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
133
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
134 /* post rotation + reordering */
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
135 output += n4;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
136 for(k = 0; k < n8; k++) {
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
137 FFTSample r0, i0, r1, i1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
138 CMUL(r0, i1, z[n8-k-1].im, z[n8-k-1].re, tsin[n8-k-1], tcos[n8-k-1]);
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
139 CMUL(r1, i0, z[n8+k ].im, z[n8+k ].re, tsin[n8+k ], tcos[n8+k ]);
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
140 z[n8-k-1].re = r0;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
141 z[n8-k-1].im = i0;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
142 z[n8+k ].re = r1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
143 z[n8+k ].im = i1;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
144 }
7263
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
145 }
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
146
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
147 /**
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
148 * Compute inverse MDCT of size N = 2^nbits
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
149 * @param output N samples
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
150 * @param input N/2 samples
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
151 * @param tmp N/2 samples
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
152 */
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
153 void ff_imdct_calc(MDCTContext *s, FFTSample *output,
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
154 const FFTSample *input, FFTSample *tmp)
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
155 {
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
156 int k;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
157 int n = 1 << s->nbits;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
158 int n2 = n >> 1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
159 int n4 = n >> 2;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
160
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
161 ff_imdct_half(s, output+n4, input);
7263
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
162
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
163 for(k = 0; k < n4; k++) {
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
164 output[k] = -output[n2-k-1];
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
165 output[n-k-1] = output[n2+k];
7263
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
166 }
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
167 }
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
168
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
169 /**
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
170 * Compute MDCT of size N = 2^nbits
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
171 * @param input N samples
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
172 * @param out N/2 samples
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
173 * @param tmp temporary storage of N/2 samples
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
174 */
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 1879
diff changeset
175 void ff_mdct_calc(MDCTContext *s, FFTSample *out,
794
670009af4fc2 avoid name clash
bellard
parents: 781
diff changeset
176 const FFTSample *input, FFTSample *tmp)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
177 {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
178 int i, j, n, n8, n4, n2, n3;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
179 FFTSample re, im, re1, im1;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
180 const uint16_t *revtab = s->fft.revtab;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
181 const FFTSample *tcos = s->tcos;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
182 const FFTSample *tsin = s->tsin;
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
183 FFTComplex *x = (FFTComplex *)out;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
184
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
185 n = 1 << s->nbits;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
186 n2 = n >> 1;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
187 n4 = n >> 2;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
188 n8 = n >> 3;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
189 n3 = 3 * n4;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
190
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
191 /* pre rotation */
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
192 for(i=0;i<n8;i++) {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
193 re = -input[2*i+3*n4] - input[n3-1-2*i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
194 im = -input[n4+2*i] + input[n4-1-2*i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
195 j = revtab[i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
196 CMUL(x[j].re, x[j].im, re, im, -tcos[i], tsin[i]);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
197
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
198 re = input[2*i] - input[n2-1-2*i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
199 im = -(input[n2+2*i] + input[n-1-2*i]);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
200 j = revtab[n8 + i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
201 CMUL(x[j].re, x[j].im, re, im, -tcos[n8 + i], tsin[n8 + i]);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
202 }
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
203
1879
dd63cb7e5080 fft_*() renamed into ff_fft_*() patch by (Gildas Bazin <gbazin at altern dot org>)
michael
parents: 1106
diff changeset
204 ff_fft_calc(&s->fft, x);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 1879
diff changeset
205
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
206 /* post rotation */
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
207 for(i=0;i<n8;i++) {
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
208 FFTSample r0, i0, r1, i1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
209 CMUL(i1, r0, x[n8-i-1].re, x[n8-i-1].im, -tsin[n8-i-1], -tcos[n8-i-1]);
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
210 CMUL(i0, r1, x[n8+i ].re, x[n8+i ].im, -tsin[n8+i ], -tcos[n8+i ]);
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
211 x[n8-i-1].re = r0;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
212 x[n8-i-1].im = i0;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
213 x[n8+i ].re = r1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
214 x[n8+i ].im = i1;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
215 }
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
216 }
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
217
794
670009af4fc2 avoid name clash
bellard
parents: 781
diff changeset
218 void ff_mdct_end(MDCTContext *s)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
219 {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
220 av_freep(&s->tcos);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
221 av_freep(&s->tsin);
1879
dd63cb7e5080 fft_*() renamed into ff_fft_*() patch by (Gildas Bazin <gbazin at altern dot org>)
michael
parents: 1106
diff changeset
222 ff_fft_end(&s->fft);
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
223 }