annotate mdct.c @ 9658:67a20f0eb42c libavcodec

Support for getting (i)MDCT output multiplied by a constant scaling factor. Scaling the (i)MDCT output has no runtime overhead and can be used to improve the performance of audio codecs. All the changes are confined to the 'ff_mdct_init' function and slow down initialization slightly.
author serge
date Sat, 16 May 2009 14:17:08 +0000
parents d527872fdf26
children 50ec8930f99e
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
1 /*
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
2 * MDCT/IMDCT transforms
8629
04423b2f6e0b cosmetics: Remove pointless period after copyright statement non-sentences.
diego
parents: 8567
diff changeset
3 * Copyright (c) 2002 Fabrice Bellard
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
4 *
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
5 * This file is part of FFmpeg.
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
6 *
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
7 * FFmpeg is free software; you can redistribute it and/or
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
8 * modify it under the terms of the GNU Lesser General Public
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
9 * License as published by the Free Software Foundation; either
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
10 * version 2.1 of the License, or (at your option) any later version.
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
11 *
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
12 * FFmpeg is distributed in the hope that it will be useful,
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
15 * Lesser General Public License for more details.
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
16 *
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
17 * You should have received a copy of the GNU Lesser General Public
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
18 * License along with FFmpeg; if not, write to the Free Software
3036
0b546eab515d Update licensing information: The FSF changed postal address.
diego
parents: 2967
diff changeset
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
20 */
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
21 #include "dsputil.h"
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
22
1106
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
23 /**
8718
e9d9d946f213 Use full internal pathname in doxygen @file directives.
diego
parents: 8629
diff changeset
24 * @file libavcodec/mdct.c
1106
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
25 * MDCT/IMDCT transforms.
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
26 */
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
27
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
28 // Generate a Kaiser-Bessel Derived Window.
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
29 #define BESSEL_I0_ITER 50 // default: 50 iterations of Bessel I0 approximation
8737
eeca2fc122f8 Add av_cold attributes to *_init and *_end functions.
alexc
parents: 8718
diff changeset
30 av_cold void ff_kbd_window_init(float *window, float alpha, int n)
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
31 {
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
32 int i, j;
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
33 double sum = 0.0, bessel, tmp;
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
34 double local_window[n];
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
35 double alpha2 = (alpha * M_PI / n) * (alpha * M_PI / n);
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
36
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
37 for (i = 0; i < n; i++) {
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
38 tmp = i * (n - i) * alpha2;
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
39 bessel = 1.0;
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
40 for (j = BESSEL_I0_ITER; j > 0; j--)
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
41 bessel = bessel * tmp / (j * j) + 1;
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
42 sum += bessel;
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
43 local_window[i] = sum;
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
44 }
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
45
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
46 sum++;
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
47 for (i = 0; i < n; i++)
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
48 window[i] = sqrt(local_window[i] / sum);
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
49 }
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
50
7577
ed956c3c2cf3 The ff_sine_#[] should be aligned as they will commonly be used in dsputil
superdump
parents: 7573
diff changeset
51 DECLARE_ALIGNED(16, float, ff_sine_128 [ 128]);
ed956c3c2cf3 The ff_sine_#[] should be aligned as they will commonly be used in dsputil
superdump
parents: 7573
diff changeset
52 DECLARE_ALIGNED(16, float, ff_sine_256 [ 256]);
ed956c3c2cf3 The ff_sine_#[] should be aligned as they will commonly be used in dsputil
superdump
parents: 7573
diff changeset
53 DECLARE_ALIGNED(16, float, ff_sine_512 [ 512]);
ed956c3c2cf3 The ff_sine_#[] should be aligned as they will commonly be used in dsputil
superdump
parents: 7573
diff changeset
54 DECLARE_ALIGNED(16, float, ff_sine_1024[1024]);
ed956c3c2cf3 The ff_sine_#[] should be aligned as they will commonly be used in dsputil
superdump
parents: 7573
diff changeset
55 DECLARE_ALIGNED(16, float, ff_sine_2048[2048]);
8567
0d5b2b0e7a87 Add size that is needed for the wmapro codec
banan
parents: 7822
diff changeset
56 DECLARE_ALIGNED(16, float, ff_sine_4096[4096]);
0d5b2b0e7a87 Add size that is needed for the wmapro codec
banan
parents: 7822
diff changeset
57 float *ff_sine_windows[6] = {
0d5b2b0e7a87 Add size that is needed for the wmapro codec
banan
parents: 7822
diff changeset
58 ff_sine_128, ff_sine_256, ff_sine_512, ff_sine_1024, ff_sine_2048, ff_sine_4096
7573
7802295cae6f Add declarations for the sine tables used in wma.c (half window sizes: 128,
superdump
parents: 7547
diff changeset
59 };
7802295cae6f Add declarations for the sine tables used in wma.c (half window sizes: 128,
superdump
parents: 7547
diff changeset
60
7094
b0820b8bd4dd Add generic ff_sine_window_init function and implement in codecs appropriately
superdump
parents: 6498
diff changeset
61 // Generate a sine window.
8737
eeca2fc122f8 Add av_cold attributes to *_init and *_end functions.
alexc
parents: 8718
diff changeset
62 av_cold void ff_sine_window_init(float *window, int n) {
7094
b0820b8bd4dd Add generic ff_sine_window_init function and implement in codecs appropriately
superdump
parents: 6498
diff changeset
63 int i;
b0820b8bd4dd Add generic ff_sine_window_init function and implement in codecs appropriately
superdump
parents: 6498
diff changeset
64 for(i = 0; i < n; i++)
7822
67cfe4983e6d Try to fix wma regression.
michael
parents: 7699
diff changeset
65 window[i] = sinf((i + 0.5) * (M_PI / (2.0 * n)));
7094
b0820b8bd4dd Add generic ff_sine_window_init function and implement in codecs appropriately
superdump
parents: 6498
diff changeset
66 }
b0820b8bd4dd Add generic ff_sine_window_init function and implement in codecs appropriately
superdump
parents: 6498
diff changeset
67
1106
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
68 /**
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
69 * init MDCT or IMDCT computation.
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
70 */
9658
67a20f0eb42c Support for getting (i)MDCT output multiplied by a constant scaling factor.
serge
parents: 9480
diff changeset
71 av_cold int ff_mdct_init(MDCTContext *s, int nbits, int inverse, double scale)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
72 {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
73 int n, n4, i;
9658
67a20f0eb42c Support for getting (i)MDCT output multiplied by a constant scaling factor.
serge
parents: 9480
diff changeset
74 double alpha, theta;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
75
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
76 memset(s, 0, sizeof(*s));
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
77 n = 1 << nbits;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
78 s->nbits = nbits;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
79 s->n = n;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
80 n4 = n >> 2;
970
a521e0ecc5a8 use av_malloc instead of malloc
bellard
parents: 794
diff changeset
81 s->tcos = av_malloc(n4 * sizeof(FFTSample));
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
82 if (!s->tcos)
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
83 goto fail;
970
a521e0ecc5a8 use av_malloc instead of malloc
bellard
parents: 794
diff changeset
84 s->tsin = av_malloc(n4 * sizeof(FFTSample));
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
85 if (!s->tsin)
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
86 goto fail;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
87
9658
67a20f0eb42c Support for getting (i)MDCT output multiplied by a constant scaling factor.
serge
parents: 9480
diff changeset
88 theta = 1.0 / 8.0 + (scale < 0 ? n4 : 0);
67a20f0eb42c Support for getting (i)MDCT output multiplied by a constant scaling factor.
serge
parents: 9480
diff changeset
89 scale = sqrt(fabs(scale));
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
90 for(i=0;i<n4;i++) {
9658
67a20f0eb42c Support for getting (i)MDCT output multiplied by a constant scaling factor.
serge
parents: 9480
diff changeset
91 alpha = 2 * M_PI * (i + theta) / n;
67a20f0eb42c Support for getting (i)MDCT output multiplied by a constant scaling factor.
serge
parents: 9480
diff changeset
92 s->tcos[i] = -cos(alpha) * scale;
67a20f0eb42c Support for getting (i)MDCT output multiplied by a constant scaling factor.
serge
parents: 9480
diff changeset
93 s->tsin[i] = -sin(alpha) * scale;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
94 }
1879
dd63cb7e5080 fft_*() renamed into ff_fft_*() patch by (Gildas Bazin <gbazin at altern dot org>)
michael
parents: 1106
diff changeset
95 if (ff_fft_init(&s->fft, s->nbits - 2, inverse) < 0)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
96 goto fail;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
97 return 0;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
98 fail:
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
99 av_freep(&s->tcos);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
100 av_freep(&s->tsin);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
101 return -1;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
102 }
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
103
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
/*
 * complex multiplication: p = a * b
 *
 * All four inputs are copied into temporaries before either output is
 * written, so pre/pim may name the same objects as the inputs.
 * Wrapped in do { } while (0) so that "CMUL(...);" is a single statement and
 * can be used safely as the body of an if/else.
 */
#define CMUL(pre, pim, are, aim, bre, bim) \
do {\
    FFTSample _are = (are);\
    FFTSample _aim = (aim);\
    FFTSample _bre = (bre);\
    FFTSample _bim = (bim);\
    (pre) = _are * _bre - _aim * _bim;\
    (pim) = _are * _bim + _aim * _bre;\
} while (0)
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
114
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
115 /**
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
116 * Compute the middle half of the inverse MDCT of size N = 2^nbits,
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
117 * thus excluding the parts that can be derived by symmetry
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
118 * @param output N/2 samples
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
119 * @param input N/2 samples
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
120 */
7547
8226017a65ae mdct wrapper function to match fft
lorenm
parents: 7546
diff changeset
121 void ff_imdct_half_c(MDCTContext *s, FFTSample *output, const FFTSample *input)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
122 {
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
123 int k, n8, n4, n2, n, j;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
124 const uint16_t *revtab = s->fft.revtab;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
125 const FFTSample *tcos = s->tcos;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
126 const FFTSample *tsin = s->tsin;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
127 const FFTSample *in1, *in2;
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
128 FFTComplex *z = (FFTComplex *)output;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
129
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
130 n = 1 << s->nbits;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
131 n2 = n >> 1;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
132 n4 = n >> 2;
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
133 n8 = n >> 3;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
134
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
135 /* pre rotation */
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
136 in1 = input;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
137 in2 = input + n2 - 1;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
138 for(k = 0; k < n4; k++) {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
139 j=revtab[k];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
140 CMUL(z[j].re, z[j].im, *in2, *in1, tcos[k], tsin[k]);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
141 in1 += 2;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
142 in2 -= 2;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
143 }
1879
dd63cb7e5080 fft_*() renamed into ff_fft_*() patch by (Gildas Bazin <gbazin at altern dot org>)
michael
parents: 1106
diff changeset
144 ff_fft_calc(&s->fft, z);
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
145
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
146 /* post rotation + reordering */
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
147 for(k = 0; k < n8; k++) {
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
148 FFTSample r0, i0, r1, i1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
149 CMUL(r0, i1, z[n8-k-1].im, z[n8-k-1].re, tsin[n8-k-1], tcos[n8-k-1]);
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
150 CMUL(r1, i0, z[n8+k ].im, z[n8+k ].re, tsin[n8+k ], tcos[n8+k ]);
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
151 z[n8-k-1].re = r0;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
152 z[n8-k-1].im = i0;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
153 z[n8+k ].re = r1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
154 z[n8+k ].im = i1;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
155 }
7263
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
156 }
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
157
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
158 /**
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
159 * Compute inverse MDCT of size N = 2^nbits
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
160 * @param output N samples
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
161 * @param input N/2 samples
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
162 */
7547
8226017a65ae mdct wrapper function to match fft
lorenm
parents: 7546
diff changeset
163 void ff_imdct_calc_c(MDCTContext *s, FFTSample *output, const FFTSample *input)
7263
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
164 {
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
165 int k;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
166 int n = 1 << s->nbits;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
167 int n2 = n >> 1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
168 int n4 = n >> 2;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
169
7547
8226017a65ae mdct wrapper function to match fft
lorenm
parents: 7546
diff changeset
170 ff_imdct_half_c(s, output+n4, input);
7263
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
171
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
172 for(k = 0; k < n4; k++) {
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
173 output[k] = -output[n2-k-1];
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
174 output[n-k-1] = output[n2+k];
7263
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
175 }
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
176 }
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
177
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
178 /**
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
179 * Compute MDCT of size N = 2^nbits
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
180 * @param input N samples
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
181 * @param out N/2 samples
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
182 */
7546
97383e012cb9 remove mdct tmp buffer
lorenm
parents: 7545
diff changeset
183 void ff_mdct_calc(MDCTContext *s, FFTSample *out, const FFTSample *input)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
184 {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
185 int i, j, n, n8, n4, n2, n3;
7546
97383e012cb9 remove mdct tmp buffer
lorenm
parents: 7545
diff changeset
186 FFTSample re, im;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
187 const uint16_t *revtab = s->fft.revtab;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
188 const FFTSample *tcos = s->tcos;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
189 const FFTSample *tsin = s->tsin;
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
190 FFTComplex *x = (FFTComplex *)out;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
191
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
192 n = 1 << s->nbits;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
193 n2 = n >> 1;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
194 n4 = n >> 2;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
195 n8 = n >> 3;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
196 n3 = 3 * n4;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
197
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
198 /* pre rotation */
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
199 for(i=0;i<n8;i++) {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
200 re = -input[2*i+3*n4] - input[n3-1-2*i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
201 im = -input[n4+2*i] + input[n4-1-2*i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
202 j = revtab[i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
203 CMUL(x[j].re, x[j].im, re, im, -tcos[i], tsin[i]);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
204
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
205 re = input[2*i] - input[n2-1-2*i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
206 im = -(input[n2+2*i] + input[n-1-2*i]);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
207 j = revtab[n8 + i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
208 CMUL(x[j].re, x[j].im, re, im, -tcos[n8 + i], tsin[n8 + i]);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
209 }
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
210
1879
dd63cb7e5080 fft_*() renamed into ff_fft_*() patch by (Gildas Bazin <gbazin at altern dot org>)
michael
parents: 1106
diff changeset
211 ff_fft_calc(&s->fft, x);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 1879
diff changeset
212
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
213 /* post rotation */
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
214 for(i=0;i<n8;i++) {
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
215 FFTSample r0, i0, r1, i1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
216 CMUL(i1, r0, x[n8-i-1].re, x[n8-i-1].im, -tsin[n8-i-1], -tcos[n8-i-1]);
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
217 CMUL(i0, r1, x[n8+i ].re, x[n8+i ].im, -tsin[n8+i ], -tcos[n8+i ]);
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
218 x[n8-i-1].re = r0;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
219 x[n8-i-1].im = i0;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
220 x[n8+i ].re = r1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
221 x[n8+i ].im = i1;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
222 }
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
223 }
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
224
8737
eeca2fc122f8 Add av_cold attributes to *_init and *_end functions.
alexc
parents: 8718
diff changeset
225 av_cold void ff_mdct_end(MDCTContext *s)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
226 {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
227 av_freep(&s->tcos);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
228 av_freep(&s->tsin);
1879
dd63cb7e5080 fft_*() renamed into ff_fft_*() patch by (Gildas Bazin <gbazin at altern dot org>)
michael
parents: 1106
diff changeset
229 ff_fft_end(&s->fft);
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
230 }