annotate mdct.c @ 10952:ea8f891d997d libavcodec

H264 DXVA2 implementation It allows VLD H264 decoding using DXVA2 (GPU assisted decoding API under VISTA and Windows 7). It is implemented by using AVHWAccel API. It has been tested successfully for some time in VLC using an nvidia card on Windows 7. To compile it, you need to have the system header dxva2api.h (either from microsoft or using http://downloads.videolan.org/pub/videolan/testing/contrib/dxva2api.h) The generated libavcodec.dll does not depend directly on any new lib as the necessary objects are given by the application using FFmpeg.
author fenrir
date Wed, 20 Jan 2010 18:54:51 +0000
parents 3d011a01a6a0
children 4b3da727d832
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
1 /*
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
2 * MDCT/IMDCT transforms
8629
04423b2f6e0b cosmetics: Remove pointless period after copyright statement non-sentences.
diego
parents: 8567
diff changeset
3 * Copyright (c) 2002 Fabrice Bellard
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
4 *
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
5 * This file is part of FFmpeg.
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
6 *
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
7 * FFmpeg is free software; you can redistribute it and/or
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
8 * modify it under the terms of the GNU Lesser General Public
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
9 * License as published by the Free Software Foundation; either
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
10 * version 2.1 of the License, or (at your option) any later version.
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
11 *
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
12 * FFmpeg is distributed in the hope that it will be useful,
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
15 * Lesser General Public License for more details.
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
16 *
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
17 * You should have received a copy of the GNU Lesser General Public
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3036
diff changeset
18 * License along with FFmpeg; if not, write to the Free Software
3036
0b546eab515d Update licensing information: The FSF changed postal address.
diego
parents: 2967
diff changeset
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
20 */
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
21 #include "dsputil.h"
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
22
1106
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
23 /**
8718
e9d9d946f213 Use full internal pathname in doxygen @file directives.
diego
parents: 8629
diff changeset
24 * @file libavcodec/mdct.c
1106
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
25 * MDCT/IMDCT transforms.
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
26 */
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
27
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
28 // Generate a Kaiser-Bessel Derived Window.
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
29 #define BESSEL_I0_ITER 50 // default: 50 iterations of Bessel I0 approximation
8737
eeca2fc122f8 Add av_cold attributes to *_init and *_end functions.
alexc
parents: 8718
diff changeset
30 av_cold void ff_kbd_window_init(float *window, float alpha, int n)
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
31 {
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
32 int i, j;
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
33 double sum = 0.0, bessel, tmp;
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
34 double local_window[n];
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
35 double alpha2 = (alpha * M_PI / n) * (alpha * M_PI / n);
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
36
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
37 for (i = 0; i < n; i++) {
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
38 tmp = i * (n - i) * alpha2;
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
39 bessel = 1.0;
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
40 for (j = BESSEL_I0_ITER; j > 0; j--)
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
41 bessel = bessel * tmp / (j * j) + 1;
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
42 sum += bessel;
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
43 local_window[i] = sum;
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
44 }
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
45
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
46 sum++;
6142
a35b838ab955 Add variable alpha and size of half window for Kaiser-Bessel Derived window
superdump
parents: 6139
diff changeset
47 for (i = 0; i < n; i++)
6139
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
48 window[i] = sqrt(local_window[i] / sum);
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
49 }
5077d1562573 Make the Kaiser-Bessel window generator a common function
andoma
parents: 3947
diff changeset
50
10827
3d011a01a6a0 Add support for hard-coded MDCT-related ff_sine_windows tables.
reimar
parents: 10204
diff changeset
51 #include "mdct_tablegen.h"
7094
b0820b8bd4dd Add generic ff_sine_window_init function and implement in codecs appropriately
superdump
parents: 6498
diff changeset
52
1106
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
53 /**
1e39f273ecd6 per file doxy
michaelni
parents: 970
diff changeset
54 * init MDCT or IMDCT computation.
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
55 */
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
56 av_cold int ff_mdct_init(FFTContext *s, int nbits, int inverse, double scale)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
57 {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
58 int n, n4, i;
9658
67a20f0eb42c Support for getting (i)MDCT output multiplied by a constant scaling factor.
serge
parents: 9480
diff changeset
59 double alpha, theta;
10204
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
60 int tstep;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
61
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
62 memset(s, 0, sizeof(*s));
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
63 n = 1 << nbits;
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
64 s->mdct_bits = nbits;
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
65 s->mdct_size = n;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
66 n4 = n >> 2;
10204
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
67 s->permutation = FF_MDCT_PERM_NONE;
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
68
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
69 if (ff_fft_init(s, s->mdct_bits - 2, inverse) < 0)
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
70 goto fail;
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
71
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
72 s->tcos = av_malloc(n/2 * sizeof(FFTSample));
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
73 if (!s->tcos)
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
74 goto fail;
10204
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
75
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
76 switch (s->permutation) {
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
77 case FF_MDCT_PERM_NONE:
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
78 s->tsin = s->tcos + n4;
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
79 tstep = 1;
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
80 break;
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
81 case FF_MDCT_PERM_INTERLEAVE:
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
82 s->tsin = s->tcos + 1;
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
83 tstep = 2;
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
84 break;
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
85 default:
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
86 goto fail;
10204
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
87 }
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
88
9658
67a20f0eb42c Support for getting (i)MDCT output multiplied by a constant scaling factor.
serge
parents: 9480
diff changeset
89 theta = 1.0 / 8.0 + (scale < 0 ? n4 : 0);
67a20f0eb42c Support for getting (i)MDCT output multiplied by a constant scaling factor.
serge
parents: 9480
diff changeset
90 scale = sqrt(fabs(scale));
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
91 for(i=0;i<n4;i++) {
9658
67a20f0eb42c Support for getting (i)MDCT output multiplied by a constant scaling factor.
serge
parents: 9480
diff changeset
92 alpha = 2 * M_PI * (i + theta) / n;
10204
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
93 s->tcos[i*tstep] = -cos(alpha) * scale;
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
94 s->tsin[i*tstep] = -sin(alpha) * scale;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
95 }
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
96 return 0;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
97 fail:
10204
db033d1fbf44 Allow arch-specific mdct code to request interleaving of cos/sin tables
mru
parents: 10199
diff changeset
98 ff_mdct_end(s);
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
99 return -1;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
100 }
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
101
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
/**
 * Complex multiplication: (pre + i*pim) = (are + i*aim) * (bre + i*bim).
 *
 * All four inputs are copied into FFTSample temporaries before either output
 * is assigned, so an output may name the same object as an input.
 *
 * The body is wrapped in do { } while (0) so that "CMUL(...);" is exactly one
 * statement and can be used as the unbraced branch of an if/else.
 */
#define CMUL(pre, pim, are, aim, bre, bim) \
do {\
    FFTSample _are = (are);\
    FFTSample _aim = (aim);\
    FFTSample _bre = (bre);\
    FFTSample _bim = (bim);\
    (pre) = _are * _bre - _aim * _bim;\
    (pim) = _are * _bim + _aim * _bre;\
} while (0)
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
112
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
113 /**
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
114 * Compute the middle half of the inverse MDCT of size N = 2^nbits,
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
115 * thus excluding the parts that can be derived by symmetry
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
116 * @param output N/2 samples
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
117 * @param input N/2 samples
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
118 */
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
119 void ff_imdct_half_c(FFTContext *s, FFTSample *output, const FFTSample *input)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
120 {
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
121 int k, n8, n4, n2, n, j;
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
122 const uint16_t *revtab = s->revtab;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
123 const FFTSample *tcos = s->tcos;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
124 const FFTSample *tsin = s->tsin;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
125 const FFTSample *in1, *in2;
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
126 FFTComplex *z = (FFTComplex *)output;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
127
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
128 n = 1 << s->mdct_bits;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
129 n2 = n >> 1;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
130 n4 = n >> 2;
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
131 n8 = n >> 3;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
132
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
133 /* pre rotation */
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
134 in1 = input;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
135 in2 = input + n2 - 1;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
136 for(k = 0; k < n4; k++) {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
137 j=revtab[k];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
138 CMUL(z[j].re, z[j].im, *in2, *in1, tcos[k], tsin[k]);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
139 in1 += 2;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
140 in2 -= 2;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
141 }
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
142 ff_fft_calc(s, z);
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
143
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
144 /* post rotation + reordering */
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
145 for(k = 0; k < n8; k++) {
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
146 FFTSample r0, i0, r1, i1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
147 CMUL(r0, i1, z[n8-k-1].im, z[n8-k-1].re, tsin[n8-k-1], tcos[n8-k-1]);
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
148 CMUL(r1, i0, z[n8+k ].im, z[n8+k ].re, tsin[n8+k ], tcos[n8+k ]);
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
149 z[n8-k-1].re = r0;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
150 z[n8-k-1].im = i0;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
151 z[n8+k ].re = r1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
152 z[n8+k ].im = i1;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
153 }
7263
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
154 }
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
155
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
156 /**
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
157 * Compute inverse MDCT of size N = 2^nbits
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
158 * @param output N samples
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
159 * @param input N/2 samples
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
160 */
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
161 void ff_imdct_calc_c(FFTContext *s, FFTSample *output, const FFTSample *input)
7263
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
162 {
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
163 int k;
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
164 int n = 1 << s->mdct_bits;
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
165 int n2 = n >> 1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
166 int n4 = n >> 2;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
167
7547
8226017a65ae mdct wrapper function to match fft
lorenm
parents: 7546
diff changeset
168 ff_imdct_half_c(s, output+n4, input);
7263
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
169
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
170 for(k = 0; k < n4; k++) {
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
171 output[k] = -output[n2-k-1];
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
172 output[n-k-1] = output[n2+k];
7263
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
173 }
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
174 }
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
175
fc843d00867c exploit mdct symmetry
lorenm
parents: 7094
diff changeset
176 /**
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
177 * Compute MDCT of size N = 2^nbits
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
178 * @param input N samples
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
179 * @param out N/2 samples
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
180 */
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
181 void ff_mdct_calc_c(FFTContext *s, FFTSample *out, const FFTSample *input)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
182 {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
183 int i, j, n, n8, n4, n2, n3;
7546
97383e012cb9 remove mdct tmp buffer
lorenm
parents: 7545
diff changeset
184 FFTSample re, im;
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
185 const uint16_t *revtab = s->revtab;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
186 const FFTSample *tcos = s->tcos;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
187 const FFTSample *tsin = s->tsin;
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
188 FFTComplex *x = (FFTComplex *)out;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
189
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
190 n = 1 << s->mdct_bits;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
191 n2 = n >> 1;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
192 n4 = n >> 2;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
193 n8 = n >> 3;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
194 n3 = 3 * n4;
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
195
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
196 /* pre rotation */
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
197 for(i=0;i<n8;i++) {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
198 re = -input[2*i+3*n4] - input[n3-1-2*i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
199 im = -input[n4+2*i] + input[n4-1-2*i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
200 j = revtab[i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
201 CMUL(x[j].re, x[j].im, re, im, -tcos[i], tsin[i]);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
202
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
203 re = input[2*i] - input[n2-1-2*i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
204 im = -(input[n2+2*i] + input[n-1-2*i]);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
205 j = revtab[n8 + i];
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
206 CMUL(x[j].re, x[j].im, re, im, -tcos[n8 + i], tsin[n8 + i]);
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
207 }
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
208
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
209 ff_fft_calc(s, x);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 1879
diff changeset
210
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
211 /* post rotation */
7544
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
212 for(i=0;i<n8;i++) {
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
213 FFTSample r0, i0, r1, i1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
214 CMUL(i1, r0, x[n8-i-1].re, x[n8-i-1].im, -tsin[n8-i-1], -tcos[n8-i-1]);
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
215 CMUL(i0, r1, x[n8+i ].re, x[n8+i ].im, -tsin[n8+i ], -tcos[n8+i ]);
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
216 x[n8-i-1].re = r0;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
217 x[n8-i-1].im = i0;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
218 x[n8+i ].re = r1;
ee1cb5ab9f99 optimize imdct_half:
lorenm
parents: 7263
diff changeset
219 x[n8+i ].im = i1;
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
220 }
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
221 }
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
222
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
223 av_cold void ff_mdct_end(FFTContext *s)
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
224 {
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
225 av_freep(&s->tcos);
10199
38ab367d4231 Merge FFTContext and MDCTContext
mru
parents: 10174
diff changeset
226 ff_fft_end(s);
781
6f5e87957bcb new generic FFT/MDCT code for audio codecs
bellard
parents:
diff changeset
227 }