libavcodec.hg: wmadec.c comparison

comparison wmadec.c @ 3592:6a358dccf2ab libavcodec

SIMD vector optimizations. 3% faster overall decoding.

author	banan
date	Sat, 19 Aug 2006 08:46:52 +0000
parents	5ea82888103e
children	e28285ddde8d

comparison

equal deleted inserted replaced

-:088be7d7c4fd
+:6a358dccf2ab
 /* lsp_to_curve tables */
 float lsp_cos_table[BLOCK_MAX_SIZE];
 float lsp_pow_e_table[256];
 float lsp_pow_m_table1[(1 << LSP_POW_BITS)];
 float lsp_pow_m_table2[(1 << LSP_POW_BITS)];
+DSPContext dsp;
 #ifdef TRACE
 int frame_count;
 #endif
 } WMADecodeContext;
 s->sample_rate = avctx->sample_rate;
 s->nb_channels = avctx->channels;
 s->bit_rate = avctx->bit_rate;
 s->block_align = avctx->block_align;
+dsputil_init(&s->dsp, avctx);
 if (avctx->codec->id == CODEC_ID_WMAV1) {
 s->version = 1;
 } else {
 s->version = 2;
 for(ch = 0; ch < s->nb_channels; ch++) {
 if (s->channel_coded[ch]) {
 DECLARE_ALIGNED_16(FFTSample, output[BLOCK_MAX_SIZE * 2]);
 float *ptr;
-int i, n4, index, n;
+int n4, index, n;
 n = s->block_len;
 n4 = s->block_len / 2;
 s->mdct_ctx[bsize].fft.imdct_calc(&s->mdct_ctx[bsize],
 output, s->coefs[ch], s->mdct_tmp);
 /* XXX: optimize all that by building the window and
 multiplying/adding at the same time */
-/* multiply by the window */
-for(i=0;i<n * 2;i++) {
+/* multiply by the window and add in the frame */
-output[i] *= window[i];
-}
-/* add in the frame */
 index = (s->frame_len / 2) + s->block_pos - n4;
 ptr = &s->frame_out[ch][index];
-for(i=0;i<n * 2;i++) {
+s->dsp.vector_fmul_add_add(ptr,window,output,ptr,0,2*n,1);
-*ptr += output[i];
-ptr++;
-}
 /* specific fast case for ms-stereo : add to second
 channel if it is not coded */
 if (s->ms_stereo && !s->channel_coded[1]) {
 ptr = &s->frame_out[1][index];
-for(i=0;i<n * 2;i++) {
+s->dsp.vector_fmul_add_add(ptr,window,output,ptr,0,2*n,1);
-*ptr += output[i];
-ptr++;
-}
 }
 }
 }
 next:
 /* update block number */

Mercurial > libavcodec.hg

comparison wmadec.c @ 3592:6a358dccf2ab libavcodec