libavcodec.hg: wmadec.c comparison

comparison wmadec.c @ 4301:b43bd0c56eaa libavcodec

Bug fix for crashes when SSE is used on unaligned arrays. No measurable change in speed. This gave random crashes on Win32 and BeOS. The cause of this bug is that gcc doesn't align the stack frame. Linux and glibc always ensure that the stack is aligned, so this never affected Linux.

author	banan
date	Thu, 14 Dec 2006 17:50:23 +0000
parents	c8c591fe26f8
children	0efc832d9102

comparison

equal deleted inserted replaced

-:95044f594170
+:b43bd0c56eaa
 uint8_t channel_coded[MAX_CHANNELS]; /* true if channel is coded */
 DECLARE_ALIGNED_16(float, exponents[MAX_CHANNELS][BLOCK_MAX_SIZE]);
 float max_exponent[MAX_CHANNELS];
 int16_t coefs1[MAX_CHANNELS][BLOCK_MAX_SIZE];
 DECLARE_ALIGNED_16(float, coefs[MAX_CHANNELS][BLOCK_MAX_SIZE]);
+DECLARE_ALIGNED_16(FFTSample, output[BLOCK_MAX_SIZE * 2]);
+DECLARE_ALIGNED_16(float, window[BLOCK_MAX_SIZE * 2]);
 MDCTContext mdct_ctx[BLOCK_NB_SIZES];
 float *windows[BLOCK_NB_SIZES];
 DECLARE_ALIGNED_16(FFTSample, mdct_tmp[BLOCK_MAX_SIZE]); /* temporary storage for imdct */
 /* output buffer for one frame and the last for IMDCT windowing */
 DECLARE_ALIGNED_16(float, frame_out[MAX_CHANNELS][BLOCK_MAX_SIZE * 2]);
 unrecorrable error. */
 static int wma_decode_block(WMADecodeContext *s)
 {
 int n, v, a, ch, code, bsize;
 int coef_nb_bits, total_gain, parse_exponents;
-DECLARE_ALIGNED_16(float, window[BLOCK_MAX_SIZE * 2]);
 int nb_coefs[MAX_CHANNELS];
 float mdct_norm;
 #ifdef TRACE
 tprintf("***decode_block: %d:%d\n", s->frame_count - 1, s->block_num);
 block_len = s->block_len;
 prev_block_len = 1 << s->prev_block_len_bits;
 next_block_len = 1 << s->next_block_len_bits;
 /* right part */
-wptr = window + block_len;
+wptr = s->window + block_len;
 if (block_len <= next_block_len) {
 for(i=0;i<block_len;i++)
 *wptr++ = s->windows[bsize][i];
 } else {
 /* overlap */
 for(i=0;i<n;i++)
 *wptr++ = 0.0;
 }
 /* left part */
-wptr = window + block_len;
+wptr = s->window + block_len;
 if (block_len <= prev_block_len) {
 for(i=0;i<block_len;i++)
 *--wptr = s->windows[bsize][i];
 } else {
 /* overlap */
 }
 for(ch = 0; ch < s->nb_channels; ch++) {
 if (s->channel_coded[ch]) {
-DECLARE_ALIGNED_16(FFTSample, output[BLOCK_MAX_SIZE * 2]);
 float *ptr;
 int n4, index, n;
 n = s->block_len;
 n4 = s->block_len / 2;
 s->mdct_ctx[bsize].fft.imdct_calc(&s->mdct_ctx[bsize],
-output, s->coefs[ch], s->mdct_tmp);
+s->output, s->coefs[ch], s->mdct_tmp);
 /* XXX: optimize all that by build the window and
 multipying/adding at the same time */
 /* multiply by the window and add in the frame */
 index = (s->frame_len / 2) + s->block_pos - n4;
 ptr = &s->frame_out[ch][index];
-s->dsp.vector_fmul_add_add(ptr,window,output,ptr,0,2*n,1);
+s->dsp.vector_fmul_add_add(ptr,s->window,s->output,ptr,0,2*n,1);
 /* specific fast case for ms-stereo : add to second
 channel if it is not coded */
 if (s->ms_stereo && !s->channel_coded[1]) {
 ptr = &s->frame_out[1][index];
-s->dsp.vector_fmul_add_add(ptr,window,output,ptr,0,2*n,1);
+s->dsp.vector_fmul_add_add(ptr,s->window,s->output,ptr,0,2*n,1);
 }
 }
 }
 next:
 /* update block number */

Mercurial > libavcodec.hg

comparison wmadec.c @ 4301:b43bd0c56eaa libavcodec