# HG changeset patch # User michael # Date 1009129947 0 # Node ID f74f4524de6aa306b3dcb2649044286660978183 # Parent 265680bbdcfd48a9463023e155a5a19e3ce1681c mix3to1 in SSE diff -r 265680bbdcfd -r f74f4524de6a liba52/downmix.c --- a/liba52/downmix.c Sun Dec 23 17:32:34 2001 +0000 +++ b/liba52/downmix.c Sun Dec 23 17:52:27 2001 +0000 @@ -334,15 +334,34 @@ { int i; +#ifdef HAVE_SSE + asm volatile( + "movlps %1, %%xmm7 \n\t" + "shufps $0x00, %%xmm7, %%xmm7 \n\t" + "movl $-1024, %%esi \n\t" + "1: \n\t" + "movaps (%0, %%esi), %%xmm0 \n\t" + "movaps 1024(%0, %%esi), %%xmm1 \n\t" + "addps 2048(%0, %%esi), %%xmm0 \n\t" + "addps %%xmm7, %%xmm1 \n\t" + "addps %%xmm1, %%xmm0 \n\t" + "movaps %%xmm0, (%0, %%esi) \n\t" + "addl $16, %%esi \n\t" + " jnz 1b \n\t" + :: "r" (samples+256), "m" (bias) + : "%esi" + ); +#else for (i = 0; i < 256; i++) samples[i] += samples[i + 256] + samples[i + 512] + bias; +#endif } static void mix4to1 (sample_t * samples, sample_t bias) { int i; -#ifdef HAVE_SSE // FIXME untested +#ifdef HAVE_SSE asm volatile( "movlps %1, %%xmm7 \n\t" "shufps $0x00, %%xmm7, %%xmm7 \n\t"