comparison: i386/fft_sse.c @ 8031:eebc7209c47f (libavcodec)
Convert the asm keyword into __asm__.

Neither the asm() nor the __asm__() keyword is part of the C99 standard. GCC accepts the former in C89 mode, but rejects it in C99 mode unless GNU extensions are enabled (with -fasm). The latter form is accepted in either mode as an extension, without requiring further command-line options.

The Sun Studio C99 compiler likewise rejects asm() but accepts __asm__(), albeit with a warning that it is not valid C99 syntax.
| author   | flameeyes                       |
|----------|---------------------------------|
| date     | Thu, 16 Oct 2008 13:34:09 +0000 |
| parents  | 97383e012cb9                    |
| children |                                 |
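
To make the difference concrete, here is a small, hypothetical test file (not part of the changeset; the file and function names are illustrative) showing how the two spellings behave with GCC under different -std settings:

```c
/* asm_c99_example.c -- illustrative only, not taken from the changeset.
 *
 * gcc -std=c99   -c asm_c99_example.c  -> the plain asm() below is rejected,
 *                                         unless -fasm (or -std=gnu99) is added
 * gcc -std=gnu99 -c asm_c99_example.c  -> both forms are accepted
 *
 * __asm__() is accepted as an extension in every mode, which is why the
 * patch switches to that spelling.
 */

void barrier_portable(void)
{
    __asm__ volatile("" ::: "memory");  /* compiler barrier; accepted in C89 and C99 modes */
}

void barrier_gnu_only(void)
{
    asm volatile("" ::: "memory");      /* rejected by gcc -std=c99 without -fasm */
}
```

Switching every statement to __asm__ therefore lets the file build with -std=c99 without requiring further GNU-specific command-line options.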
```diff
--- i386/fft_sse.c  (changeset 8030:a512ac8fa540)
+++ i386/fft_sse.c  (changeset 8031:eebc7209c47f)
@@ -34,11 +34,11 @@
 
     ff_fft_dispatch_interleave_sse(z, s->nbits);
 
     if(n <= 16) {
         x86_reg i = -8*n;
-        asm volatile(
+        __asm__ volatile(
             "1: \n"
             "movaps (%0,%1), %%xmm0 \n"
             "movaps %%xmm0, %%xmm1 \n"
             "unpcklps 16(%0,%1), %%xmm0 \n"
             "unpckhps 16(%0,%1), %%xmm1 \n"
@@ -56,11 +56,11 @@
 void ff_fft_permute_sse(FFTContext *s, FFTComplex *z)
 {
     int n = 1 << s->nbits;
     int i;
     for(i=0; i<n; i+=2) {
-        asm volatile(
+        __asm__ volatile(
             "movaps %2, %%xmm0 \n"
             "movlps %%xmm0, %0 \n"
             "movhps %%xmm0, %1 \n"
             :"=m"(s->tmp_buf[s->revtab[i]]),
              "=m"(s->tmp_buf[s->revtab[i+1]])
@@ -82,11 +82,11 @@
     const FFTSample *tsin = s->tsin;
     FFTComplex *z = (FFTComplex *)output;
 
     /* pre rotation */
     for(k=n8-2; k>=0; k-=2) {
-        asm volatile(
+        __asm__ volatile(
             "movaps (%2,%1,2), %%xmm0 \n" // { z[k].re, z[k].im, z[k+1].re, z[k+1].im }
             "movaps -16(%2,%0,2), %%xmm1 \n" // { z[-k-2].re, z[-k-2].im, z[-k-1].re, z[-k-1].im }
             "movaps %%xmm0, %%xmm2 \n"
             "shufps $0x88, %%xmm1, %%xmm0 \n" // { z[k].re, z[k+1].re, z[-k-2].re, z[-k-1].re }
             "shufps $0x77, %%xmm2, %%xmm1 \n" // { z[-k-1].im, z[-k-2].im, z[k+1].im, z[k].im }
@@ -109,24 +109,24 @@
              "r"(input+n4), "r"(tcos+n8), "r"(tsin+n8)
         );
 #ifdef ARCH_X86_64
         // if we have enough regs, don't let gcc make the luts latency-bound
         // but if not, latency is faster than spilling
-        asm("movlps %%xmm0, %0 \n"
+        __asm__("movlps %%xmm0, %0 \n"
             "movhps %%xmm0, %1 \n"
             "movlps %%xmm1, %2 \n"
             "movhps %%xmm1, %3 \n"
             :"=m"(z[revtab[-k-2]]),
              "=m"(z[revtab[-k-1]]),
              "=m"(z[revtab[ k ]]),
              "=m"(z[revtab[ k+1]])
         );
 #else
-        asm("movlps %%xmm0, %0" :"=m"(z[revtab[-k-2]]));
-        asm("movhps %%xmm0, %0" :"=m"(z[revtab[-k-1]]));
-        asm("movlps %%xmm1, %0" :"=m"(z[revtab[ k ]]));
-        asm("movhps %%xmm1, %0" :"=m"(z[revtab[ k+1]]));
+        __asm__("movlps %%xmm0, %0" :"=m"(z[revtab[-k-2]]));
+        __asm__("movhps %%xmm0, %0" :"=m"(z[revtab[-k-1]]));
+        __asm__("movlps %%xmm1, %0" :"=m"(z[revtab[ k ]]));
+        __asm__("movhps %%xmm1, %0" :"=m"(z[revtab[ k+1]]));
 #endif
     }
 
     ff_fft_dispatch_sse(z, s->fft.nbits);
 
@@ -144,11 +144,11 @@
     "subps %%xmm6, "#xmm0"\n"\
     "addps %%xmm7, "#xmm1"\n"
 
     j = -n2;
     k = n2-16;
-    asm volatile(
+    __asm__ volatile(
         "1: \n"
         CMUL(%0, %%xmm0, %%xmm1)
         CMUL(%1, %%xmm4, %%xmm5)
         "shufps $0x1b, %%xmm1, %%xmm1 \n"
         "shufps $0x1b, %%xmm5, %%xmm5 \n"
@@ -179,11 +179,11 @@
 
     ff_imdct_half_sse(s, output+n4, input);
 
     j = -n;
     k = n-16;
-    asm volatile(
+    __asm__ volatile(
         "movaps %4, %%xmm7 \n"
         "1: \n"
         "movaps (%2,%1), %%xmm0 \n"
         "movaps (%3,%0), %%xmm1 \n"
         "shufps $0x1b, %%xmm0, %%xmm0 \n"
```