# HG changeset patch
# User lorenm
# Date 1202273061 0
# Node ID 950811a14eb3a350d54902108c8c776a62a0c8c9
# Parent bf8c9e82c7ade62dcc7c0e0c1ed2105fd5b70e81
put loop counter in a register if possible. makes some of the qpel functions 3% faster.

diff -r bf8c9e82c7ad -r 950811a14eb3 i386/dsputil_mmx.c
--- a/i386/dsputil_mmx.c Wed Feb 06 04:14:07 2008 +0000
+++ b/i386/dsputil_mmx.c Wed Feb 06 04:44:21 2008 +0000
@@ -2061,7 +2061,7 @@
  "add %4, %1 \n\t"\
  "decl %2 \n\t"\
  " jnz 1b \n\t"\
- : "+a"(src), "+c"(dst), "+m"(h)\
+ : "+a"(src), "+c"(dst), "+g"(h)\
  : "d"((long)srcStride), "S"((long)dstStride), /*"m"(ff_pw_20), "m"(ff_pw_3),*/ "m"(temp), "m"(ROUNDER)\
  : "memory"\
  );\
@@ -2174,7 +2174,7 @@
  "add %4, %1 \n\t"\
  "decl %2 \n\t"\
  " jnz 1b \n\t"\
- : "+a"(src), "+c"(dst), "+m"(h)\
+ : "+a"(src), "+c"(dst), "+g"(h)\
  : "S"((long)srcStride), "D"((long)dstStride), /*"m"(ff_pw_20), "m"(ff_pw_3),*/ "m"(temp), "m"(ROUNDER)\
  : "memory"\
  );\
diff -r bf8c9e82c7ad -r 950811a14eb3 i386/h264dsp_mmx.c
--- a/i386/h264dsp_mmx.c Wed Feb 06 04:14:07 2008 +0000
+++ b/i386/h264dsp_mmx.c Wed Feb 06 04:44:21 2008 +0000
@@ -796,7 +796,7 @@
  "add %4, %1 \n\t"\
  "decl %2 \n\t"\
  " jnz 1b \n\t"\
- : "+a"(src), "+c"(dst), "+m"(h)\
+ : "+a"(src), "+c"(dst), "+g"(h)\
  : "d"((long)srcStride), "S"((long)dstStride), "m"(ff_pw_5), "m"(ff_pw_16)\
  : "memory"\
  );\
@@ -930,7 +930,7 @@
  "add %3, %1 \n\t"\
  "decl %2 \n\t"\
  " jnz 1b \n\t"\
- : "+a"(tmp), "+c"(dst), "+m"(h)\
+ : "+a"(tmp), "+c"(dst), "+g"(h)\
  : "S"((long)dstStride)\
  : "memory"\
  );\
@@ -987,7 +987,7 @@
  "add %4, %1 \n\t"\
  "decl %2 \n\t"\
  " jnz 1b \n\t"\
- : "+a"(src), "+c"(dst), "+m"(h)\
+ : "+a"(src), "+c"(dst), "+g"(h)\
  : "d"((long)srcStride), "S"((long)dstStride), "m"(ff_pw_5), "m"(ff_pw_16)\
  : "memory"\
  );\
@@ -1201,7 +1201,7 @@
  "add %3, %1 \n\t"\
  "decl %2 \n\t"\
  " jnz 1b \n\t"\
- : "+a"(tmp), "+c"(dst), "+m"(h)\
+ : "+a"(tmp), "+c"(dst), "+g"(h)\
  : "S"((long)dstStride)\
  : "memory"\
  );\