Mercurial > libavcodec.hg
view alpha/regdef.h @ 4040:9eaea06c5ba6 libavcodec
optimize sign decoding code in decode_residual()
x86 is 4% faster on P3
C sign stuff + x86 code for everything else is also faster than before (sorry, forgot to test pure C)
... and if I replace the second occurrence of the sign decoding in decode_residual by the asm too, then everything gets slower. I am starting to think that it might be best to write the whole function in asm; playing this "avoid random deoptimizations" game with gcc is not fun at all
author | michael |
---|---|
date | Thu, 19 Oct 2006 01:19:03 +0000 |
parents | c8c591fe26f8 |
children | 1d83e9c34641 |
line wrap: on
line source
/*
 * Alpha optimized DSP utils
 * copyright (c) 2002 Falk Hueffner <falk@debian.org>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/* Some BSDs don't seem to have regdef.h... sigh */

#ifndef alpha_regdef_h
#define alpha_regdef_h

/*
 * Symbolic names for the Alpha integer registers.
 *
 * Each macro expands to the register operand shown next to it ($0 .. $31).
 * Two names are aliases of other names rather than of a register operand:
 *   fp -> s6   and   pv -> t12
 * AT expands to the symbolic operand "$at", not to a numbered register.
 *
 * Every preprocessor directive below must stay on its own line: a '#'
 * directive is only recognised when it is the first token on a line.
 */

#define v0      $0      /* function return value */

#define t0      $1      /* temporary registers (caller-saved) */
#define t1      $2
#define t2      $3
#define t3      $4
#define t4      $5
#define t5      $6
#define t6      $7
#define t7      $8

#define s0      $9      /* saved-registers (callee-saved registers) */
#define s1      $10
#define s2      $11
#define s3      $12
#define s4      $13
#define s5      $14
#define s6      $15
#define fp      s6      /* frame-pointer (s6 in frame-less procedures) */

#define a0      $16     /* argument registers (caller-saved) */
#define a1      $17
#define a2      $18
#define a3      $19
#define a4      $20
#define a5      $21

#define t8      $22     /* more temps (caller-saved) */
#define t9      $23
#define t10     $24
#define t11     $25
#define ra      $26     /* return address register */
#define t12     $27

#define pv      t12     /* procedure-variable register */
#define AT      $at     /* assembler temporary */
#define gp      $29     /* global pointer */
#define sp      $30     /* stack pointer */
#define zero    $31     /* reads as zero, writes are noops */

#endif /* alpha_regdef_h */