# HG changeset patch # User michael # Date 1160313622 0 # Node ID 0910f2844f9a4d61722780a4b0b134f05b526ce9 # Parent 051a9c8b257f04173074f898acca84fcf72ea047 branchless renormalization (1% faster get_cabac) old branchless renormalization wasnt faster because gcc was scared of the shift variable (missusing bit variable now) diff -r 051a9c8b257f -r 0910f2844f9a cabac.c --- a/cabac.c Sun Oct 08 11:24:37 2006 +0000 +++ b/cabac.c Sun Oct 08 13:20:22 2006 +0000 @@ -73,22 +73,22 @@ }; const uint8_t ff_h264_norm_shift[256]= { - 8,7,6,6,5,5,5,5,4,4,4,4,4,4,4,4, + 9,8,7,7,6,6,6,6,5,5,5,5,5,5,5,5, + 4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3, + 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3, + 2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2, + 2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2, 2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2, 2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2, 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, - 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, - 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, - 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, - 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, - 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, - 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, - 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, - 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, + 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, + 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, + 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, + 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, }; /** diff -r 051a9c8b257f -r 0910f2844f9a cabac.h --- a/cabac.h Sun Oct 08 11:24:37 2006 +0000 +++ b/cabac.h Sun Oct 08 13:20:22 2006 +0000 @@ -266,16 +266,16 @@ c->bytestream+= CABAC_BITS/8; } -#if 0 /* all use commented */ +#if 1 /* all use commented */ static void refill2(CABACContext *c){ int i, x; x= c->low ^ (c->low-1); - i= 8 - ff_h264_norm_shift[x>>(CABAC_BITS+1)]; + i= 9 - ff_h264_norm_shift[x>>(CABAC_BITS+1)]; x= -CABAC_MASK; - if(c->bytestream < c->bytestream_end) + if(c->bytestream <= c->bytestream_end) #if CABAC_BITS == 16 x+= (c->bytestream[0]<<9) + (c->bytestream[1]<<1); #else @@ -395,17 +395,18 @@ #endif renorm_cabac_decoder_once(c); }else{ -// int shift= ff_h264_norm_shift[RangeLPS>>17]; - bit= (s&1)^1; + bit= ff_h264_norm_shift[RangeLPS>>17]; c->low -= c->range; *state= c->lps_state[s]; - c->range = RangeLPS; - renorm_cabac_decoder(c); -/* c->range = RangeLPS<low <<= shift; +// c->range = RangeLPS; +// renorm_cabac_decoder(c); + c->range = RangeLPS<low <<= bit; + bit= (s&1)^1; + if(!(c->low & 0xFFFF)){ refill2(c); - }*/ + } } #else lps_mask= (c->range - c->low)>>31;