diff cabac.h @ 3956:0910f2844f9a libavcodec

branchless renormalization (1% faster get_cabac) old branchless renormalization wasnt faster because gcc was scared of the shift variable (missusing bit variable now)
author michael
date Sun, 08 Oct 2006 13:20:22 +0000
parents 051a9c8b257f
children 2acfc35c3075
line wrap: on
line diff
--- a/cabac.h	Sun Oct 08 11:24:37 2006 +0000
+++ b/cabac.h	Sun Oct 08 13:20:22 2006 +0000
@@ -266,16 +266,16 @@
     c->bytestream+= CABAC_BITS/8;
 }
 
-#if 0 /* all use commented */
+#if 1 /* all use commented */
 static void refill2(CABACContext *c){
     int i, x;
 
     x= c->low ^ (c->low-1);
-    i= 8 - ff_h264_norm_shift[x>>(CABAC_BITS+1)];
+    i= 9 - ff_h264_norm_shift[x>>(CABAC_BITS+1)];
 
     x= -CABAC_MASK;
 
-    if(c->bytestream < c->bytestream_end)
+    if(c->bytestream <= c->bytestream_end)
 #if CABAC_BITS == 16
         x+= (c->bytestream[0]<<9) + (c->bytestream[1]<<1);
 #else
@@ -395,17 +395,18 @@
 #endif
         renorm_cabac_decoder_once(c);
     }else{
-//        int shift= ff_h264_norm_shift[RangeLPS>>17];
-        bit= (s&1)^1;
+        bit= ff_h264_norm_shift[RangeLPS>>17];
         c->low -= c->range;
         *state= c->lps_state[s];
-        c->range = RangeLPS;
-        renorm_cabac_decoder(c);
-/*        c->range = RangeLPS<<shift;
-        c->low <<= shift;
+//        c->range = RangeLPS;
+//        renorm_cabac_decoder(c);
+        c->range = RangeLPS<<bit;
+        c->low <<= bit;
+        bit= (s&1)^1;
+
         if(!(c->low & 0xFFFF)){
             refill2(c);
-        }*/
+        }
     }
 #else
     lps_mask= (c->range - c->low)>>31;