Mercurial > libavcodec.hg
annotate cabac.c @ 4014:b2582438effe libavcodec
dehack *ps_state indexing in the branchless decoder
author | michael |
---|---|
date | Fri, 13 Oct 2006 14:21:25 +0000 |
parents | 8b7c59b7af01 |
children | d550343b5dac |
rev | line source |
---|---|
1287 | 1 /* |
2 * H.26L/H.264/AVC/JVT/14496-10/... encoder/decoder | |
3 * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at> | |
4 * | |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
5 * This file is part of FFmpeg. |
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
6 * |
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
7 * FFmpeg is free software; you can redistribute it and/or |
1287 | 8 * modify it under the terms of the GNU Lesser General Public |
9 * License as published by the Free Software Foundation; either | |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
10 * version 2.1 of the License, or (at your option) any later version. |
1287 | 11 * |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
12 * FFmpeg is distributed in the hope that it will be useful, |
1287 | 13 * but WITHOUT ANY WARRANTY; without even the implied warranty of |
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
15 * Lesser General Public License for more details. | |
16 * | |
17 * You should have received a copy of the GNU Lesser General Public | |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
18 * License along with FFmpeg; if not, write to the Free Software |
3036
0b546eab515d
Update licensing information: The FSF changed postal address.
diego
parents:
2967
diff
changeset
|
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
1287 | 20 * |
21 */ | |
22 | |
23 /** | |
24 * @file cabac.c | |
25 * Context Adaptive Binary Arithmetic Coder. | |
26 */ | |
27 | |
28 #include <string.h> | |
29 | |
30 #include "common.h" | |
2398
582e635cfa08
common.c -> bitstream.c (and the single non bitstream func -> utils.c)
michael
parents:
2323
diff
changeset
|
31 #include "bitstream.h" |
1287 | 32 #include "cabac.h" |
33 | |
3991
72bae00a317f
make lps_range a global table its constant anyway (saves 1 addition for accessing it)
michael
parents:
3984
diff
changeset
|
/*
 * Per-state LPS range values, four per state.
 * ff_init_cabac_states() copies every row into the global
 * ff_h264_lps_range table.
 * NOTE(review): the layout matches rangeTabLPS in the H.264 spec (first index
 * probability state, second index quantized range) -- confirm against the
 * coder in cabac.h.
 */
static const uint8_t lps_range[64][4] = {
    /*  0.. 3 */ {128,176,208,240}, {128,167,197,227}, {128,158,187,216}, {123,150,178,205},
    /*  4.. 7 */ {116,142,169,195}, {111,135,160,185}, {105,128,152,175}, {100,122,144,166},
    /*  8..11 */ { 95,116,137,158}, { 90,110,130,150}, { 85,104,123,142}, { 81, 99,117,135},
    /* 12..15 */ { 77, 94,111,128}, { 73, 89,105,122}, { 69, 85,100,116}, { 66, 80, 95,110},
    /* 16..19 */ { 62, 76, 90,104}, { 59, 72, 86, 99}, { 56, 69, 81, 94}, { 53, 65, 77, 89},
    /* 20..23 */ { 51, 62, 73, 85}, { 48, 59, 69, 80}, { 46, 56, 66, 76}, { 43, 53, 63, 72},
    /* 24..27 */ { 41, 50, 59, 69}, { 39, 48, 56, 65}, { 37, 45, 54, 62}, { 35, 43, 51, 59},
    /* 28..31 */ { 33, 41, 48, 56}, { 32, 39, 46, 53}, { 30, 37, 43, 50}, { 29, 35, 41, 48},
    /* 32..35 */ { 27, 33, 39, 45}, { 26, 31, 37, 43}, { 24, 30, 35, 41}, { 23, 28, 33, 39},
    /* 36..39 */ { 22, 27, 32, 37}, { 21, 26, 30, 35}, { 20, 24, 29, 33}, { 19, 23, 27, 31},
    /* 40..43 */ { 18, 22, 26, 30}, { 17, 21, 25, 28}, { 16, 20, 23, 27}, { 15, 19, 22, 25},
    /* 44..47 */ { 14, 18, 21, 24}, { 14, 17, 20, 23}, { 13, 16, 19, 22}, { 12, 15, 18, 21},
    /* 48..51 */ { 12, 14, 17, 20}, { 11, 14, 16, 19}, { 11, 13, 15, 18}, { 10, 12, 15, 17},
    /* 52..55 */ { 10, 12, 14, 16}, {  9, 11, 13, 15}, {  9, 11, 12, 14}, {  8, 10, 12, 14},
    /* 56..59 */ {  8,  9, 11, 13}, {  7,  9, 11, 12}, {  7,  9, 10, 12}, {  7,  8, 10, 11},
    /* 60..63 */ {  6,  8,  9, 11}, {  6,  7,  9, 10}, {  6,  7,  8,  9}, {  2,  2,  2,  2},
};
52 | |
4014
b2582438effe
dehack *ps_state indexing in the branchless decoder
michael
parents:
3993
diff
changeset
|
/*
 * Global lookup tables, zero until ff_init_cabac_states() fills them.
 */

/* Combined transition table centred on index 128: MPS transitions are
 * written at 128 + 2*state + bit; with BRANCHLESS_CABAC_DECODER the LPS
 * transitions are written below 128, at 128 - 2*state - 1 and - 2. */
uint8_t ff_h264_mlps_state[4*64];

/* Expanded copy of lps_range with each state stored in two consecutive rows.
 * ff_init_cabac_states() starts writing one row (4 bytes) into the table. */
uint8_t ff_h264_lps_range[2*65][4];

/* LPS transitions indexed by 2*state + bit
 * (only filled when BRANCHLESS_CABAC_DECODER is not defined). */
uint8_t ff_h264_lps_state[2*64];

/* MPS transitions indexed by 2*state + bit. */
uint8_t ff_h264_mps_state[2*64];
3991
72bae00a317f
make lps_range a global table its constant anyway (saves 1 addition for accessing it)
michael
parents:
3984
diff
changeset
|
57 |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
/*
 * State transition table used for the MPS entries built by
 * ff_init_cabac_states(): entry i is i+1 for i < 62, while 62 and 63
 * map to themselves.
 */
static const uint8_t mps_state[64] = {
     1,  2,  3,  4,  5,  6,  7,  8,
     9, 10, 11, 12, 13, 14, 15, 16,
    17, 18, 19, 20, 21, 22, 23, 24,
    25, 26, 27, 28, 29, 30, 31, 32,
    33, 34, 35, 36, 37, 38, 39, 40,
    41, 42, 43, 44, 45, 46, 47, 48,
    49, 50, 51, 52, 53, 54, 55, 56,
    57, 58, 59, 60, 61, 62, 62, 63,
};
68 | |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
/*
 * State transition table used for the LPS entries built by
 * ff_init_cabac_states(). State 63 maps to itself; state 0 maps to 0 and is
 * special-cased by ff_init_cabac_states().
 */
static const uint8_t lps_state[64] = {
     0,  0,  1,  2,  2,  4,  4,  5,
     6,  7,  8,  9,  9, 11, 11, 12,
    13, 13, 15, 15, 16, 16, 18, 18,
    19, 19, 21, 21, 22, 22, 23, 24,
    24, 25, 26, 26, 27, 27, 28, 29,
    29, 30, 30, 30, 31, 32, 32, 33,
    33, 33, 34, 34, 35, 35, 35, 36,
    36, 36, 37, 37, 37, 38, 38, 63,
};
79 | |
/*
 * Shift amounts indexed by a 7-bit value: entry 0 is 7 and every other
 * entry i holds 6 - floor(log2(i)).
 */
const uint8_t ff_h264_norm_shift[128] = {
    /*   0.. 15 */ 7,6,5,5,4,4,4,4,3,3,3,3,3,3,3,3,
    /*  16.. 31 */ 2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,
    /*  32.. 47 */ 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
    /*  48.. 63 */ 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
    /*  64.. 79 */ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
    /*  80.. 95 */ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
    /*  96..111 */ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
    /* 112..127 */ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
};
90 | |
1287 | 91 /** |
92 * | |
93 * @param buf_size size of buf in bits | |
94 */ | |
95 void ff_init_cabac_encoder(CABACContext *c, uint8_t *buf, int buf_size){ | |
1522
79dddc5cd990
removed the obsolete and unused parameters of init_put_bits
alex
parents:
1300
diff
changeset
|
96 init_put_bits(&c->pb, buf, buf_size); |
1287 | 97 |
98 c->low= 0; | |
99 c->range= 0x1FE; | |
100 c->outstanding_count= 0; | |
101 #ifdef STRICT_LIMITS | |
102 c->sym_count =0; | |
103 #endif | |
2967 | 104 |
1287 | 105 c->pb.bit_left++; //avoids firstBitFlag |
106 } | |
107 | |
108 /** | |
109 * | |
110 * @param buf_size size of buf in bits | |
111 */ | |
2024
f65d87bfdd5a
some of the warning fixes by (Michael Roitzsch <mroi at users dot sourceforge dot net>)
michael
parents:
1908
diff
changeset
|
112 void ff_init_cabac_decoder(CABACContext *c, const uint8_t *buf, int buf_size){ |
2967 | 113 c->bytestream_start= |
1287 | 114 c->bytestream= buf; |
2116 | 115 c->bytestream_end= buf + buf_size; |
1287 | 116 |
2323 | 117 #if CABAC_BITS == 16 |
118 c->low = (*c->bytestream++)<<18; | |
119 c->low+= (*c->bytestream++)<<10; | |
120 #else | |
121 c->low = (*c->bytestream++)<<10; | |
122 #endif | |
123 c->low+= ((*c->bytestream++)<<2) + 2; | |
124 c->range= 0x1FE<<(CABAC_BITS + 1); | |
1287 | 125 } |
126 | |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
127 void ff_init_cabac_states(CABACContext *c){ |
1287 | 128 int i, j; |
2967 | 129 |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
130 for(i=0; i<64; i++){ |
1287 | 131 for(j=0; j<4; j++){ //FIXME check if this is worth the 1 shift we save |
3991
72bae00a317f
make lps_range a global table its constant anyway (saves 1 addition for accessing it)
michael
parents:
3984
diff
changeset
|
132 ff_h264_lps_range[2*i+0][j+4]= |
72bae00a317f
make lps_range a global table its constant anyway (saves 1 addition for accessing it)
michael
parents:
3984
diff
changeset
|
133 ff_h264_lps_range[2*i+1][j+4]= lps_range[i][j]; |
1287 | 134 } |
135 | |
4014
b2582438effe
dehack *ps_state indexing in the branchless decoder
michael
parents:
3993
diff
changeset
|
136 ff_h264_mlps_state[128+2*i+0]= |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
137 ff_h264_mps_state[2*i+0]= 2*mps_state[i]+0; |
4014
b2582438effe
dehack *ps_state indexing in the branchless decoder
michael
parents:
3993
diff
changeset
|
138 ff_h264_mlps_state[128+2*i+1]= |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
139 ff_h264_mps_state[2*i+1]= 2*mps_state[i]+1; |
1287 | 140 |
1908
e20fd60b215c
h264 - progressive I frame CABAC support patch by (Laurent Aimar <fenrir at via dot ecp dot fr>)
michael
parents:
1522
diff
changeset
|
141 if( i ){ |
3984 | 142 #ifdef BRANCHLESS_CABAC_DECODER |
4014
b2582438effe
dehack *ps_state indexing in the branchless decoder
michael
parents:
3993
diff
changeset
|
143 ff_h264_mlps_state[128-2*i-1]= 2*lps_state[i]+0; |
b2582438effe
dehack *ps_state indexing in the branchless decoder
michael
parents:
3993
diff
changeset
|
144 ff_h264_mlps_state[128-2*i-2]= 2*lps_state[i]+1; |
3974 | 145 }else{ |
4014
b2582438effe
dehack *ps_state indexing in the branchless decoder
michael
parents:
3993
diff
changeset
|
146 ff_h264_mlps_state[128-2*i-1]= 1; |
b2582438effe
dehack *ps_state indexing in the branchless decoder
michael
parents:
3993
diff
changeset
|
147 ff_h264_mlps_state[128-2*i-2]= 0; |
3974 | 148 #else |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
149 ff_h264_lps_state[2*i+0]= 2*lps_state[i]+0; |
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
150 ff_h264_lps_state[2*i+1]= 2*lps_state[i]+1; |
1287 | 151 }else{ |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
152 ff_h264_lps_state[2*i+0]= 1; |
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
153 ff_h264_lps_state[2*i+1]= 0; |
3974 | 154 #endif |
1287 | 155 } |
156 } | |
157 } | |
158 | |
#if 0 //selftest
#define SIZE 10240

#include "avcodec.h"

/*
 * Disabled round-trip self test: encodes SIZE random symbols with each
 * put_cabac* variant, then decodes them again and logs any mismatch.
 */
int main(void){
    CABACContext c;
    uint8_t b[9*SIZE];
    uint8_t r[9*SIZE];
    int i;
    uint8_t state[10]= {0};

    ff_init_cabac_encoder(&c, b, SIZE);
    /* ff_init_cabac_states() takes only the context; the tables are global. */
    ff_init_cabac_states(&c);

    for(i=0; i<SIZE; i++){
        r[i]= random()%7;
    }

    for(i=0; i<SIZE; i++){
START_TIMER
        put_cabac_bypass(&c, r[i]&1);
STOP_TIMER("put_cabac_bypass")
    }

    for(i=0; i<SIZE; i++){
START_TIMER
        put_cabac(&c, state, r[i]&1);
STOP_TIMER("put_cabac")
    }

    for(i=0; i<SIZE; i++){
START_TIMER
        put_cabac_u(&c, state, r[i], 6, 3, i&1);
STOP_TIMER("put_cabac_u")
    }

    for(i=0; i<SIZE; i++){
START_TIMER
        put_cabac_ueg(&c, state, r[i], 3, 0, 1, 2);
STOP_TIMER("put_cabac_ueg")
    }

    put_cabac_terminate(&c, 1);

    ff_init_cabac_decoder(&c, b, SIZE);

    memset(state, 0, sizeof(state));

    for(i=0; i<SIZE; i++){
START_TIMER
        if( (r[i]&1) != get_cabac_bypass(&c) )
            av_log(NULL, AV_LOG_ERROR, "CABAC bypass failure at %d\n", i);
STOP_TIMER("get_cabac_bypass")
    }

    for(i=0; i<SIZE; i++){
START_TIMER
        if( (r[i]&1) != get_cabac(&c, state) )
            av_log(NULL, AV_LOG_ERROR, "CABAC failure at %d\n", i);
STOP_TIMER("get_cabac")
    }
#if 0
    for(i=0; i<SIZE; i++){
START_TIMER
        if( r[i] != get_cabac_u(&c, state, (i&1) ? 6 : 7, 3, i&1) )
            av_log(NULL, AV_LOG_ERROR, "CABAC unary (truncated) binarization failure at %d\n", i);
STOP_TIMER("get_cabac_u")
    }

    for(i=0; i<SIZE; i++){
START_TIMER
        if( r[i] != get_cabac_ueg(&c, state, 3, 0, 1, 2))
            av_log(NULL, AV_LOG_ERROR, "CABAC unary (truncated) binarization failure at %d\n", i);
STOP_TIMER("get_cabac_ueg")
    }
#endif
    if(!get_cabac_terminate(&c))
        av_log(NULL, AV_LOG_ERROR, "where's the Terminator?\n");

    return 0;
}

#endif