Mercurial > libavcodec.hg
annotate cabac.c @ 3993:8b7c59b7af01 libavcodec
make state transition tables global as they are constant and the code is slightly faster that way
author | michael |
---|---|
date | Wed, 11 Oct 2006 14:44:17 +0000 |
parents | 72bae00a317f |
children | b2582438effe |
rev | line source |
---|---|
1287 | 1 /* |
2 * H.26L/H.264/AVC/JVT/14496-10/... encoder/decoder | |
3 * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at> | |
4 * | |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
5 * This file is part of FFmpeg. |
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
6 * |
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
7 * FFmpeg is free software; you can redistribute it and/or |
1287 | 8 * modify it under the terms of the GNU Lesser General Public |
9 * License as published by the Free Software Foundation; either | |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
10 * version 2.1 of the License, or (at your option) any later version. |
1287 | 11 * |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
12 * FFmpeg is distributed in the hope that it will be useful, |
1287 | 13 * but WITHOUT ANY WARRANTY; without even the implied warranty of |
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
15 * Lesser General Public License for more details. | |
16 * | |
17 * You should have received a copy of the GNU Lesser General Public | |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
18 * License along with FFmpeg; if not, write to the Free Software |
3036
0b546eab515d
Update licensing information: The FSF changed postal address.
diego
parents:
2967
diff
changeset
|
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
1287 | 20 * |
21 */ | |
22 | |
23 /** | |
24 * @file cabac.c | |
25 * Context Adaptive Binary Arithmetic Coder. | |
26 */ | |
27 | |
28 #include <string.h> | |
29 | |
30 #include "common.h" | |
2398
582e635cfa08
common.c -> bitstream.c (and the single non bitstream func -> utils.c)
michael
parents:
2323
diff
changeset
|
31 #include "bitstream.h" |
1287 | 32 #include "cabac.h" |
33 | |
3991
72bae00a317f
make lps_range a global table its constant anyway (saves 1 addition for accessing it)
michael
parents:
3984
diff
changeset
|
/**
 * Base LPS range table: 64 rows (one per state index) of 4 byte values.
 *
 * ff_init_cabac_states() copies every row i of this table into two
 * consecutive rows of the global ff_h264_lps_range table.
 * The 4 columns are presumably selected by a 2-bit quantisation of the
 * current coding range -- NOTE(review): confirm against the readers of
 * ff_h264_lps_range.
 */
static const uint8_t lps_range[64][4]= {
    /* states  0.. 3 */ {128,176,208,240}, {128,167,197,227}, {128,158,187,216}, {123,150,178,205},
    /* states  4.. 7 */ {116,142,169,195}, {111,135,160,185}, {105,128,152,175}, {100,122,144,166},
    /* states  8..11 */ { 95,116,137,158}, { 90,110,130,150}, { 85,104,123,142}, { 81, 99,117,135},
    /* states 12..15 */ { 77, 94,111,128}, { 73, 89,105,122}, { 69, 85,100,116}, { 66, 80, 95,110},
    /* states 16..19 */ { 62, 76, 90,104}, { 59, 72, 86, 99}, { 56, 69, 81, 94}, { 53, 65, 77, 89},
    /* states 20..23 */ { 51, 62, 73, 85}, { 48, 59, 69, 80}, { 46, 56, 66, 76}, { 43, 53, 63, 72},
    /* states 24..27 */ { 41, 50, 59, 69}, { 39, 48, 56, 65}, { 37, 45, 54, 62}, { 35, 43, 51, 59},
    /* states 28..31 */ { 33, 41, 48, 56}, { 32, 39, 46, 53}, { 30, 37, 43, 50}, { 29, 35, 41, 48},
    /* states 32..35 */ { 27, 33, 39, 45}, { 26, 31, 37, 43}, { 24, 30, 35, 41}, { 23, 28, 33, 39},
    /* states 36..39 */ { 22, 27, 32, 37}, { 21, 26, 30, 35}, { 20, 24, 29, 33}, { 19, 23, 27, 31},
    /* states 40..43 */ { 18, 22, 26, 30}, { 17, 21, 25, 28}, { 16, 20, 23, 27}, { 15, 19, 22, 25},
    /* states 44..47 */ { 14, 18, 21, 24}, { 14, 17, 20, 23}, { 13, 16, 19, 22}, { 12, 15, 18, 21},
    /* states 48..51 */ { 12, 14, 17, 20}, { 11, 14, 16, 19}, { 11, 13, 15, 18}, { 10, 12, 15, 17},
    /* states 52..55 */ { 10, 12, 14, 16}, {  9, 11, 13, 15}, {  9, 11, 12, 14}, {  8, 10, 12, 14},
    /* states 56..59 */ {  8,  9, 11, 13}, {  7,  9, 11, 12}, {  7,  9, 10, 12}, {  7,  8, 10, 11},
    /* states 60..63 */ {  6,  8,  9, 11}, {  6,  7,  9, 10}, {  6,  7,  8,  9}, {  2,  2,  2,  2},
};
52 | |
3991
72bae00a317f
make lps_range a global table its constant anyway (saves 1 addition for accessing it)
michael
parents:
3984
diff
changeset
|
/*
 * Global run-time lookup tables, filled in by ff_init_cabac_states().
 *
 * ff_h264_lps_range: row i of the static lps_range table is stored in rows
 *     2*i+1 and 2*i+2 (flat layout), i.e. rows 1..128 are written; rows 0
 *     and 129 are not touched by ff_init_cabac_states().
 * ff_h264_mps_state: entries 2*i and 2*i+1 are always written.
 * ff_h264_lps_state: written only when BRANCHLESS_CABAC_DECODER is not
 *     defined.  When it is defined, ff_init_cabac_states() instead stores
 *     through ff_h264_mps_state at indices -1..-128, which lies outside that
 *     array (the original author flags this as "not valid C").
 *     NOTE(review): this presumably relies on ff_h264_lps_state being placed
 *     directly in front of ff_h264_mps_state in memory -- the language does
 *     not guarantee that; keep the definition order and verify the layout.
 */
uint8_t ff_h264_lps_range[2*65][4];
uint8_t ff_h264_lps_state[2*64];
uint8_t ff_h264_mps_state[2*64];
3991
72bae00a317f
make lps_range a global table its constant anyway (saves 1 addition for accessing it)
michael
parents:
3984
diff
changeset
|
56 |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
/**
 * Base "MPS" state transition table, indexed by the current state (0..63).
 *
 * Entry i is i+1 for i <= 61; states 62 and 63 map to themselves.
 * ff_init_cabac_states() expands it into ff_h264_mps_state as
 * 2*mps_state[i]+0 and 2*mps_state[i]+1.
 */
static const uint8_t mps_state[64]= {
    /*  0.. 7 */  1, 2, 3, 4, 5, 6, 7, 8,
    /*  8..15 */  9,10,11,12,13,14,15,16,
    /* 16..23 */ 17,18,19,20,21,22,23,24,
    /* 24..31 */ 25,26,27,28,29,30,31,32,
    /* 32..39 */ 33,34,35,36,37,38,39,40,
    /* 40..47 */ 41,42,43,44,45,46,47,48,
    /* 48..55 */ 49,50,51,52,53,54,55,56,
    /* 56..63 */ 57,58,59,60,61,62,62,63,
};
67 | |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
/**
 * Base "LPS" state transition table, indexed by the current state (0..63).
 *
 * ff_init_cabac_states() reads entries 1..63 and stores them as
 * 2*lps_state[i]+0 and 2*lps_state[i]+1; entry 0 is not read there because
 * state 0 is special-cased with the constants 1 and 0.
 */
static const uint8_t lps_state[64]= {
    /*  0.. 7 */  0, 0, 1, 2, 2, 4, 4, 5,
    /*  8..15 */  6, 7, 8, 9, 9,11,11,12,
    /* 16..23 */ 13,13,15,15,16,16,18,18,
    /* 24..31 */ 19,19,21,21,22,22,23,24,
    /* 32..39 */ 24,25,26,26,27,27,28,29,
    /* 40..47 */ 29,30,30,30,31,32,32,33,
    /* 48..55 */ 33,33,34,34,35,35,35,36,
    /* 56..63 */ 36,36,37,37,37,38,38,63,
};
78 | |
/**
 * Shift-count lookup for 7-bit values.
 *
 * Entry 0 is 7; for v in 1..127 the entry equals 6 - floor(log2(v)), i.e.
 * the left shift that moves the highest set bit of v to bit 6.
 * Presumably used to renormalise the coding range -- NOTE(review): the
 * readers of this table are outside this file.
 */
const uint8_t ff_h264_norm_shift[128]= {
    /*   0.. 15 */ 7,6,5,5,4,4,4,4,3,3,3,3,3,3,3,3,
    /*  16.. 31 */ 2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,
    /*  32.. 47 */ 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
    /*  48.. 63 */ 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
    /*  64.. 79 */ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
    /*  80.. 95 */ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
    /*  96..111 */ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
    /* 112..127 */ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
};
89 | |
1287 | 90 /** |
91 * | |
92 * @param buf_size size of buf in bits | |
93 */ | |
94 void ff_init_cabac_encoder(CABACContext *c, uint8_t *buf, int buf_size){ | |
1522
79dddc5cd990
removed the obsolete and unused parameters of init_put_bits
alex
parents:
1300
diff
changeset
|
95 init_put_bits(&c->pb, buf, buf_size); |
1287 | 96 |
97 c->low= 0; | |
98 c->range= 0x1FE; | |
99 c->outstanding_count= 0; | |
100 #ifdef STRICT_LIMITS | |
101 c->sym_count =0; | |
102 #endif | |
2967 | 103 |
1287 | 104 c->pb.bit_left++; //avoids firstBitFlag |
105 } | |
106 | |
107 /** | |
108 * | |
109 * @param buf_size size of buf in bits | |
110 */ | |
2024
f65d87bfdd5a
some of the warning fixes by (Michael Roitzsch <mroi at users dot sourceforge dot net>)
michael
parents:
1908
diff
changeset
|
111 void ff_init_cabac_decoder(CABACContext *c, const uint8_t *buf, int buf_size){ |
2967 | 112 c->bytestream_start= |
1287 | 113 c->bytestream= buf; |
2116 | 114 c->bytestream_end= buf + buf_size; |
1287 | 115 |
2323 | 116 #if CABAC_BITS == 16 |
117 c->low = (*c->bytestream++)<<18; | |
118 c->low+= (*c->bytestream++)<<10; | |
119 #else | |
120 c->low = (*c->bytestream++)<<10; | |
121 #endif | |
122 c->low+= ((*c->bytestream++)<<2) + 2; | |
123 c->range= 0x1FE<<(CABAC_BITS + 1); | |
1287 | 124 } |
125 | |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
126 void ff_init_cabac_states(CABACContext *c){ |
1287 | 127 int i, j; |
2967 | 128 |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
129 for(i=0; i<64; i++){ |
1287 | 130 for(j=0; j<4; j++){ //FIXME check if this is worth the 1 shift we save |
3991
72bae00a317f
make lps_range a global table its constant anyway (saves 1 addition for accessing it)
michael
parents:
3984
diff
changeset
|
131 ff_h264_lps_range[2*i+0][j+4]= |
72bae00a317f
make lps_range a global table its constant anyway (saves 1 addition for accessing it)
michael
parents:
3984
diff
changeset
|
132 ff_h264_lps_range[2*i+1][j+4]= lps_range[i][j]; |
1287 | 133 } |
134 | |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
135 ff_h264_mps_state[2*i+0]= 2*mps_state[i]+0; |
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
136 ff_h264_mps_state[2*i+1]= 2*mps_state[i]+1; |
1287 | 137 |
1908
e20fd60b215c
h264 - progressive I frame CABAC support patch by (Laurent Aimar <fenrir at via dot ecp dot fr>)
michael
parents:
1522
diff
changeset
|
138 if( i ){ |
3984 | 139 #ifdef BRANCHLESS_CABAC_DECODER |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
140 ff_h264_mps_state[-2*i-1]= 2*lps_state[i]+0; //FIXME yes this is not valid C but iam lazy, cleanup welcome |
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
141 ff_h264_mps_state[-2*i-2]= 2*lps_state[i]+1; |
3974 | 142 }else{ |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
143 ff_h264_mps_state[-2*i-1]= 1; |
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
144 ff_h264_mps_state[-2*i-2]= 0; |
3974 | 145 #else |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
146 ff_h264_lps_state[2*i+0]= 2*lps_state[i]+0; |
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
147 ff_h264_lps_state[2*i+1]= 2*lps_state[i]+1; |
1287 | 148 }else{ |
3993
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
149 ff_h264_lps_state[2*i+0]= 1; |
8b7c59b7af01
make state transition tables global as they are constant and the code is slightly faster that way
michael
parents:
3991
diff
changeset
|
150 ff_h264_lps_state[2*i+1]= 0; |
3974 | 151 #endif |
1287 | 152 } |
153 } | |
154 } | |
155 | |
#if 0 //selftest
#define SIZE 10240

#include "avcodec.h"

/**
 * Disabled round-trip self test: encodes SIZE pseudo-random symbols with
 * each put_cabac_* routine, then decodes them again and logs any mismatch.
 * START_TIMER / STOP_TIMER wrap each call for timing.
 *
 * @return always 0; failures are only reported through av_log()
 */
int main(){
    CABACContext c;
    uint8_t b[9*SIZE];
    uint8_t r[9*SIZE];
    int i;
    uint8_t state[10]= {0};

    ff_init_cabac_encoder(&c, b, SIZE);
    /* ff_init_cabac_states() takes only the context; it fills the global
     * ff_h264_* tables itself. */
    ff_init_cabac_states(&c);

    /* reference symbols, values 0..6 */
    for(i=0; i<SIZE; i++){
        r[i]= random()%7;
    }

    for(i=0; i<SIZE; i++){
START_TIMER
        put_cabac_bypass(&c, r[i]&1);
STOP_TIMER("put_cabac_bypass")
    }

    for(i=0; i<SIZE; i++){
START_TIMER
        put_cabac(&c, state, r[i]&1);
STOP_TIMER("put_cabac")
    }

    for(i=0; i<SIZE; i++){
START_TIMER
        put_cabac_u(&c, state, r[i], 6, 3, i&1);
STOP_TIMER("put_cabac_u")
    }

    for(i=0; i<SIZE; i++){
START_TIMER
        put_cabac_ueg(&c, state, r[i], 3, 0, 1, 2);
STOP_TIMER("put_cabac_ueg")
    }

    put_cabac_terminate(&c, 1);

    ff_init_cabac_decoder(&c, b, SIZE);

    /* decoding must start from the same context states as encoding did */
    memset(state, 0, sizeof(state));

    for(i=0; i<SIZE; i++){
START_TIMER
        if( (r[i]&1) != get_cabac_bypass(&c) )
            av_log(NULL, AV_LOG_ERROR, "CABAC bypass failure at %d\n", i);
STOP_TIMER("get_cabac_bypass")
    }

    for(i=0; i<SIZE; i++){
START_TIMER
        if( (r[i]&1) != get_cabac(&c, state) )
            av_log(NULL, AV_LOG_ERROR, "CABAC failure at %d\n", i);
STOP_TIMER("get_cabac")
    }
#if 0
    for(i=0; i<SIZE; i++){
START_TIMER
        if( r[i] != get_cabac_u(&c, state, (i&1) ? 6 : 7, 3, i&1) )
            av_log(NULL, AV_LOG_ERROR, "CABAC unary (truncated) binarization failure at %d\n", i);
STOP_TIMER("get_cabac_u")
    }

    for(i=0; i<SIZE; i++){
START_TIMER
        if( r[i] != get_cabac_ueg(&c, state, 3, 0, 1, 2))
            av_log(NULL, AV_LOG_ERROR, "CABAC unary (truncated) binarization failure at %d\n", i);
STOP_TIMER("get_cabac_ueg")
    }
#endif
    if(!get_cabac_terminate(&c))
        av_log(NULL, AV_LOG_ERROR, "where's the Terminator?\n");

    return 0;
}

#endif