Mercurial > libavcodec.hg
annotate cabac.c @ 3974:93746612bc78 libavcodec
optimize branchless C CABAC decoder
author | michael |
---|---|
date | Mon, 09 Oct 2006 20:44:11 +0000 |
parents | 162bea01a5d4 |
children | 27e90123b346 |
rev | line source |
---|---|
1287 | 1 /* |
2 * H.26L/H.264/AVC/JVT/14496-10/... encoder/decoder | |
3 * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at> | |
4 * | |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
5 * This file is part of FFmpeg. |
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
6 * |
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
7 * FFmpeg is free software; you can redistribute it and/or |
1287 | 8 * modify it under the terms of the GNU Lesser General Public |
9 * License as published by the Free Software Foundation; either | |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
10 * version 2.1 of the License, or (at your option) any later version. |
1287 | 11 * |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
12 * FFmpeg is distributed in the hope that it will be useful, |
1287 | 13 * but WITHOUT ANY WARRANTY; without even the implied warranty of |
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
15 * Lesser General Public License for more details. | |
16 * | |
17 * You should have received a copy of the GNU Lesser General Public | |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3036
diff
changeset
|
18 * License along with FFmpeg; if not, write to the Free Software |
3036
0b546eab515d
Update licensing information: The FSF changed postal address.
diego
parents:
2967
diff
changeset
|
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
1287 | 20 * |
21 */ | |
22 | |
23 /** | |
24 * @file cabac.c | |
25 * Context Adaptive Binary Arithmetic Coder. | |
26 */ | |
27 | |
28 #include <string.h> | |
29 | |
30 #include "common.h" | |
2398
582e635cfa08
common.c -> bitstream.c (and the single non bitstream func -> utils.c)
michael
parents:
2323
diff
changeset
|
31 #include "bitstream.h" |
1287 | 32 #include "cabac.h" |
33 | |
/**
 * LPS range table: 64 rows (one per state) of 4 entries each.
 * The shape matches the lps_range parameter of ff_init_cabac_states(),
 * which reads it as lps_range[state][column].
 * NOTE(review): the column presumably selects a quantized range value --
 * confirm against the decoder/encoder that consumes the table.
 */
const uint8_t ff_h264_lps_range[64][4] = {
    /*  0.. 3 */ {128, 176, 208, 240}, {128, 167, 197, 227}, {128, 158, 187, 216}, {123, 150, 178, 205},
    /*  4.. 7 */ {116, 142, 169, 195}, {111, 135, 160, 185}, {105, 128, 152, 175}, {100, 122, 144, 166},
    /*  8..11 */ { 95, 116, 137, 158}, { 90, 110, 130, 150}, { 85, 104, 123, 142}, { 81,  99, 117, 135},
    /* 12..15 */ { 77,  94, 111, 128}, { 73,  89, 105, 122}, { 69,  85, 100, 116}, { 66,  80,  95, 110},
    /* 16..19 */ { 62,  76,  90, 104}, { 59,  72,  86,  99}, { 56,  69,  81,  94}, { 53,  65,  77,  89},
    /* 20..23 */ { 51,  62,  73,  85}, { 48,  59,  69,  80}, { 46,  56,  66,  76}, { 43,  53,  63,  72},
    /* 24..27 */ { 41,  50,  59,  69}, { 39,  48,  56,  65}, { 37,  45,  54,  62}, { 35,  43,  51,  59},
    /* 28..31 */ { 33,  41,  48,  56}, { 32,  39,  46,  53}, { 30,  37,  43,  50}, { 29,  35,  41,  48},
    /* 32..35 */ { 27,  33,  39,  45}, { 26,  31,  37,  43}, { 24,  30,  35,  41}, { 23,  28,  33,  39},
    /* 36..39 */ { 22,  27,  32,  37}, { 21,  26,  30,  35}, { 20,  24,  29,  33}, { 19,  23,  27,  31},
    /* 40..43 */ { 18,  22,  26,  30}, { 17,  21,  25,  28}, { 16,  20,  23,  27}, { 15,  19,  22,  25},
    /* 44..47 */ { 14,  18,  21,  24}, { 14,  17,  20,  23}, { 13,  16,  19,  22}, { 12,  15,  18,  21},
    /* 48..51 */ { 12,  14,  17,  20}, { 11,  14,  16,  19}, { 11,  13,  15,  18}, { 10,  12,  15,  17},
    /* 52..55 */ { 10,  12,  14,  16}, {  9,  11,  13,  15}, {  9,  11,  12,  14}, {  8,  10,  12,  14},
    /* 56..59 */ {  8,   9,  11,  13}, {  7,   9,  11,  12}, {  7,   9,  10,  12}, {  7,   8,  10,  11},
    /* 60..63 */ {  6,   8,   9,  11}, {  6,   7,   9,  10}, {  6,   7,   8,   9}, {  2,   2,   2,   2},
};
52 | |
/**
 * State transition table with 64 entries, passed as the mps_state argument
 * of ff_init_cabac_states().
 * Entry i is i+1 for i < 62; entries 62 and 63 map to themselves.
 * NOTE(review): presumably the successor state after coding the most
 * probable symbol -- confirm against the coder that reads it.
 */
const uint8_t ff_h264_mps_state[64] = {
     1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 13, 14, 15, 16,
    17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32,
    33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48,
    49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 62, 63,
};
63 | |
/**
 * State transition table with 64 entries, passed as the lps_state argument
 * of ff_init_cabac_states().
 * NOTE(review): presumably the successor state after coding the least
 * probable symbol -- confirm against the coder that reads it.
 */
const uint8_t ff_h264_lps_state[64] = {
     0,  0,  1,  2,  2,  4,  4,  5,  6,  7,  8,  9,  9, 11, 11, 12,
    13, 13, 15, 15, 16, 16, 18, 18, 19, 19, 21, 21, 22, 22, 23, 24,
    24, 25, 26, 26, 27, 27, 28, 29, 29, 30, 30, 30, 31, 32, 32, 33,
    33, 33, 34, 34, 35, 35, 35, 36, 36, 36, 37, 37, 37, 38, 38, 63,
};
74 | |
/**
 * Shift-count lookup with 128 entries: entry i holds the number of leading
 * zero bits of i when i is viewed as a 7-bit value (so entry 0 is 7 and
 * entries 64..127 are 0).
 * NOTE(review): presumably used to renormalize the coder range -- confirm
 * against the code that indexes this table.
 */
const uint8_t ff_h264_norm_shift[128] = {
    /*   0      */ 7,
    /*   1      */ 6,
    /*   2..3   */ 5, 5,
    /*   4..7   */ 4, 4, 4, 4,
    /*   8..15  */ 3, 3, 3, 3, 3, 3, 3, 3,
    /*  16..31  */ 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    /*  32..47  */ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    /*  48..63  */ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    /*  64..79  */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
    /*  80..95  */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
    /*  96..111 */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
    /* 112..127 */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
};
85 | |
1287 | 86 /** |
87 * | |
88 * @param buf_size size of buf in bits | |
89 */ | |
90 void ff_init_cabac_encoder(CABACContext *c, uint8_t *buf, int buf_size){ | |
1522
79dddc5cd990
removed the obsolete and unused parameters of init_put_bits
alex
parents:
1300
diff
changeset
|
91 init_put_bits(&c->pb, buf, buf_size); |
1287 | 92 |
93 c->low= 0; | |
94 c->range= 0x1FE; | |
95 c->outstanding_count= 0; | |
96 #ifdef STRICT_LIMITS | |
97 c->sym_count =0; | |
98 #endif | |
2967 | 99 |
1287 | 100 c->pb.bit_left++; //avoids firstBitFlag |
101 } | |
102 | |
103 /** | |
104 * | |
105 * @param buf_size size of buf in bits | |
106 */ | |
2024
f65d87bfdd5a
some of the warning fixes by (Michael Roitzsch <mroi at users dot sourceforge dot net>)
michael
parents:
1908
diff
changeset
|
107 void ff_init_cabac_decoder(CABACContext *c, const uint8_t *buf, int buf_size){ |
2967 | 108 c->bytestream_start= |
1287 | 109 c->bytestream= buf; |
2116 | 110 c->bytestream_end= buf + buf_size; |
1287 | 111 |
2323 | 112 #if CABAC_BITS == 16 |
113 c->low = (*c->bytestream++)<<18; | |
114 c->low+= (*c->bytestream++)<<10; | |
115 #else | |
116 c->low = (*c->bytestream++)<<10; | |
117 #endif | |
118 c->low+= ((*c->bytestream++)<<2) + 2; | |
119 c->range= 0x1FE<<(CABAC_BITS + 1); | |
1287 | 120 } |
121 | |
2967 | 122 void ff_init_cabac_states(CABACContext *c, uint8_t const (*lps_range)[4], |
1287 | 123 uint8_t const *mps_state, uint8_t const *lps_state, int state_count){ |
124 int i, j; | |
2967 | 125 |
1287 | 126 for(i=0; i<state_count; i++){ |
127 for(j=0; j<4; j++){ //FIXME check if this is worth the 1 shift we save | |
3955 | 128 c->lps_range[2*i+2][j+4]= |
129 c->lps_range[2*i+3][j+4]= lps_range[i][j]; | |
1287 | 130 } |
131 | |
3955 | 132 c->mps_state[2*i+2]= 2*mps_state[i]+2; |
133 c->mps_state[2*i+3]= 2*mps_state[i]+3; | |
1287 | 134 |
1908
e20fd60b215c
h264 - progressive I frame CABAC support patch by (Laurent Aimar <fenrir at via dot ecp dot fr>)
michael
parents:
1522
diff
changeset
|
135 if( i ){ |
3974 | 136 #ifdef BRANCHLESS_CABAD |
137 c->mps_state[-2*i-3]= 2*lps_state[i]+2; //FIXME yes this is not valid C but iam lazy, cleanup welcome | |
138 c->mps_state[-2*i-4]= 2*lps_state[i]+3; | |
139 }else{ | |
140 c->mps_state[-2*i-3]= 3; | |
141 c->mps_state[-2*i-4]= 2; | |
142 #else | |
3955 | 143 c->lps_state[2*i+2]= 2*lps_state[i]+2; |
144 c->lps_state[2*i+3]= 2*lps_state[i]+3; | |
1287 | 145 }else{ |
3955 | 146 c->lps_state[2*i+2]= 3; |
147 c->lps_state[2*i+3]= 2; | |
3974 | 148 #endif |
1287 | 149 } |
150 } | |
151 } | |
152 | |
153 #if 0 //selftest | |
154 #define SIZE 10240 | |
2420 | 155 |
156 #include "avcodec.h" | |
157 | |
1287 | 158 int main(){ |
159 CABACContext c; | |
160 uint8_t b[9*SIZE]; | |
1290 | 161 uint8_t r[9*SIZE]; |
1287 | 162 int i; |
1290 | 163 uint8_t state[10]= {0}; |
2967 | 164 |
1287 | 165 ff_init_cabac_encoder(&c, b, SIZE); |
166 ff_init_cabac_states(&c, ff_h264_lps_range, ff_h264_mps_state, ff_h264_lps_state, 64); | |
2967 | 167 |
1287 | 168 for(i=0; i<SIZE; i++){ |
1290 | 169 r[i]= random()%7; |
1287 | 170 } |
2967 | 171 |
1287 | 172 for(i=0; i<SIZE; i++){ |
173 START_TIMER | |
1290 | 174 put_cabac_bypass(&c, r[i]&1); |
1287 | 175 STOP_TIMER("put_cabac_bypass") |
176 } | |
2967 | 177 |
1287 | 178 for(i=0; i<SIZE; i++){ |
179 START_TIMER | |
1290 | 180 put_cabac(&c, state, r[i]&1); |
1287 | 181 STOP_TIMER("put_cabac") |
182 } | |
183 | |
1290 | 184 for(i=0; i<SIZE; i++){ |
185 START_TIMER | |
186 put_cabac_u(&c, state, r[i], 6, 3, i&1); | |
187 STOP_TIMER("put_cabac_u") | |
2967 | 188 } |
1290 | 189 |
190 for(i=0; i<SIZE; i++){ | |
191 START_TIMER | |
1298 | 192 put_cabac_ueg(&c, state, r[i], 3, 0, 1, 2); |
1290 | 193 STOP_TIMER("put_cabac_ueg") |
2967 | 194 } |
195 | |
1287 | 196 put_cabac_terminate(&c, 1); |
2967 | 197 |
1287 | 198 ff_init_cabac_decoder(&c, b, SIZE); |
2967 | 199 |
1290 | 200 memset(state, 0, sizeof(state)); |
2967 | 201 |
1287 | 202 for(i=0; i<SIZE; i++){ |
203 START_TIMER | |
1290 | 204 if( (r[i]&1) != get_cabac_bypass(&c) ) |
2420 | 205 av_log(NULL, AV_LOG_ERROR, "CABAC bypass failure at %d\n", i); |
1287 | 206 STOP_TIMER("get_cabac_bypass") |
207 } | |
2967 | 208 |
1287 | 209 for(i=0; i<SIZE; i++){ |
210 START_TIMER | |
1290 | 211 if( (r[i]&1) != get_cabac(&c, state) ) |
2420 | 212 av_log(NULL, AV_LOG_ERROR, "CABAC failure at %d\n", i); |
1287 | 213 STOP_TIMER("get_cabac") |
214 } | |
2420 | 215 #if 0 |
1290 | 216 for(i=0; i<SIZE; i++){ |
217 START_TIMER | |
218 if( r[i] != get_cabac_u(&c, state, (i&1) ? 6 : 7, 3, i&1) ) | |
2420 | 219 av_log(NULL, AV_LOG_ERROR, "CABAC unary (truncated) binarization failure at %d\n", i); |
1290 | 220 STOP_TIMER("get_cabac_u") |
221 } | |
222 | |
223 for(i=0; i<SIZE; i++){ | |
224 START_TIMER | |
225 if( r[i] != get_cabac_ueg(&c, state, 3, 0, 1, 2)) | |
2420 | 226 av_log(NULL, AV_LOG_ERROR, "CABAC unary (truncated) binarization failure at %d\n", i); |
1290 | 227 STOP_TIMER("get_cabac_ueg") |
228 } | |
2420 | 229 #endif |
1287 | 230 if(!get_cabac_terminate(&c)) |
2420 | 231 av_log(NULL, AV_LOG_ERROR, "where's the Terminator?\n"); |
2967 | 232 |
1287 | 233 return 0; |
234 } | |
235 | |
236 #endif |