Mercurial > libavcodec.hg
diff huffyuv.c @ 5063:d5640ea6d4a6 libavcodec
merge huffman tables so that we read 2 symbols at a time. 30% faster huffyuv decoding.
author | lorenm |
---|---|
date | Wed, 23 May 2007 09:02:07 +0000 |
parents | 5c6cd6601371 |
children | 1aec7fab94c4 |
line wrap: on
line diff
--- a/huffyuv.c Tue May 22 07:08:38 2007 +0000 +++ b/huffyuv.c Wed May 23 09:02:07 2007 +0000 @@ -70,7 +70,8 @@ uint64_t stats[3][256]; uint8_t len[3][256]; uint32_t bits[3][256]; - VLC vlc[3]; + VLC vlc[6]; //Y,U,V,YY,YU,YV + uint16_t pix2_map[3][1<<VLC_BITS]; AVFrame picture; uint8_t *bitstream_buffer; unsigned int bitstream_buffer_size; @@ -318,6 +319,35 @@ } #endif /* CONFIG_ENCODERS */ +static void generate_joint_tables(HYuvContext *s){ + // TODO modify init_vlc to allow sparse tables, and eliminate pix2_map + // TODO rgb + if(s->bitstream_bpp < 24){ + uint16_t bits[1<<VLC_BITS]; + uint8_t len[1<<VLC_BITS]; + int p, i, y, u; + for(p=0; p<3; p++){ + for(i=y=0; y<256; y++){ + int len0 = s->len[0][y]; + int limit = VLC_BITS - len0; + if(limit > 0){ + for(u=0; u<256; u++){ + int len1 = s->len[p][u]; + if(len1 <= limit){ + len[i] = len0 + len1; + bits[i] = (s->bits[0][y] << len1) + s->bits[p][u]; + s->pix2_map[p][i] = (y<<8) + u; + i++; + } + } + } + } + free_vlc(&s->vlc[3+p]); + init_vlc(&s->vlc[3+p], VLC_BITS, i, len, 1, 1, bits, 2, 2, 0); + } + } +} + static int read_huffman_tables(HYuvContext *s, uint8_t *src, int length){ GetBitContext gb; int i; @@ -339,6 +369,8 @@ init_vlc(&s->vlc[i], VLC_BITS, 256, s->len[i], 1, 1, s->bits[i], 4, 4, 0); } + generate_joint_tables(s); + return (get_bits_count(&gb)+7)/8; } @@ -367,6 +399,8 @@ init_vlc(&s->vlc[i], VLC_BITS, 256, s->len[i], 1, 1, s->bits[i], 4, 4, 0); } + generate_joint_tables(s); + return 0; #else av_log(s->avctx, AV_LOG_DEBUG, "v1 huffyuv is not supported \n"); @@ -653,16 +687,28 @@ } #endif /* CONFIG_ENCODERS */ +/* TODO instead of restarting the read when the code isn't in the first level + * of the joint table, jump into the 2nd level of the individual table. */ +#define READ_2PIX(dst0, dst1, plane1){\ + int code = get_vlc2(&s->gb, s->vlc[3+plane1].table, VLC_BITS, 1);\ + if(code >= 0){\ + int x = s->pix2_map[plane1][code];\ + dst0 = x>>8;\ + dst1 = x;\ + }else{\ + dst0 = get_vlc2(&s->gb, s->vlc[0].table, VLC_BITS, 3);\ + dst1 = get_vlc2(&s->gb, s->vlc[plane1].table, VLC_BITS, 3);\ + }\ +} + static void decode_422_bitstream(HYuvContext *s, int count){ int i; count/=2; for(i=0; i<count; i++){ - s->temp[0][2*i ]= get_vlc2(&s->gb, s->vlc[0].table, VLC_BITS, 3); - s->temp[1][ i ]= get_vlc2(&s->gb, s->vlc[1].table, VLC_BITS, 3); - s->temp[0][2*i+1]= get_vlc2(&s->gb, s->vlc[0].table, VLC_BITS, 3); - s->temp[2][ i ]= get_vlc2(&s->gb, s->vlc[2].table, VLC_BITS, 3); + READ_2PIX(s->temp[0][2*i ], s->temp[1][i], 1); + READ_2PIX(s->temp[0][2*i+1], s->temp[2][i], 2); } } @@ -672,8 +718,7 @@ count/=2; for(i=0; i<count; i++){ - s->temp[0][2*i ]= get_vlc2(&s->gb, s->vlc[0].table, VLC_BITS, 3); - s->temp[0][2*i+1]= get_vlc2(&s->gb, s->vlc[0].table, VLC_BITS, 3); + READ_2PIX(s->temp[0][2*i ], s->temp[0][2*i+1], 0); } }