Mercurial > libavcodec.hg
annotate mpegvideo.h @ 265:4e9e728021d8 libavcodec
use ac prediction in mpeg4 encoding (5% smaller intra-blocks/keyframes)
some minor optimizations
last non zero index cant be 64 bugfix
author | michaelni |
---|---|
date | Fri, 15 Mar 2002 04:10:53 +0000 |
parents | 7d941b8c4e84 |
children | 252444e5259b |
rev | line source |
---|---|
0 | 1 /* |
2 * Generic DCT based hybrid video encoder | |
3 * Copyright (c) 2000,2001 Gerard Lantau. | |
4 * | |
5 * This program is free software; you can redistribute it and/or modify | |
6 * it under the terms of the GNU General Public License as published by | |
7 * the Free Software Foundation; either version 2 of the License, or | |
8 * (at your option) any later version. | |
9 * | |
10 * This program is distributed in the hope that it will be useful, | |
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
13 * GNU General Public License for more details. | |
14 * | |
15 * You should have received a copy of the GNU General Public License | |
16 * along with this program; if not, write to the Free Software | |
17 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. | |
18 */ | |
19 | |
20 /* Macros for picture code type. */ | |
21 #define I_TYPE 1 | |
22 #define P_TYPE 2 | |
23 #define B_TYPE 3 | |
253
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
24 #define S_TYPE 4 //S(GMC)-VOP MPEG4 |
0 | 25 |
/* Bitstream output formats; the chosen value is stored in
   MpegEncContext.out_format. */
26 enum OutputFormat { | |
27 FMT_MPEG1, | |
28 FMT_H263, | |
29 FMT_MJPEG, | |
30 }; | |
31 | |
32 #define MPEG_BUF_SIZE (16 * 1024) | |
33 | |
220 | 34 #define QMAT_SHIFT_MMX 19 |
35 #define QMAT_SHIFT 25 | |
36 | |
0 | 37 typedef struct MpegEncContext { |
71 | 38 struct AVCodecContext *avctx; |
0 | 39 /* the following parameters must be initialized before encoding */ |
40 int width, height; /* picture size. must be a multiple of 16 */ | |
41 int gop_size; | |
42 int frame_rate; /* number of frames per second */ | |
43 int intra_only; /* if true, only intra pictures are generated */ | |
44 int bit_rate; /* wanted bit rate */ | |
45 enum OutputFormat out_format; /* output format */ | |
46 int h263_plus; /* h263 plus headers */ | |
47 int h263_rv10; /* use RV10 variation for H263 */ | |
71 | 48 int h263_pred; /* use mpeg4/h263 ac/dc predictions */ |
0 | 49 int h263_msmpeg4; /* generate MSMPEG4 compatible stream */ |
50 int h263_intel; /* use I263 intel h263 header */ | |
51 int fixed_qscale; /* fixed qscale if non zero */ | |
7
1d3ac9654178
added skip macroblock optimization (big perf win on black regions for example)
glantau
parents:
0
diff
changeset
|
52 int encoding; /* true if we are encoding (vs decoding) */ |
0 | 53 /* the following fields are managed internally by the encoder */ |
54 | |
55 /* bit output */ | |
56 PutBitContext pb; | |
57 | |
58 /* sequence parameters */ | |
59 int context_initialized; | |
60 int picture_number; | |
61 int fake_picture_number; /* picture number at the bitstream frame rate */ | |
233
3f5b72726118
- More work on preliminary bit rate control, just to be able to get an
pulento
parents:
232
diff
changeset
|
62 int gop_picture_number; /* index of the first picture of a GOP */ |
0 | 63 int mb_width, mb_height; |
233
3f5b72726118
- More work on preliminary bit rate control, just to be able to get an
pulento
parents:
232
diff
changeset
|
64 int mb_num; /* number of MBs of a picture */ |
0 | 65 int linesize; /* line size, in bytes, may be different from width */ |
66 UINT8 *new_picture[3]; /* picture to be compressed */ | |
67 UINT8 *last_picture[3]; /* previous picture */ | |
68 UINT8 *last_picture_base[3]; /* real start of the picture */ | |
69 UINT8 *next_picture[3]; /* previous picture (for bidir pred) */ | |
70 UINT8 *next_picture_base[3]; /* real start of the picture */ | |
71 UINT8 *aux_picture[3]; /* aux picture (for B frames only) */ | |
72 UINT8 *aux_picture_base[3]; /* real start of the picture */ | |
73 UINT8 *current_picture[3]; /* buffer to store the decompressed current picture */ | |
74 int last_dc[3]; /* last DC values for MPEG1 */ | |
75 INT16 *dc_val[3]; /* used for mpeg4 DC prediction */ | |
76 int y_dc_scale, c_dc_scale; | |
77 UINT8 *coded_block; /* used for coded block pattern prediction */ | |
78 INT16 (*ac_val[3])[16]; /* used for mpeg4 AC prediction */ | |
79 int ac_pred; | |
7
1d3ac9654178
added skip macroblock optimization (big perf win on black regions for example)
glantau
parents:
0
diff
changeset
|
80 int mb_skiped; /* MUST BE SET only during DECODING */ |
1d3ac9654178
added skip macroblock optimization (big perf win on black regions for example)
glantau
parents:
0
diff
changeset
|
81 UINT8 *mbskip_table; /* used to avoid copy if macroblock |
1d3ac9654178
added skip macroblock optimization (big perf win on black regions for example)
glantau
parents:
0
diff
changeset
|
82 skipped (for black regions for example) */ |
191
883f184537e6
AC table reset (memset) optimization - patch by Michael Niedermayer <michaelni@gmx.at>
uid46427
parents:
162
diff
changeset
|
83 UINT8 *mbintra_table; /* used to kill a few memsets */ |
0 | 84 |
85 int qscale; | |
86 int pict_type; | |
262 | 87 int last_non_b_pict_type; /* used for mpeg4 gmc b-frames */ |
0 | 88 int frame_rate_index; |
89 /* motion compensation */ | |
90 int unrestricted_mv; | |
91 int h263_long_vectors; /* use horrible h263v1 long vector mode */ | |
92 | |
93 int f_code; /* resolution */ | |
262 | 94 int b_code; /* backward resolution for B Frames (mpeg4) */ |
95 INT16 *mv_table[2]; /* MV table (1MV per MB)*/ | |
96 INT16 (*motion_val)[2]; /* used for MV prediction (4MV per MB)*/ | |
0 | 97 int full_search; |
98 int mv_dir; | |
99 #define MV_DIR_BACKWARD 1 | |
100 #define MV_DIR_FORWARD 2 | |
262 | 101 #define MV_DIRECT 4 // bidirectional mode where the difference equals the MV of the last P/S/I-Frame (mpeg4) |
0 | 102 int mv_type; |
103 #define MV_TYPE_16X16 0 /* 1 vector for the whole mb */ | |
104 #define MV_TYPE_8X8 1 /* 4 vectors (h263) */ | |
105 #define MV_TYPE_16X8 2 /* 2 vectors, one per 16x8 block */ | |
106 #define MV_TYPE_FIELD 3 /* 2 vectors, one per field */ | |
107 #define MV_TYPE_DMV 4 /* 2 vectors, special mpeg2 Dual Prime Vectors */ | |
108 /* motion vectors for a macroblock | |
109 first coordinate : 0 = forward 1 = backward | |
110 second " : depend on type | |
111 third " : 0 = x, 1 = y | |
112 */ | |
113 int mv[2][4][2]; | |
114 int field_select[2][2]; | |
115 int last_mv[2][2][2]; | |
116 | |
117 int has_b_frames; | |
118 int no_rounding; /* apply no rounding to motion estimation (MPEG4) */ | |
119 | |
120 /* macroblock layer */ | |
121 int mb_x, mb_y; | |
122 int mb_incr; | |
123 int mb_intra; | |
239 | 124 INT16 *mb_var; /* Table for MB variances */ |
232
b640ec5948b0
- Now the ME is done for the entire picture when enconding, the
pulento
parents:
231
diff
changeset
|
125 char *mb_type; /* Table for MB type */ |
b640ec5948b0
- Now the ME is done for the entire picture when enconding, the
pulento
parents:
231
diff
changeset
|
126 |
0 | 127 /* matrix transmitted in the bitstream */ |
128 UINT16 intra_matrix[64]; | |
129 UINT16 chroma_intra_matrix[64]; | |
130 UINT16 non_intra_matrix[64]; | |
131 UINT16 chroma_non_intra_matrix[64]; | |
132 /* precomputed matrix (combine qscale and DCT renorm) */ | |
133 int q_intra_matrix[64]; | |
134 int q_non_intra_matrix[64]; | |
220 | 135 /* identical to the above, but for MMX; these are not permuted */ |
136 UINT16 __align8 q_intra_matrix16[64] ; | |
137 UINT16 __align8 q_non_intra_matrix16[64]; | |
0 | 138 int block_last_index[6]; /* last non zero coefficient in block */ |
139 | |
140 void *opaque; /* private data for the user */ | |
141 | |
142 /* bit rate control */ | |
143 int I_frame_bits; /* wanted number of bits per I frame */ | |
144 int P_frame_bits; /* same for P frame */ | |
233
3f5b72726118
- More work on preliminary bit rate control, just to be able to get an
pulento
parents:
232
diff
changeset
|
145 int avg_mb_var; /* average MB variance for current frame */ |
64 | 146 INT64 wanted_bits; |
147 INT64 total_bits; | |
265
4e9e728021d8
use ac prediction in mpeg4 encoding (5% smaller intra-blocks/keyframes)
michaelni
parents:
262
diff
changeset
|
148 |
154
f914f710b8d0
- Fixed a bug on H.263 MV prediction for MB on GOBs limits.
pulento
parents:
151
diff
changeset
|
149 /* H.263 specific */ |
f914f710b8d0
- Fixed a bug on H.263 MV prediction for MB on GOBs limits.
pulento
parents:
151
diff
changeset
|
150 int gob_number; |
162 | 151 int gob_index; |
154
f914f710b8d0
- Fixed a bug on H.263 MV prediction for MB on GOBs limits.
pulento
parents:
151
diff
changeset
|
152 int first_gob_line; |
248
56ee684c48bb
- H.263+ decoder support for Advanded INTRA Coding (buggy)
pulento
parents:
243
diff
changeset
|
153 |
79
82e579c37bc3
Moved some H.263+ variables to MpegEncContext to be thread-safe.
pulento
parents:
71
diff
changeset
|
154 /* H.263+ specific */ |
82e579c37bc3
Moved some H.263+ variables to MpegEncContext to be thread-safe.
pulento
parents:
71
diff
changeset
|
155 int umvplus; |
82e579c37bc3
Moved some H.263+ variables to MpegEncContext to be thread-safe.
pulento
parents:
71
diff
changeset
|
156 int umvplus_dec; |
248
56ee684c48bb
- H.263+ decoder support for Advanded INTRA Coding (buggy)
pulento
parents:
243
diff
changeset
|
157 int h263_aic; /* Advanced INTRA Coding (AIC) */ |
56ee684c48bb
- H.263+ decoder support for Advanded INTRA Coding (buggy)
pulento
parents:
243
diff
changeset
|
158 int h263_aic_dir; /* AIC direction: 0 = left, 1 = top */ |
79
82e579c37bc3
Moved some H.263+ variables to MpegEncContext to be thread-safe.
pulento
parents:
71
diff
changeset
|
159 |
0 | 160 /* mpeg4 specific */ |
262 | 161 int time_increment_resolution; |
0 | 162 int time_increment_bits; |
262 | 163 int time_increment; |
164 int time_base; | |
165 int time; | |
166 int last_non_b_time[2]; | |
64 | 167 int shape; |
168 int vol_sprite_usage; | |
253
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
169 int sprite_width; |
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
170 int sprite_height; |
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
171 int sprite_left; |
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
172 int sprite_top; |
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
173 int sprite_brightness_change; |
254
b4fed8b24e3a
gmc bitstream decoding support (the real motion compensation isnt implemnted yet)
michaelni
parents:
253
diff
changeset
|
174 int num_sprite_warping_points; |
255 | 175 int real_sprite_warping_points; |
254
b4fed8b24e3a
gmc bitstream decoding support (the real motion compensation isnt implemnted yet)
michaelni
parents:
253
diff
changeset
|
176 int sprite_offset[2][2]; |
b4fed8b24e3a
gmc bitstream decoding support (the real motion compensation isnt implemnted yet)
michaelni
parents:
253
diff
changeset
|
177 int sprite_delta[2][2][2]; |
b4fed8b24e3a
gmc bitstream decoding support (the real motion compensation isnt implemnted yet)
michaelni
parents:
253
diff
changeset
|
178 int sprite_shift[2][2]; |
b4fed8b24e3a
gmc bitstream decoding support (the real motion compensation isnt implemnted yet)
michaelni
parents:
253
diff
changeset
|
179 int mcsel; |
64 | 180 int quant_precision; |
253
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
181 int quarter_sample; |
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
182 int scalability; |
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
183 int new_pred; |
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
184 int reduced_res_vop; |
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
185 int aspect_ratio_info; |
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
186 int sprite_warping_accuracy; |
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
187 int low_latency_sprite; |
4448dd55d415
parsing more of the mpeg4 header & print some "not supported" stuff
michaelni
parents:
248
diff
changeset
|
188 int data_partioning; |
255 | 189 |
190 /* divx specific, used to workaround (many) bugs in divx5 */ | |
191 int divx_version; | |
192 int divx_build; | |
193 | |
0 | 194 /* RV10 specific */ |
195 int rv10_version; /* RV10 version: 0 or 3 */ | |
196 int rv10_first_dc_coded[3]; | |
197 | |
198 /* MJPEG specific */ | |
199 struct MJpegContext *mjpeg_ctx; | |
229 | 200 int mjpeg_vsample[3]; /* vertical sampling factors, default = {2, 1, 1} */ |
201 int mjpeg_hsample[3]; /* horizontal sampling factors, default = {2, 1, 1} */ | |
202 int mjpeg_write_tables; /* do we want to have quantisation- and | |
203 huffmantables in the jpeg file ? */ | |
0 | 204 |
205 /* MSMPEG4 specific */ | |
206 int mv_table_index; | |
207 int rl_table_index; | |
208 int rl_chroma_table_index; | |
209 int dc_table_index; | |
210 int use_skip_mb_code; | |
211 int slice_height; /* in macroblocks */ | |
212 int first_slice_line; | |
208 | 213 int flipflop_rounding; |
214 int bitrate; | |
0 | 215 /* decompression specific */ |
216 GetBitContext gb; | |
217 | |
218 /* MPEG2 specific - I wish I had not to support this mess. */ | |
219 int progressive_sequence; | |
220 int mpeg_f_code[2][2]; | |
221 int picture_structure; | |
222 /* picture type */ | |
223 #define PICT_TOP_FIELD 1 | |
224 #define PICT_BOTTOM_FIELD 2 | |
225 #define PICT_FRAME 3 | |
226 | |
227 int intra_dc_precision; | |
228 int frame_pred_frame_dct; | |
229 int top_field_first; | |
230 int concealment_motion_vectors; | |
231 int q_scale_type; | |
232 int intra_vlc_format; | |
233 int alternate_scan; | |
234 int repeat_first_field; | |
235 int chroma_420_type; | |
236 int progressive_frame; | |
237 int mpeg2; | |
238 int full_pel[2]; | |
239 int interlaced_dct; | |
240 int last_qscale; | |
241 int first_slice; | |
162 | 242 |
243 /* RTP specific */ | |
231 | 244 /* These are explained in avcodec.h */ |
162 | 245 int rtp_mode; |
246 int rtp_payload_size; | |
231 | 247 void (*rtp_callback)(void *data, int size, int packet_number); |
162 | 248 UINT8 *ptr_lastgob; |
249 UINT8 *ptr_last_mb_line; | |
250 UINT32 mb_line_avgsize; | |
251 | |
13
174ef88f619a
use block[] in structure to have it aligned on 8 bytes for mmx optimizations - dct_unquantize is always a function pointer - added specialized dct_unquantize_h263
glantau
parents:
7
diff
changeset
|
252 DCTELEM block[6][64] __align8; |
174ef88f619a
use block[] in structure to have it aligned on 8 bytes for mmx optimizations - dct_unquantize is always a function pointer - added specialized dct_unquantize_h263
glantau
parents:
7
diff
changeset
|
253 void (*dct_unquantize)(struct MpegEncContext *s, |
174ef88f619a
use block[] in structure to have it aligned on 8 bytes for mmx optimizations - dct_unquantize is always a function pointer - added specialized dct_unquantize_h263
glantau
parents:
7
diff
changeset
|
254 DCTELEM *block, int n, int qscale); |
0 | 255 } MpegEncContext; |
256 | |
257 int MPV_common_init(MpegEncContext *s); | |
258 void MPV_common_end(MpegEncContext *s); | |
259 void MPV_decode_mb(MpegEncContext *s, DCTELEM block[6][64]); | |
260 void MPV_frame_start(MpegEncContext *s); | |
261 void MPV_frame_end(MpegEncContext *s); | |
13
174ef88f619a
use block[] in structure to have it aligned on 8 bytes for mmx optimizations - dct_unquantize is always a function pointer - added specialized dct_unquantize_h263
glantau
parents:
7
diff
changeset
|
262 #ifdef HAVE_MMX |
174ef88f619a
use block[] in structure to have it aligned on 8 bytes for mmx optimizations - dct_unquantize is always a function pointer - added specialized dct_unquantize_h263
glantau
parents:
7
diff
changeset
|
263 void MPV_common_init_mmx(MpegEncContext *s); |
174ef88f619a
use block[] in structure to have it aligned on 8 bytes for mmx optimizations - dct_unquantize is always a function pointer - added specialized dct_unquantize_h263
glantau
parents:
7
diff
changeset
|
264 #endif |
0 | 265 |
266 /* motion_est.c */ | |
267 | |
268 int estimate_motion(MpegEncContext *s, | |
269 int mb_x, int mb_y, | |
270 int *mx_ptr, int *my_ptr); | |
271 | |
272 /* mpeg12.c */ | |
41 | 273 extern INT16 default_intra_matrix[64]; |
274 extern INT16 default_non_intra_matrix[64]; | |
0 | 275 |
276 void mpeg1_encode_picture_header(MpegEncContext *s, int picture_number); | |
277 void mpeg1_encode_mb(MpegEncContext *s, | |
278 DCTELEM block[6][64], | |
279 int motion_x, int motion_y); | |
280 | |
281 /* h263enc.c */ | |
282 | |
283 /* run length table */ | |
284 #define MAX_RUN 64 | |
285 #define MAX_LEVEL 64 | |
286 | |
/* Run-length table descriptor. It is passed to init_rl() and init_vlc_rl()
   and is looked up through get_rl_index(). */
287 typedef struct RLTable { | |
288 int n; /* number of entries of table_vlc minus 1; also the value get_rl_index() returns when no entry matches */ | |
289 int last; /* number of values for last = 0 */ | |
290 const UINT16 (*table_vlc)[2]; /* pairs of UINT16; NOTE(review): presumably {code, length} - confirm */ | |
291 const INT8 *table_run; | |
292 const INT8 *table_level; | |
293 UINT8 *index_run[2]; /* encoding only; index_run[last][run] is the index get_rl_index() uses for level 1 */ | |
294 INT8 *max_level[2]; /* encoding & decoding; max_level[last][run] is the largest level get_rl_index() maps to an entry */ | |
295 INT8 *max_run[2]; /* encoding & decoding */ | |
296 VLC vlc; /* decoding only */ | |
297 } RLTable; | |
298 | |
299 void init_rl(RLTable *rl); | |
300 void init_vlc_rl(RLTable *rl); | |
301 | |
243 | 302 static inline int get_rl_index(const RLTable *rl, int last, int run, int level) |
0 | 303 { |
304 int index; | |
305 index = rl->index_run[last][run]; | |
306 if (index >= rl->n) | |
307 return rl->n; | |
308 if (level > rl->max_level[last][run]) | |
309 return rl->n; | |
310 return index + level - 1; | |
311 } | |
312 | |
313 void h263_encode_mb(MpegEncContext *s, | |
314 DCTELEM block[6][64], | |
315 int motion_x, int motion_y); | |
265
4e9e728021d8
use ac prediction in mpeg4 encoding (5% smaller intra-blocks/keyframes)
michaelni
parents:
262
diff
changeset
|
316 void mpeg4_encode_mb(MpegEncContext *s, |
4e9e728021d8
use ac prediction in mpeg4 encoding (5% smaller intra-blocks/keyframes)
michaelni
parents:
262
diff
changeset
|
317 DCTELEM block[6][64], |
4e9e728021d8
use ac prediction in mpeg4 encoding (5% smaller intra-blocks/keyframes)
michaelni
parents:
262
diff
changeset
|
318 int motion_x, int motion_y); |
0 | 319 void h263_encode_picture_header(MpegEncContext *s, int picture_number); |
162 | 320 int h263_encode_gob_header(MpegEncContext * s, int mb_line); |
0 | 321 void h263_dc_scale(MpegEncContext *s); |
322 INT16 *h263_pred_motion(MpegEncContext * s, int block, | |
323 int *px, int *py); | |
324 void mpeg4_pred_ac(MpegEncContext * s, INT16 *block, int n, | |
325 int dir); | |
326 void mpeg4_encode_picture_header(MpegEncContext *s, int picture_number); | |
327 void h263_encode_init_vlc(MpegEncContext *s); | |
328 | |
329 void h263_decode_init_vlc(MpegEncContext *s); | |
330 int h263_decode_picture_header(MpegEncContext *s); | |
162 | 331 int h263_decode_gob_header(MpegEncContext *s); |
0 | 332 int mpeg4_decode_picture_header(MpegEncContext * s); |
333 int intel_h263_decode_picture_header(MpegEncContext *s); | |
334 int h263_decode_mb(MpegEncContext *s, | |
335 DCTELEM block[6][64]); | |
336 int h263_get_picture_format(int width, int height); | |
337 | |
338 /* rv10.c */ | |
339 void rv10_encode_picture_header(MpegEncContext *s, int picture_number); | |
340 int rv_decode_dc(MpegEncContext *s, int n); | |
341 | |
342 /* msmpeg4.c */ | |
343 void msmpeg4_encode_picture_header(MpegEncContext * s, int picture_number); | |
208 | 344 void msmpeg4_encode_ext_header(MpegEncContext * s); |
0 | 345 void msmpeg4_encode_mb(MpegEncContext * s, |
346 DCTELEM block[6][64], | |
347 int motion_x, int motion_y); | |
348 void msmpeg4_dc_scale(MpegEncContext * s); | |
349 int msmpeg4_decode_picture_header(MpegEncContext * s); | |
208 | 350 int msmpeg4_decode_ext_header(MpegEncContext * s, int buf_size); |
0 | 351 int msmpeg4_decode_mb(MpegEncContext *s, |
352 DCTELEM block[6][64]); | |
353 int msmpeg4_decode_init_vlc(MpegEncContext *s); | |
354 | |
355 /* mjpegenc.c */ | |
356 | |
357 int mjpeg_init(MpegEncContext *s); | |
358 void mjpeg_close(MpegEncContext *s); | |
359 void mjpeg_encode_mb(MpegEncContext *s, | |
360 DCTELEM block[6][64]); | |
361 void mjpeg_picture_header(MpegEncContext *s); | |
362 void mjpeg_picture_trailer(MpegEncContext *s); |