Mercurial > libavcodec.hg
annotate avcodec.h @ 329:5cc47d0ba53e libavcodec
fixed ratecontrol & b-frames
2pass ratecontrol
fixed hq with 2pass
inceased build num (a few more vars for the rc stuff)
hopefully no new bugs
author | michaelni |
---|---|
date | Sun, 21 Apr 2002 21:18:17 +0000 |
parents | 025825084364 |
children | c56b45669214 |
rev | line source |
---|---|
92 | 1 #ifndef AVCODEC_H |
2 #define AVCODEC_H | |
3 | |
0 | 4 #include "common.h" |
5 | |
322 | 6 #define LIBAVCODEC_VERSION_INT 0x000406 |
7 #define LIBAVCODEC_VERSION "0.4.6" | |
329 | 8 #define LIBAVCODEC_BUILD 4601 |
9 #define LIBAVCODEC_BUILD_STR "4601" | |
322 | 10 |
0 | 11 enum CodecID { |
12 CODEC_ID_NONE, | |
13 CODEC_ID_MPEG1VIDEO, | |
14 CODEC_ID_H263, | |
15 CODEC_ID_RV10, | |
16 CODEC_ID_MP2, | |
260
e1bacfb3f51f
- Added MP3 encoding through libmp3lame contributed by Lennert Buytenhek.
pulento
parents:
252
diff
changeset
|
17 CODEC_ID_MP3LAME, |
0 | 18 CODEC_ID_AC3, |
19 CODEC_ID_MJPEG, | |
67 | 20 CODEC_ID_MPEG4, |
0 | 21 CODEC_ID_RAWVIDEO, |
307 | 22 CODEC_ID_MSMPEG4V1, |
23 CODEC_ID_MSMPEG4V2, | |
24 CODEC_ID_MSMPEG4V3, | |
311 | 25 CODEC_ID_WMV1, |
0 | 26 CODEC_ID_H263P, |
27 CODEC_ID_H263I, | |
92 | 28 |
29 /* various pcm "codecs" */ | |
30 CODEC_ID_PCM_S16LE, | |
31 CODEC_ID_PCM_S16BE, | |
32 CODEC_ID_PCM_U16LE, | |
33 CODEC_ID_PCM_U16BE, | |
34 CODEC_ID_PCM_S8, | |
35 CODEC_ID_PCM_U8, | |
36 CODEC_ID_PCM_MULAW, | |
37 CODEC_ID_PCM_ALAW, | |
0 | 38 }; |
307 | 39 #define CODEC_ID_MSMPEG4 CODEC_ID_MSMPEG4V3 |
0 | 40 |
41 enum CodecType { | |
42 CODEC_TYPE_VIDEO, | |
43 CODEC_TYPE_AUDIO, | |
44 }; | |
45 | |
46 enum PixelFormat { | |
317
5afea0021fb8
- PIX_FMT_ANY = -1 to avoid breaking any stuff that could be using it.
pulento
parents:
316
diff
changeset
|
47 PIX_FMT_ANY = -1, |
0 | 48 PIX_FMT_YUV420P, |
49 PIX_FMT_YUV422, | |
50 PIX_FMT_RGB24, | |
51 PIX_FMT_BGR24, | |
27
b8723ec6c80f
added 422P and 444P formats (need to patch ffmpeg.c so that it is handled in all the program)
glantau
parents:
24
diff
changeset
|
52 PIX_FMT_YUV422P, |
b8723ec6c80f
added 422P and 444P formats (need to patch ffmpeg.c so that it is handled in all the program)
glantau
parents:
24
diff
changeset
|
53 PIX_FMT_YUV444P, |
0 | 54 }; |
55 | |
92 | 56 /* currently unused, may be used if 24/32 bit samples are ever supported */ |
57 enum SampleFormat { | |
58 SAMPLE_FMT_S16 = 0, /* signed 16 bits */ | |
59 }; | |
60 | |
0 | 61 /* in bytes */ |
62 #define AVCODEC_MAX_AUDIO_FRAME_SIZE 18432 | |
63 | |
320
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
64 /* motion estimation type, EPZS by default */ |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
65 enum Motion_Est_ID { |
321 | 66 ME_ZERO = 1, |
320
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
67 ME_FULL, |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
68 ME_LOG, |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
69 ME_PHODS, |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
70 ME_EPZS, |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
71 ME_X1 |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
72 }; |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
73 |
321 | 74 /* only for ME compatibility with old apps */ |
75 extern int motion_estimation_method; | |
76 | |
320
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
77 /* ME algos sorted by quality */ |
322 | 78 static const int Motion_Est_QTab[] = { 1, 4, 3, 6, 5, 2 }; |
0 | 79 |
324 | 80 #define FF_MAX_B_FRAMES 4 |
81 | |
0 | 82 /* encoding support */ |
294 | 83 /* note not everything is supported yet */ |
0 | 84 |
85 #define CODEC_FLAG_HQ 0x0001 /* high quality (non real time) encoding */ | |
86 #define CODEC_FLAG_QSCALE 0x0002 /* use fixed qscale */ | |
294 | 87 #define CODEC_FLAG_4MV 0x0004 /* 4 MV per MB allowed */ |
88 #define CODEC_FLAG_QPEL 0x0010 /* use qpel MC */ | |
89 #define CODEC_FLAG_GMC 0x0020 /* use GMC */ | |
298
e20de99b6295
using Juanjo's way to pass forced type - especially as I_TYPE/P_TYPE defines aren't exported in the public interface, and the flagged method matches the way as qscale forcing work
arpi_esp
parents:
297
diff
changeset
|
90 #define CODEC_FLAG_TYPE 0x0040 /* fixed I/P frame type, from avctx->key_frame */ |
324 | 91 /* parent program guarantees that the input for b-frame containing streams is not written to |
92 for at least s->max_b_frames+1 frames, if this is not set then the input will be copied */ | |
329 | 93 #define CODEC_FLAG_INPUT_PRESERVED 0x0100 |
94 #define CODEC_FLAG_PASS1 0x0200 /* use internal 2pass ratecontrol in first pass mode */ | |
95 #define CODEC_FLAG_PASS2 0x0400 /* use internal 2pass ratecontrol in second pass mode */ | |
0 | 96 |
67 | 97 /* codec capabilities */ |
98 | |
99 /* decoder can use draw_horiz_band callback */ | |
100 #define CODEC_CAP_DRAW_HORIZ_BAND 0x0001 | |
101 | |
0 | 102 #define FRAME_RATE_BASE 10000 |
103 | |
104 typedef struct AVCodecContext { | |
105 int bit_rate; | |
268 | 106 int bit_rate_tolerance; /* amount of +- bits (>0)*/ |
0 | 107 int flags; |
108 int sub_id; /* some codecs need additional format info. It is | |
109 stored here */ | |
320
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
110 |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
111 int me_method; /* ME algorithm used for video coding */ |
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
112 |
0 | 113 /* video only */ |
114 int frame_rate; /* frames per sec multiplied by FRAME_RATE_BASE */ | |
115 int width, height; | |
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
277
diff
changeset
|
116 int aspect_ratio_info; |
282 | 117 #define FF_ASPECT_SQUARE 1 |
118 #define FF_ASPECT_4_3_625 2 | |
119 #define FF_ASPECT_4_3_525 3 | |
120 #define FF_ASPECT_16_9_625 4 | |
121 #define FF_ASPECT_16_9_525 5 | |
0 | 122 int gop_size; /* 0 = intra only */ |
315 | 123 enum PixelFormat pix_fmt; /* pixel format, see PIX_FMT_xxx */ |
67 | 124 |
125 /* if non NULL, 'draw_horiz_band' is called by the libavcodec | |
126 decoder to draw a horizontal band. It improves cache usage. Not | |
127 all codecs can do that. You must check the codec capabilities | |
128 beforehand */ | |
129 void (*draw_horiz_band)(struct AVCodecContext *s, | |
130 UINT8 **src_ptr, int linesize, | |
131 int y, int width, int height); | |
132 | |
0 | 133 /* audio only */ |
134 int sample_rate; /* samples per sec */ | |
135 int channels; | |
92 | 136 int sample_fmt; /* sample format, currently unused */ |
0 | 137 |
138 /* the following data should not be initialized */ | |
139 int frame_size; /* in samples, initialized when calling 'init' */ | |
140 int frame_number; /* audio or video frame number */ | |
141 int key_frame; /* true if the previous compressed frame was | |
142 a key frame (intra, or seekable) */ | |
143 int quality; /* quality of the previous encoded frame | |
329 | 144 (between 1 (good) and 31 (bad)) |
145 this is also used to set the quality in vbr mode | |
146 and the per frame quality in CODEC_FLAG_TYPE (second pass mode) */ | |
268 | 147 float qcompress; /* amount of qscale change between easy & hard scenes (0.0-1.0)*/ |
148 float qblur; /* amount of qscale smoothing over time (0.0-1.0) */ | |
149 int qmin; /* min qscale */ | |
150 int qmax; /* max qscale */ | |
151 int max_qdiff; /* max qscale difference between frames */ | |
324 | 152 int max_b_frames; /* maximum b frames, the output will be delayed by max_b_frames+1 relative to the input */ |
329 | 153 float b_quant_factor;/* qscale factor between ips and b frames */ |
154 int rc_strategy; | |
155 int b_frame_strategy; | |
324 | 156 |
0 | 157 struct AVCodec *codec; |
158 void *priv_data; | |
159 | |
162 | 160 /* The following data is for RTP friendly coding */ |
161 /* For now only the H.263/H.263+ coder honours this */ | |
162 int rtp_mode; /* 1 to activate RTP friendly-mode */ | |
163 /* higher numbers represent more error-prone */ | |
164 /* environments, for now just "1" exists */ | |
165 | |
166 int rtp_payload_size; /* The size of the RTP payload, the coder will */ | |
167 /* do its best to deliver a chunk with size */ | |
168 /* below rtp_payload_size, the chunk will start */ | |
169 /* with a start code on some codecs like H.263 */ | |
170 /* This doesn't take account of any particular */ | |
171 /* headers inside the transmitted RTP payload */ | |
231 | 172 |
173 | |
174 /* The RTP callback: This function is called */ | |
175 /* every time the encoder has a packet to send */ | |
176 /* Depends on the encoder if the data starts */ | |
177 /* with a Start Code (it should) H.263 does */ | |
178 void (*rtp_callback)(void *data, int size, int packet_number); | |
179 | |
252
ddb1a0e94cf4
- Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents:
231
diff
changeset
|
180 /* These are for PSNR calculation, if you set get_psnr to 1 */ |
ddb1a0e94cf4
- Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents:
231
diff
changeset
|
181 /* after encoding you will have the PSNR on psnr_y/cb/cr */ |
ddb1a0e94cf4
- Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents:
231
diff
changeset
|
182 int get_psnr; |
ddb1a0e94cf4
- Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents:
231
diff
changeset
|
183 float psnr_y; |
ddb1a0e94cf4
- Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents:
231
diff
changeset
|
184 float psnr_cb; |
ddb1a0e94cf4
- Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents:
231
diff
changeset
|
185 float psnr_cr; |
286 | 186 |
187 /* statistics, used for 2-pass encoding */ | |
188 int mv_bits; | |
189 int header_bits; | |
190 int i_tex_bits; | |
191 int p_tex_bits; | |
192 int i_count; | |
193 int p_count; | |
194 int skip_count; | |
195 int misc_bits; // cbp, mb_type | |
196 int frame_bits; | |
162 | 197 |
0 | 198 /* the following fields are ignored */ |
67 | 199 void *opaque; /* can be used to carry app specific stuff */ |
0 | 200 char codec_name[32]; |
201 int codec_type; /* see CODEC_TYPE_xxx */ | |
202 int codec_id; /* see CODEC_ID_xxx */ | |
203 unsigned int codec_tag; /* codec tag, only used if unknown codec */ | |
204 } AVCodecContext; | |
205 | |
206 typedef struct AVCodec { | |
207 char *name; | |
208 int type; | |
209 int id; | |
210 int priv_data_size; | |
211 int (*init)(AVCodecContext *); | |
212 int (*encode)(AVCodecContext *, UINT8 *buf, int buf_size, void *data); | |
213 int (*close)(AVCodecContext *); | |
214 int (*decode)(AVCodecContext *, void *outdata, int *outdata_size, | |
215 UINT8 *buf, int buf_size); | |
67 | 216 int capabilities; |
0 | 217 struct AVCodec *next; |
218 } AVCodec; | |
219 | |
220 /* three components are given, that's all */ | |
221 typedef struct AVPicture { | |
222 UINT8 *data[3]; | |
223 int linesize[3]; | |
224 } AVPicture; | |
225 | |
226 extern AVCodec ac3_encoder; | |
227 extern AVCodec mp2_encoder; | |
260
e1bacfb3f51f
- Added MP3 encoding through libmp3lame contributed by Lennert Buytenhek.
pulento
parents:
252
diff
changeset
|
228 extern AVCodec mp3lame_encoder; |
0 | 229 extern AVCodec mpeg1video_encoder; |
230 extern AVCodec h263_encoder; | |
231 extern AVCodec h263p_encoder; | |
232 extern AVCodec rv10_encoder; | |
233 extern AVCodec mjpeg_encoder; | |
67 | 234 extern AVCodec mpeg4_encoder; |
307 | 235 extern AVCodec msmpeg4v1_encoder; |
236 extern AVCodec msmpeg4v2_encoder; | |
237 extern AVCodec msmpeg4v3_encoder; | |
0 | 238 |
239 extern AVCodec h263_decoder; | |
67 | 240 extern AVCodec mpeg4_decoder; |
307 | 241 extern AVCodec msmpeg4v1_decoder; |
242 extern AVCodec msmpeg4v2_decoder; | |
243 extern AVCodec msmpeg4v3_decoder; | |
311 | 244 extern AVCodec wmv1_decoder; |
0 | 245 extern AVCodec mpeg_decoder; |
246 extern AVCodec h263i_decoder; | |
247 extern AVCodec rv10_decoder; | |
24 | 248 extern AVCodec mjpeg_decoder; |
322 | 249 extern AVCodec mp2_decoder; |
92 | 250 extern AVCodec mp3_decoder; |
0 | 251 |
92 | 252 /* pcm codecs */ |
253 #define PCM_CODEC(id, name) \ | |
254 extern AVCodec name ## _decoder; \ | |
255 extern AVCodec name ## _encoder; | |
256 | |
257 PCM_CODEC(CODEC_ID_PCM_S16LE, pcm_s16le); | |
258 PCM_CODEC(CODEC_ID_PCM_S16BE, pcm_s16be); | |
259 PCM_CODEC(CODEC_ID_PCM_U16LE, pcm_u16le); | |
260 PCM_CODEC(CODEC_ID_PCM_U16BE, pcm_u16be); | |
261 PCM_CODEC(CODEC_ID_PCM_S8, pcm_s8); | |
262 PCM_CODEC(CODEC_ID_PCM_U8, pcm_u8); | |
263 PCM_CODEC(CODEC_ID_PCM_ALAW, pcm_alaw); | |
264 PCM_CODEC(CODEC_ID_PCM_MULAW, pcm_mulaw); | |
265 | |
266 #undef PCM_CODEC | |
267 | |
268 /* dummy raw video codec */ | |
0 | 269 extern AVCodec rawvideo_codec; |
270 | |
271 /* the following codecs use external GPL libs */ | |
272 extern AVCodec ac3_decoder; | |
273 | |
274 /* resample.c */ | |
275 | |
276 struct ReSampleContext; | |
277 | |
278 typedef struct ReSampleContext ReSampleContext; | |
279 | |
280 ReSampleContext *audio_resample_init(int output_channels, int input_channels, | |
281 int output_rate, int input_rate); | |
282 int audio_resample(ReSampleContext *s, short *output, short *input, int nb_samples); | |
283 void audio_resample_close(ReSampleContext *s); | |
284 | |
285 /* YUV420 format is assumed ! */ | |
286 | |
287 struct ImgReSampleContext; | |
288 | |
289 typedef struct ImgReSampleContext ImgReSampleContext; | |
290 | |
291 ImgReSampleContext *img_resample_init(int output_width, int output_height, | |
292 int input_width, int input_height); | |
293 void img_resample(ImgReSampleContext *s, | |
294 AVPicture *output, AVPicture *input); | |
295 | |
296 void img_resample_close(ImgReSampleContext *s); | |
297 | |
49 | 298 void avpicture_fill(AVPicture *picture, UINT8 *ptr, |
299 int pix_fmt, int width, int height); | |
300 int avpicture_get_size(int pix_fmt, int width, int height); | |
301 | |
302 /* convert among pixel formats */ | |
303 int img_convert(AVPicture *dst, int dst_pix_fmt, | |
304 AVPicture *src, int pix_fmt, | |
305 int width, int height); | |
306 | |
307 /* deinterlace a picture */ | |
308 int avpicture_deinterlace(AVPicture *dst, AVPicture *src, | |
0 | 309 int pix_fmt, int width, int height); |
310 | |
311 /* external high level API */ | |
312 | |
313 extern AVCodec *first_avcodec; | |
314 | |
315 void avcodec_init(void); | |
316 | |
317 void register_avcodec(AVCodec *format); | |
318 AVCodec *avcodec_find_encoder(enum CodecID id); | |
177 | 319 AVCodec *avcodec_find_encoder_by_name(const char *name); |
0 | 320 AVCodec *avcodec_find_decoder(enum CodecID id); |
321 AVCodec *avcodec_find_decoder_by_name(const char *name); | |
322 void avcodec_string(char *buf, int buf_size, AVCodecContext *enc, int encode); | |
323 | |
324 int avcodec_open(AVCodecContext *avctx, AVCodec *codec); | |
325 int avcodec_decode_audio(AVCodecContext *avctx, INT16 *samples, | |
326 int *frame_size_ptr, | |
327 UINT8 *buf, int buf_size); | |
328 int avcodec_decode_video(AVCodecContext *avctx, AVPicture *picture, | |
329 int *got_picture_ptr, | |
330 UINT8 *buf, int buf_size); | |
331 int avcodec_encode_audio(AVCodecContext *avctx, UINT8 *buf, int buf_size, | |
332 const short *samples); | |
333 int avcodec_encode_video(AVCodecContext *avctx, UINT8 *buf, int buf_size, | |
334 const AVPicture *pict); | |
335 | |
336 int avcodec_close(AVCodecContext *avctx); | |
337 | |
338 void avcodec_register_all(void); | |
92 | 339 |
108
1e4a4af694d1
exporting qscale data for postprocessing (for MPlayer)
arpi_esp
parents:
92
diff
changeset
|
340 #ifdef FF_POSTPROCESS |
1e4a4af694d1
exporting qscale data for postprocessing (for MPlayer)
arpi_esp
parents:
92
diff
changeset
|
341 #ifndef MBC |
328
025825084364
postprocess array increased to handle images up to 2048x1536
arpi_esp
parents:
324
diff
changeset
|
342 #define MBC 128 |
025825084364
postprocess array increased to handle images up to 2048x1536
arpi_esp
parents:
324
diff
changeset
|
343 #define MBR 96 |
108
1e4a4af694d1
exporting qscale data for postprocessing (for MPlayer)
arpi_esp
parents:
92
diff
changeset
|
344 #endif |
1e4a4af694d1
exporting qscale data for postprocessing (for MPlayer)
arpi_esp
parents:
92
diff
changeset
|
345 extern int quant_store[MBR+1][MBC+1]; // [Review] |
1e4a4af694d1
exporting qscale data for postprocessing (for MPlayer)
arpi_esp
parents:
92
diff
changeset
|
346 #endif |
1e4a4af694d1
exporting qscale data for postprocessing (for MPlayer)
arpi_esp
parents:
92
diff
changeset
|
347 |
92 | 348 #endif /* AVCODEC_H */ |