Mercurial > libavcodec.hg
annotate avcodec.h @ 324:9c6f056f0e41 libavcodec
fixed mpeg4 time stuff on encoding
mpeg4 b-frame encoding support
removed old, out-commented ratecontrol
reuse motion compensation code between encoding & decoding
prefix newly added global functions with ff_ to reduce namespace pollution
b-frame ME (unfinished, but working)
added some comments to mpegvideo.h
do MC on encoding only once if possible
bugs? ;)
| author | michaelni |
|---|---|
| date | Wed, 17 Apr 2002 04:32:12 +0000 |
| parents | ce35fd27bbb0 |
| children | 025825084364 |
| rev | line source |
|---|---|
| 92 | 1 #ifndef AVCODEC_H |
| 2 #define AVCODEC_H | |
| 3 | |
| 0 | 4 #include "common.h" |
| 5 | |
| 322 | 6 #define LIBAVCODEC_VERSION_INT 0x000406 |
| 7 #define LIBAVCODEC_VERSION "0.4.6" | |
| 8 #define LIBAVCODEC_BUILD 4600 | |
| 9 #define LIBAVCODEC_BUILD_STR "4600" | |
| 10 | |
| 0 | 11 enum CodecID { |
| 12 CODEC_ID_NONE, | |
| 13 CODEC_ID_MPEG1VIDEO, | |
| 14 CODEC_ID_H263, | |
| 15 CODEC_ID_RV10, | |
| 16 CODEC_ID_MP2, | |
|
260
e1bacfb3f51f
- Added MP3 encoding through libmp3lame contributed by Lennert Buytenhek.
pulento
parents:
252
diff
changeset
|
17 CODEC_ID_MP3LAME, |
| 0 | 18 CODEC_ID_AC3, |
| 19 CODEC_ID_MJPEG, | |
| 67 | 20 CODEC_ID_MPEG4, |
| 0 | 21 CODEC_ID_RAWVIDEO, |
| 307 | 22 CODEC_ID_MSMPEG4V1, |
| 23 CODEC_ID_MSMPEG4V2, | |
| 24 CODEC_ID_MSMPEG4V3, | |
| 311 | 25 CODEC_ID_WMV1, |
| 0 | 26 CODEC_ID_H263P, |
| 27 CODEC_ID_H263I, | |
| 92 | 28 |
| 29 /* various pcm "codecs" */ | |
| 30 CODEC_ID_PCM_S16LE, | |
| 31 CODEC_ID_PCM_S16BE, | |
| 32 CODEC_ID_PCM_U16LE, | |
| 33 CODEC_ID_PCM_U16BE, | |
| 34 CODEC_ID_PCM_S8, | |
| 35 CODEC_ID_PCM_U8, | |
| 36 CODEC_ID_PCM_MULAW, | |
| 37 CODEC_ID_PCM_ALAW, | |
| 0 | 38 }; |
| 307 | 39 #define CODEC_ID_MSMPEG4 CODEC_ID_MSMPEG4V3 |
| 0 | 40 |
| 41 enum CodecType { | |
| 42 CODEC_TYPE_VIDEO, | |
| 43 CODEC_TYPE_AUDIO, | |
| 44 }; | |
| 45 | |
| 46 enum PixelFormat { | |
|
317
5afea0021fb8
- PIX_FMT_ANY = -1 to avoid breaking any stuff that could be using it.
pulento
parents:
316
diff
changeset
|
47 PIX_FMT_ANY = -1, |
| 0 | 48 PIX_FMT_YUV420P, |
| 49 PIX_FMT_YUV422, | |
| 50 PIX_FMT_RGB24, | |
| 51 PIX_FMT_BGR24, | |
|
27
b8723ec6c80f
added 422P and 444P formats (need to patch ffmpeg.c so that it is handled in all the program)
glantau
parents:
24
diff
changeset
|
52 PIX_FMT_YUV422P, |
|
b8723ec6c80f
added 422P and 444P formats (need to patch ffmpeg.c so that it is handled in all the program)
glantau
parents:
24
diff
changeset
|
53 PIX_FMT_YUV444P, |
| 0 | 54 }; |
| 55 | |
| 92 | 56 /* currently unused, may be used if 24/32 bits samples ever supported */ |
| 57 enum SampleFormat { | |
| 58 SAMPLE_FMT_S16 = 0, /* signed 16 bits */ | |
| 59 }; | |
| 60 | |
| 0 | 61 /* in bytes */ |
| 62 #define AVCODEC_MAX_AUDIO_FRAME_SIZE 18432 | |
| 63 | |
|
320
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
64 /* motion estimation type, EPZS by default */ |
|
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
65 enum Motion_Est_ID { |
| 321 | 66 ME_ZERO = 1, |
|
320
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
67 ME_FULL, |
|
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
68 ME_LOG, |
|
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
69 ME_PHODS, |
|
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
70 ME_EPZS, |
|
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
71 ME_X1 |
|
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
72 }; |
|
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
73 |
| 321 | 74 /* only for ME compatibility with old apps */ |
| 75 extern int motion_estimation_method; | |
| 76 | |
|
320
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
77 /* ME algos sorted by quality */ |
| 322 | 78 static const int Motion_Est_QTab[] = { 1, 4, 3, 6, 5, 2 }; |
| 0 | 79 |
| 324 | 80 #define FF_MAX_B_FRAMES 4 |
| 81 | |
| 0 | 82 /* encoding support */ |
| 294 | 83 /* note not everything is supported yet */ |
| 0 | 84 |
| 85 #define CODEC_FLAG_HQ 0x0001 /* high quality (non real time) encoding */ | |
| 86 #define CODEC_FLAG_QSCALE 0x0002 /* use fixed qscale */ | |
| 294 | 87 #define CODEC_FLAG_4MV 0x0004 /* 4 MV per MB allowed */ |
| 88 #define CODEC_FLAG_QPEL 0x0010 /* use qpel MC */ | |
| 89 #define CODEC_FLAG_GMC 0x0020 /* use GMC */ | |
|
298
e20de99b6295
using Juanjo's way to pass forced type - especially as I_TYPE/P_TYPE defines aren't exported in the public interface, and the flagged method matches the way as qscale forcing work
arpi_esp
parents:
297
diff
changeset
|
90 #define CODEC_FLAG_TYPE 0x0040 /* fixed I/P frame type, from avctx->key_frame */ |
| 324 | 91 /* parent program guarantees that the input for b-frame containing streams is not written to
| 92 for at least s->max_b_frames+1 frames, if this is not set then the input will be copied */ | |
| 93 #define CODEC_FLAG_INPUT_PRESERVED 0x0100 | |
| 0 | 94 |
| 67 | 95 /* codec capabilities */ |
| 96 | |
| 97 /* decoder can use draw_horiz_band callback */ | |
| 98 #define CODEC_CAP_DRAW_HORIZ_BAND 0x0001 | |
| 99 | |
| 0 | 100 #define FRAME_RATE_BASE 10000 |
| 101 | |
| 102 typedef struct AVCodecContext { | |
| 103 int bit_rate; | |
| 268 | 104 int bit_rate_tolerance; /* amount of +- bits (>0)*/ |
| 0 | 105 int flags; |
| 106 int sub_id; /* some codecs need additional format info. It is | |
| 107 stored there */ | |
|
320
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
108 |
|
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
109 int me_method; /* ME algorithm used for video coding */ |
|
cda7d0857baf
- ME setting moved to AVCodecContext/MpegEncContext, no longer a global.
pulento
parents:
317
diff
changeset
|
110 |
| 0 | 111 /* video only */ |
| 112 int frame_rate; /* frames per sec multiplied by FRAME_RATE_BASE */ | |
| 113 int width, height; | |
|
281
1fc96b02142e
mpeg4 aspect_ratio_info in AVCodecContext (requested by alex)
michaelni
parents:
277
diff
changeset
|
114 int aspect_ratio_info; |
| 282 | 115 #define FF_ASPECT_SQUARE 1 |
| 116 #define FF_ASPECT_4_3_625 2 | |
| 117 #define FF_ASPECT_4_3_525 3 | |
| 118 #define FF_ASPECT_16_9_625 4 | |
| 119 #define FF_ASPECT_16_9_525 5 | |
| 0 | 120 int gop_size; /* 0 = intra only */ |
| 315 | 121 enum PixelFormat pix_fmt; /* pixel format, see PIX_FMT_xxx */ |
| 67 | 122 |
| 123 /* if non NULL, 'draw_horiz_band' is called by the libavcodec | |
| 124 decoder to draw a horizontal band. It improves cache usage. Not | |
| 125 all codecs can do that. You must check the codec capabilities | |
| 126 before */ | |
| 127 void (*draw_horiz_band)(struct AVCodecContext *s, | |
| 128 UINT8 **src_ptr, int linesize, | |
| 129 int y, int width, int height); | |
| 130 | |
| 0 | 131 /* audio only */ |
| 132 int sample_rate; /* samples per sec */ | |
| 133 int channels; | |
| 92 | 134 int sample_fmt; /* sample format, currently unused */ |
| 0 | 135 |
| 136 /* the following data should not be initialized */ | |
| 137 int frame_size; /* in samples, initialized when calling 'init' */ | |
| 138 int frame_number; /* audio or video frame number */ | |
| 139 int key_frame; /* true if the previous compressed frame was | |
| 140 a key frame (intra, or seekable) */ | |
| 141 int quality; /* quality of the previous encoded frame | |
| 142 (between 1 (good) and 31 (bad)) */ | |
| 268 | 143 float qcompress; /* amount of qscale change between easy & hard scenes (0.0-1.0)*/ |
| 144 float qblur; /* amount of qscale smoothing over time (0.0-1.0) */ | |
| 145 int qmin; /* min qscale */ | |
| 146 int qmax; /* max qscale */ | |
| 147 int max_qdiff; /* max qscale difference between frames */ | |
| 324 | 148 int max_b_frames; /* maximum b frames, the output will be delayed by max_b_frames+1 relative to the input */ |
| 149 | |
| 0 | 150 struct AVCodec *codec; |
| 151 void *priv_data; | |
| 152 | |
| 162 | 153 /* The following data is for RTP friendly coding */ |
| 154 /* By now only H.263/H.263+ coder honours this */ | |
| 155 int rtp_mode; /* 1 for activate RTP friendly-mode */ | |
| 156 /* higher numbers represent more error-prone */ | |
| 157 /* environments, by now just "1" exists */ | |
| 158 | |
| 159 int rtp_payload_size; /* The size of the RTP payload, the coder will */ | |
| 160 /* do its best to deliver a chunk with size */ | |
| 161 /* below rtp_payload_size, the chunk will start */ | |
| 162 /* with a start code on some codecs like H.263 */ | |
| 163 /* This doesn't take account of any particular */ | |
| 164 /* headers inside the transmitted RTP payload */ | |
| 231 | 165 |
| 166 | |
| 167 /* The RTP callback: This function is called */ | |
| 168 /* every time the encoder has a packet to send */ | |
| 169 /* Depends on the encoder if the data starts */ | |
| 170 /* with a Start Code (it should) H.263 does */ | |
| 171 void (*rtp_callback)(void *data, int size, int packet_number); | |
| 172 | |
|
252
ddb1a0e94cf4
- Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents:
231
diff
changeset
|
173 /* These are for PSNR calculation, if you set get_psnr to 1 */ |
|
ddb1a0e94cf4
- Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents:
231
diff
changeset
|
174 /* after encoding you will have the PSNR on psnr_y/cb/cr */ |
|
ddb1a0e94cf4
- Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents:
231
diff
changeset
|
175 int get_psnr; |
|
ddb1a0e94cf4
- Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents:
231
diff
changeset
|
176 float psnr_y; |
|
ddb1a0e94cf4
- Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents:
231
diff
changeset
|
177 float psnr_cb; |
|
ddb1a0e94cf4
- Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents:
231
diff
changeset
|
178 float psnr_cr; |
| 286 | 179 |
| 180 /* statistics, used for 2-pass encoding */ | |
| 181 int mv_bits; | |
| 182 int header_bits; | |
| 183 int i_tex_bits; | |
| 184 int p_tex_bits; | |
| 185 int i_count; | |
| 186 int p_count; | |
| 187 int skip_count; | |
| 188 int misc_bits; // cbp, mb_type | |
| 189 int frame_bits; | |
| 162 | 190 |
| 0 | 191 /* the following fields are ignored */ |
| 67 | 192 void *opaque; /* can be used to carry app specific stuff */ |
| 0 | 193 char codec_name[32]; |
| 194 int codec_type; /* see CODEC_TYPE_xxx */ | |
| 195 int codec_id; /* see CODEC_ID_xxx */ | |
| 196 unsigned int codec_tag; /* codec tag, only used if unknown codec */ | |
| 197 } AVCodecContext; | |
| 198 | |
| 199 typedef struct AVCodec { | |
| 200 char *name; | |
| 201 int type; | |
| 202 int id; | |
| 203 int priv_data_size; | |
| 204 int (*init)(AVCodecContext *); | |
| 205 int (*encode)(AVCodecContext *, UINT8 *buf, int buf_size, void *data); | |
| 206 int (*close)(AVCodecContext *); | |
| 207 int (*decode)(AVCodecContext *, void *outdata, int *outdata_size, | |
| 208 UINT8 *buf, int buf_size); | |
| 67 | 209 int capabilities; |
| 0 | 210 struct AVCodec *next; |
| 211 } AVCodec; | |
| 212 | |
| 213 /* three components are given, that's all */ | |
| 214 typedef struct AVPicture { | |
| 215 UINT8 *data[3]; | |
| 216 int linesize[3]; | |
| 217 } AVPicture; | |
| 218 | |
| 219 extern AVCodec ac3_encoder; | |
| 220 extern AVCodec mp2_encoder; | |
|
260
e1bacfb3f51f
- Added MP3 encoding through libmp3lame contributed by Lennert Buytenhek.
pulento
parents:
252
diff
changeset
|
221 extern AVCodec mp3lame_encoder; |
| 0 | 222 extern AVCodec mpeg1video_encoder; |
| 223 extern AVCodec h263_encoder; | |
| 224 extern AVCodec h263p_encoder; | |
| 225 extern AVCodec rv10_encoder; | |
| 226 extern AVCodec mjpeg_encoder; | |
| 67 | 227 extern AVCodec mpeg4_encoder; |
| 307 | 228 extern AVCodec msmpeg4v1_encoder; |
| 229 extern AVCodec msmpeg4v2_encoder; | |
| 230 extern AVCodec msmpeg4v3_encoder; | |
| 0 | 231 |
| 232 extern AVCodec h263_decoder; | |
| 67 | 233 extern AVCodec mpeg4_decoder; |
| 307 | 234 extern AVCodec msmpeg4v1_decoder; |
| 235 extern AVCodec msmpeg4v2_decoder; | |
| 236 extern AVCodec msmpeg4v3_decoder; | |
| 311 | 237 extern AVCodec wmv1_decoder; |
| 0 | 238 extern AVCodec mpeg_decoder; |
| 239 extern AVCodec h263i_decoder; | |
| 240 extern AVCodec rv10_decoder; | |
| 24 | 241 extern AVCodec mjpeg_decoder; |
| 322 | 242 extern AVCodec mp2_decoder; |
| 92 | 243 extern AVCodec mp3_decoder; |
| 0 | 244 |
| 92 | 245 /* pcm codecs */ |
| 246 #define PCM_CODEC(id, name) \ | |
| 247 extern AVCodec name ## _decoder; \ | |
| 248 extern AVCodec name ## _encoder; | |
| 249 | |
| 250 PCM_CODEC(CODEC_ID_PCM_S16LE, pcm_s16le); | |
| 251 PCM_CODEC(CODEC_ID_PCM_S16BE, pcm_s16be); | |
| 252 PCM_CODEC(CODEC_ID_PCM_U16LE, pcm_u16le); | |
| 253 PCM_CODEC(CODEC_ID_PCM_U16BE, pcm_u16be); | |
| 254 PCM_CODEC(CODEC_ID_PCM_S8, pcm_s8); | |
| 255 PCM_CODEC(CODEC_ID_PCM_U8, pcm_u8); | |
| 256 PCM_CODEC(CODEC_ID_PCM_ALAW, pcm_alaw); | |
| 257 PCM_CODEC(CODEC_ID_PCM_MULAW, pcm_mulaw); | |
| 258 | |
| 259 #undef PCM_CODEC | |
| 260 | |
| 261 /* dummy raw video codec */ | |
| 0 | 262 extern AVCodec rawvideo_codec; |
| 263 | |
| 264 /* the following codecs use external GPL libs */ | |
| 265 extern AVCodec ac3_decoder; | |
| 266 | |
| 267 /* resample.c */ | |
| 268 | |
| 269 struct ReSampleContext; | |
| 270 | |
| 271 typedef struct ReSampleContext ReSampleContext; | |
| 272 | |
| 273 ReSampleContext *audio_resample_init(int output_channels, int input_channels, | |
| 274 int output_rate, int input_rate); | |
| 275 int audio_resample(ReSampleContext *s, short *output, short *input, int nb_samples); | |
| 276 void audio_resample_close(ReSampleContext *s); | |
| 277 | |
| 278 /* YUV420 format is assumed ! */ | |
| 279 | |
| 280 struct ImgReSampleContext; | |
| 281 | |
| 282 typedef struct ImgReSampleContext ImgReSampleContext; | |
| 283 | |
| 284 ImgReSampleContext *img_resample_init(int output_width, int output_height, | |
| 285 int input_width, int input_height); | |
| 286 void img_resample(ImgReSampleContext *s, | |
| 287 AVPicture *output, AVPicture *input); | |
| 288 | |
| 289 void img_resample_close(ImgReSampleContext *s); | |
| 290 | |
| 49 | 291 void avpicture_fill(AVPicture *picture, UINT8 *ptr, |
| 292 int pix_fmt, int width, int height); | |
| 293 int avpicture_get_size(int pix_fmt, int width, int height); | |
| 294 | |
| 295 /* convert among pixel formats */ | |
| 296 int img_convert(AVPicture *dst, int dst_pix_fmt, | |
| 297 AVPicture *src, int pix_fmt, | |
| 298 int width, int height); | |
| 299 | |
| 300 /* deinterlace a picture */ | |
| 301 int avpicture_deinterlace(AVPicture *dst, AVPicture *src, | |
| 0 | 302 int pix_fmt, int width, int height); |
| 303 | |
| 304 /* external high level API */ | |
| 305 | |
| 306 extern AVCodec *first_avcodec; | |
| 307 | |
| 308 void avcodec_init(void); | |
| 309 | |
| 310 void register_avcodec(AVCodec *format); | |
| 311 AVCodec *avcodec_find_encoder(enum CodecID id); | |
| 177 | 312 AVCodec *avcodec_find_encoder_by_name(const char *name); |
| 0 | 313 AVCodec *avcodec_find_decoder(enum CodecID id); |
| 314 AVCodec *avcodec_find_decoder_by_name(const char *name); | |
| 315 void avcodec_string(char *buf, int buf_size, AVCodecContext *enc, int encode); | |
| 316 | |
| 317 int avcodec_open(AVCodecContext *avctx, AVCodec *codec); | |
| 318 int avcodec_decode_audio(AVCodecContext *avctx, INT16 *samples, | |
| 319 int *frame_size_ptr, | |
| 320 UINT8 *buf, int buf_size); | |
| 321 int avcodec_decode_video(AVCodecContext *avctx, AVPicture *picture, | |
| 322 int *got_picture_ptr, | |
| 323 UINT8 *buf, int buf_size); | |
| 324 int avcodec_encode_audio(AVCodecContext *avctx, UINT8 *buf, int buf_size, | |
| 325 const short *samples); | |
| 326 int avcodec_encode_video(AVCodecContext *avctx, UINT8 *buf, int buf_size, | |
| 327 const AVPicture *pict); | |
| 328 | |
| 329 int avcodec_close(AVCodecContext *avctx); | |
| 330 | |
| 331 void avcodec_register_all(void); | |
| 92 | 332 |
|
108
1e4a4af694d1
exporting qscale data for postprocessing (for MPlayer)
arpi_esp
parents:
92
diff
changeset
|
333 #ifdef FF_POSTPROCESS |
|
1e4a4af694d1
exporting qscale data for postprocessing (for MPlayer)
arpi_esp
parents:
92
diff
changeset
|
334 #ifndef MBC |
| 162 | 335 #define MBC 48 |
| 336 #define MBR 36 | |
|
108
1e4a4af694d1
exporting qscale data for postprocessing (for MPlayer)
arpi_esp
parents:
92
diff
changeset
|
337 #endif |
|
1e4a4af694d1
exporting qscale data for postprocessing (for MPlayer)
arpi_esp
parents:
92
diff
changeset
|
338 extern int quant_store[MBR+1][MBC+1]; // [Review] |
|
1e4a4af694d1
exporting qscale data for postprocessing (for MPlayer)
arpi_esp
parents:
92
diff
changeset
|
339 #endif |
|
1e4a4af694d1
exporting qscale data for postprocessing (for MPlayer)
arpi_esp
parents:
92
diff
changeset
|
340 |
| 92 | 341 #endif /* AVCODEC_H */ |
