rl vlc table optimization (not yet used)
[libav.git] / libavcodec / avcodec.h
CommitLineData
a96b68b7
FB
1#ifndef AVCODEC_H
2#define AVCODEC_H
3
de6d9b64
FB
4#include "common.h"
5
4b1f4f23
J
/* Release version and build number, each given in a numeric form and in a
   matching string form; keep the two forms of each value in sync. */
6#define LIBAVCODEC_VERSION_INT 0x000406
7#define LIBAVCODEC_VERSION "0.4.6"
be8ffec9
NK
8#define LIBAVCODEC_BUILD 4615
9#define LIBAVCODEC_BUILD_STR "4615"
4b1f4f23 10
de6d9b64
FB
/* Identifiers of the codecs known to the library.
   No enumerator has an explicit value, so each one is numbered by its position
   (CODEC_ID_NONE is 0); inserting an entry in the middle renumbers every
   later ID. */
11enum CodecID {
12 CODEC_ID_NONE,
13 CODEC_ID_MPEG1VIDEO,
14 CODEC_ID_H263,
15 CODEC_ID_RV10,
16 CODEC_ID_MP2,
9d36bdc9 17 CODEC_ID_MP3LAME,
de6d9b64
FB
18 CODEC_ID_AC3,
19 CODEC_ID_MJPEG,
bf89e6b1 20 CODEC_ID_MPEG4,
de6d9b64 21 CODEC_ID_RAWVIDEO,
84afee34
MN
22 CODEC_ID_MSMPEG4V1,
23 CODEC_ID_MSMPEG4V2,
24 CODEC_ID_MSMPEG4V3,
e1a9dbff 25 CODEC_ID_WMV1,
b50eef3a 26 CODEC_ID_WMV2,
de6d9b64
FB
27 CODEC_ID_H263P,
28 CODEC_ID_H263I,
be8ffec9 29 CODEC_ID_SVQ1,
a96b68b7
FB
30
31 /* various pcm "codecs" */
32 CODEC_ID_PCM_S16LE,
33 CODEC_ID_PCM_S16BE,
34 CODEC_ID_PCM_U16LE,
35 CODEC_ID_PCM_U16BE,
36 CODEC_ID_PCM_S8,
37 CODEC_ID_PCM_U8,
38 CODEC_ID_PCM_MULAW,
39 CODEC_ID_PCM_ALAW,
de6d9b64 40};
84afee34 41#define CODEC_ID_MSMPEG4 CODEC_ID_MSMPEG4V3 /* the unversioned name is an alias for version 3 */
de6d9b64
FB
42
/* Kind of stream a codec handles. */
43enum CodecType {
4a663d80 44 CODEC_TYPE_UNKNOWN = -1,
de6d9b64
FB
45 CODEC_TYPE_VIDEO, /* 0, follows from CODEC_TYPE_UNKNOWN = -1 */
46 CODEC_TYPE_AUDIO, /* 1 */
47};
48
/* Pixel formats. PIX_FMT_ANY is -1, so the concrete formats count up from 0
   (PIX_FMT_YUV420P) in declaration order. */
49enum PixelFormat {
9f862d11 50 PIX_FMT_ANY = -1,
de6d9b64
FB
51 PIX_FMT_YUV420P,
52 PIX_FMT_YUV422,
53 PIX_FMT_RGB24,
54 PIX_FMT_BGR24,
d9fea0b5
FB
55 PIX_FMT_YUV422P,
56 PIX_FMT_YUV444P,
be8ffec9 57 PIX_FMT_YUV410P
de6d9b64
FB
58};
59
a96b68b7
FB
60/* currently unused; may be used if 24/32-bit samples are ever supported */
61enum SampleFormat {
62 SAMPLE_FMT_S16 = 0, /* signed 16 bits */
63};
64
de6d9b64
FB
65/* in bytes */
66#define AVCODEC_MAX_AUDIO_FRAME_SIZE 18432
67
e4986da9
J
68/* motion estimation type, EPZS by default.
   Numbering starts at 1 (ME_ZERO), so 0 does not name any method. */
69enum Motion_Est_ID {
101bea5f 70 ME_ZERO = 1,
e4986da9
J
71 ME_FULL,
72 ME_LOG,
73 ME_PHODS,
74 ME_EPZS,
75 ME_X1
76};
77
101bea5f
J
78/* only for ME compatibility with old apps */
79extern int motion_estimation_method;
80
e4986da9 81/* ME algos sorted by quality (NOTE(review): presumably lowest quality first,
   since ME_ZERO leads and ME_FULL ends the list - confirm).
   The table is static, so every file that includes this header gets its own copy. */
bc6caae2
J
82static const int Motion_Est_QTab[] = { ME_ZERO, ME_PHODS, ME_LOG,
83 ME_X1, ME_EPZS, ME_FULL };
de6d9b64 84
9dbcbd92
MN
85#define FF_MAX_B_FRAMES 4
86
de6d9b64 87/* encoding support */
ba6802de 88/* note: not everything is supported yet */
de6d9b64
FB
89
/* Each CODEC_FLAG_xxx value is a distinct single bit.
   Bits 0x0008 and 0x0800 are not assigned to any flag in this list. */
90#define CODEC_FLAG_HQ 0x0001 /* high quality (non real time) encoding */
91#define CODEC_FLAG_QSCALE 0x0002 /* use fixed qscale */
ba6802de 92#define CODEC_FLAG_4MV 0x0004 /* 4 MV per MB allowed */
ba6802de
MN
93#define CODEC_FLAG_QPEL 0x0010 /* use qpel MC */
94#define CODEC_FLAG_GMC 0x0020 /* use GMC */
60e575ac 95#define CODEC_FLAG_TYPE 0x0040 /* fixed I/P frame type, from avctx->key_frame */
1f6b6e50 96#define CODEC_FLAG_PART 0x0080 /* use data partitioning */
9dbcbd92
MN
97/* the parent program guarantees that the input for streams containing b-frames is not written to
98 for at least s->max_b_frames+1 frames; if this is not set then the input will be copied */
8b4c7dbc
MN
99#define CODEC_FLAG_INPUT_PRESERVED 0x0100
100#define CODEC_FLAG_PASS1 0x0200 /* use internal 2pass ratecontrol in first pass mode */
101#define CODEC_FLAG_PASS2 0x0400 /* use internal 2pass ratecontrol in second pass mode */
e84c31dc 102#define CODEC_FLAG_EXTERN_HUFF 0x1000 /* use external huffman table (for mjpeg) */
b50eef3a 103#define CODEC_FLAG_GRAY 0x2000 /* only decode/encode grayscale */
de6d9b64 104
bf89e6b1
FB
105/* codec capabilities */
106
107/* decoder can use the draw_horiz_band callback of AVCodecContext */
108#define CODEC_CAP_DRAW_HORIZ_BAND 0x0001
109
de6d9b64
FB
/* AVCodecContext.frame_rate is expressed in frames per second multiplied by this base */
110#define FRAME_RATE_BASE 10000
111
/* Codec context: the parameters, state and statistics exchanged between the
   application and a codec. The comment on each group of fields says what the
   group is for.
   The trailing *_res* members are reserved space. The reserved groups differ
   in length (ull/ul/us/uc: 13 entries, flt/ptr: 12, ui: 7).
   NOTE(review): presumably the missing slots were borrowed for fields declared
   above them - confirm before relying on the layout. */
112typedef struct AVCodecContext {
113 int bit_rate;
9cdd6a24 114 int bit_rate_tolerance; /* amount of +- bits (>0)*/
de6d9b64
FB
115 int flags; /* NOTE(review): presumably a bitwise OR of CODEC_FLAG_xxx - confirm */
116 int sub_id; /* some codecs need additional format info. It is
117 stored there */
e4986da9
J
118
119 int me_method; /* ME algorithm used for video coding */
120
e84c31dc
A
121 /* extra data from parent application to codec, e.g. huffman table
122 for mjpeg */
123 /* the parent should allocate and free this buffer */
124 void *extradata;
125 int extradata_size;
126
de6d9b64
FB
127 /* video only */
128 int frame_rate; /* frames per sec multiplied by FRAME_RATE_BASE */
129 int width, height;
11ce8834 130 int aspect_ratio_info;
2efe097a
MN
131#define FF_ASPECT_SQUARE 1
132#define FF_ASPECT_4_3_625 2
133#define FF_ASPECT_4_3_525 3
134#define FF_ASPECT_16_9_625 4
135#define FF_ASPECT_16_9_525 5
de6d9b64 136 int gop_size; /* 0 = intra only */
bc657ac3 137 enum PixelFormat pix_fmt; /* pixel format, see PIX_FMT_xxx */
e0a3d744
J
138 int repeat_pict; /* when decoding, this signals by how much the picture */
139 /* must be delayed. */
140 /* extra_delay = (repeat_pict / 2) * (1/fps) */
bf89e6b1
FB
141 /* if non NULL, 'draw_horiz_band' is called by the libavcodec
142 decoder to draw a horizontal band. It improves cache usage. Not
143 all codecs can do that. You must check the codec capabilities
144 before (CODEC_CAP_DRAW_HORIZ_BAND) */
145 void (*draw_horiz_band)(struct AVCodecContext *s,
146 UINT8 **src_ptr, int linesize,
147 int y, int width, int height);
148
de6d9b64
FB
149 /* audio only */
150 int sample_rate; /* samples per sec */
151 int channels;
a96b68b7 152 int sample_fmt; /* sample format, currently unused */
de6d9b64
FB
153
154 /* the following data should not be initialized */
9cd3766f
J
155 int frame_size; /* in samples, initialized when calling 'init' */
156 int frame_number; /* audio or video frame number */
157 int real_pict_num; /* returns the real picture number of the
158 previous encoded frame */
159 int key_frame; /* true if the previous compressed frame was
160 a key frame (intra, or seekable) */
161 int pict_type; /* picture type of the previous
162 encoded frame */
163/* FIXME: these should have FF_ */
164#define I_TYPE 1 // Intra
165#define P_TYPE 2 // Predicted
166#define B_TYPE 3 // Bi-dir predicted
167#define S_TYPE 4 // S(GMC)-VOP MPEG4
168
169 int delay; /* number of frames the decoded output
170 will be delayed relative to the encoded input */
2417652e
MN
171 uint8_t *mbskip_table; /* =1 if the MB didn't change, is only valid for I/P frames
172 stride= mb_width = (width+15)>>4 */
1ff662cc
MN
173
174 /* encoding parameters */
de6d9b64 175 int quality; /* quality of the previous encoded frame
8b4c7dbc
MN
176 (between 1 (good) and 31 (bad))
177 this is also used to set the quality in vbr mode
178 and the per frame quality in CODEC_FLAG_TYPE (second pass mode) */
9cdd6a24
MN
179 float qcompress; /* amount of qscale change between easy & hard scenes (0.0-1.0)*/
180 float qblur; /* amount of qscale smoothing over time (0.0-1.0) */
181 int qmin; /* min qscale */
182 int qmax; /* max qscale */
183 int max_qdiff; /* max qscale difference between frames */
9dbcbd92 184 int max_b_frames; /* maximum b frames, the output will be delayed by max_b_frames+1 relative to the input */
8b4c7dbc
MN
185 float b_quant_factor;/* qscale factor between ips and b frames */
186 int rc_strategy;
187 int b_frame_strategy;
9dbcbd92 188
2417652e
MN
189 int hurry_up; /* when set to 1 during decoding, b frames will be skipped
190 when set to 2 idct/dequant will be skipped too */
191
de6d9b64
FB
192 struct AVCodec *codec;
193 void *priv_data;
194
644d98a4 195 /* The following data is for RTP friendly coding */
1f6b6e50 196 /* For now only the H.263/H.263+/MPEG4 coders honour this */
644d98a4
J
197 int rtp_mode; /* 1 to activate RTP friendly mode */
198 /* higher numbers represent more error-prone */
199 /* environments, for now only "1" exists */
200
201 int rtp_payload_size; /* The size of the RTP payload, the coder will */
202 /* do its best to deliver a chunk with size */
203 /* below rtp_payload_size, the chunk will start */
204 /* with a start code on some codecs like H.263 */
205 /* This doesn't take account of any particular */
206 /* headers inside the transmitted RTP payload */
81401c1f
J
207
208
209 /* The RTP callback: This function is called */
210 /* every time the encoder has a packet to send */
211 /* Depends on the encoder if the data starts */
212 /* with a Start Code (it should) H.263 does */
213 void (*rtp_callback)(void *data, int size, int packet_number);
214
43f1708f
J
215 /* These are for PSNR calculation, if you set get_psnr to 1 */
216 /* after encoding you will have the PSNR on psnr_y/cb/cr */
217 int get_psnr;
218 float psnr_y;
219 float psnr_cb;
220 float psnr_cr;
098eefe1
MN
221
222 /* statistics, used for 2-pass encoding */
223 int mv_bits;
224 int header_bits;
225 int i_tex_bits;
226 int p_tex_bits;
227 int i_count;
228 int p_count;
229 int skip_count;
230 int misc_bits; // cbp, mb_type
231 int frame_bits;
644d98a4 232
de6d9b64 233 /* the following fields are ignored */
bf89e6b1 234 void *opaque; /* can be used to carry app specific stuff */
de6d9b64 235 char codec_name[32];
4a663d80
PG
236 enum CodecType codec_type; /* see CODEC_TYPE_xxx */
237 enum CodecID codec_id; /* see CODEC_ID_xxx */
de6d9b64 238 unsigned int codec_tag; /* codec tag, only used if unknown codec */
92ba5ffb
MN
239
240 int workaround_bugs; /* workaround bugs in encoders which cannot be detected automatically */
1f6b6e50
MN
241 int luma_elim_threshold;
242 int chroma_elim_threshold;
243 int strict_std_compliance; /* strictly follow the std (MPEG4, ...) */
244 float b_quant_offset;/* qscale offset between ips and b frames, not implemented yet */
245 int error_resilience;
ae72cda6
NK
246
247#ifndef MBC
248#define MBC 128
249#define MBR 96
250#endif
251 int *quant_store; /* field for communicating with external postprocessing */
8696b636 252 unsigned qstride;
1f6b6e50 253 //FIXME this should be reordered after kabis API is finished ...
5d27890a
NK
254 /*
255 Note: the fields below are reserved for future use.
256 They are required to keep the ABI stable !!!
257 If you need a new field, borrow the space from these reserved fields
258 (a void * can safely be replaced with a struct * ;)
259 P L E A S E ! ! !
260 IMPORTANT: Never change the order of already declared fields!!!
261 */
262 unsigned long long int
263 ull_res0,ull_res1,ull_res2,ull_res3,ull_res4,ull_res5,
264 ull_res6,ull_res7,ull_res8,ull_res9,ull_res10,ull_res11,ull_res12;
265 float
266 flt_res0,flt_res1,flt_res2,flt_res3,flt_res4,flt_res5,
1f6b6e50 267 flt_res6,flt_res7,flt_res8,flt_res9,flt_res10,flt_res11;
5d27890a
NK
268 void
269 *ptr_res0,*ptr_res1,*ptr_res2,*ptr_res3,*ptr_res4,*ptr_res5,
ae72cda6 270 *ptr_res6,*ptr_res7,*ptr_res8,*ptr_res9,*ptr_res10,*ptr_res11;
5d27890a
NK
271 unsigned long int
272 ul_res0,ul_res1,ul_res2,ul_res3,ul_res4,ul_res5,
273 ul_res6,ul_res7,ul_res8,ul_res9,ul_res10,ul_res11,ul_res12;
274 unsigned int
275 ui_res0,ui_res1,ui_res2,ui_res3,ui_res4,ui_res5,
8696b636 276 ui_res6;
5d27890a
NK
277 unsigned short int
278 us_res0,us_res1,us_res2,us_res3,us_res4,us_res5,
279 us_res6,us_res7,us_res8,us_res9,us_res10,us_res11,us_res12;
280 unsigned char
281 uc_res0,uc_res1,uc_res2,uc_res3,uc_res4,uc_res5,
282 uc_res6,uc_res7,uc_res8,uc_res9,uc_res10,uc_res11,uc_res12;
de6d9b64
FB
283} AVCodecContext;
284
/* Descriptor of one codec implementation: its name, type/id, the size of its
   private data and its init/encode/close/decode entry points.
   NOTE(review): type and id are plain int; presumably they hold enum CodecType
   and enum CodecID values - confirm. */
285typedef struct AVCodec {
286 char *name;
287 int type;
288 int id;
289 int priv_data_size;
290 int (*init)(AVCodecContext *);
291 int (*encode)(AVCodecContext *, UINT8 *buf, int buf_size, void *data);
292 int (*close)(AVCodecContext *);
293 int (*decode)(AVCodecContext *, void *outdata, int *outdata_size,
294 UINT8 *buf, int buf_size);
bf89e6b1 295 int capabilities; /* NOTE(review): presumably CODEC_CAP_xxx bits - confirm */
de6d9b64 296 struct AVCodec *next; /* NOTE(review): presumably links the list that starts at first_avcodec - confirm */
5d27890a
NK
297 /*
298 Note: the fields below are reserved for future use.
299 They are required to keep the ABI stable !!!
300 If you need a new field, borrow the space from these reserved fields
301 (a void * can safely be replaced with a struct * ;)
302 P L E A S E ! ! !
303 IMPORTANT: Never change the order of already declared fields!!!
304 */
305 unsigned long long int
306 ull_res0,ull_res1,ull_res2,ull_res3,ull_res4,ull_res5,
307 ull_res6,ull_res7,ull_res8,ull_res9,ull_res10,ull_res11,ull_res12;
308 float
309 flt_res0,flt_res1,flt_res2,flt_res3,flt_res4,flt_res5,
310 flt_res6,flt_res7,flt_res8,flt_res9,flt_res10,flt_res11,flt_res12;
311 void
312 *ptr_res0,*ptr_res1,*ptr_res2,*ptr_res3,*ptr_res4,*ptr_res5,
313 *ptr_res6,*ptr_res7,*ptr_res8,*ptr_res9,*ptr_res10,*ptr_res11,*ptr_res12;
de6d9b64
FB
314} AVCodec;
315
316/* A picture described by exactly three components: data[i] points to
   component i and linesize[i] is the matching entry of the parallel array.
   NOTE(review): linesize is presumably the distance between two rows of a
   component - confirm. */
317typedef struct AVPicture {
318 UINT8 *data[3];
319 int linesize[3];
320} AVPicture;
321
/* Codec descriptors defined elsewhere: encoders first, then decoders.
   In this list mp3lame, mpeg1video and h263p are declared as encoders only;
   mpeg, h263i, svq1 and mp3 are declared as decoders only. */
322extern AVCodec ac3_encoder;
323extern AVCodec mp2_encoder;
9d36bdc9 324extern AVCodec mp3lame_encoder;
de6d9b64
FB
325extern AVCodec mpeg1video_encoder;
326extern AVCodec h263_encoder;
327extern AVCodec h263p_encoder;
328extern AVCodec rv10_encoder;
329extern AVCodec mjpeg_encoder;
bf89e6b1 330extern AVCodec mpeg4_encoder;
84afee34
MN
331extern AVCodec msmpeg4v1_encoder;
332extern AVCodec msmpeg4v2_encoder;
333extern AVCodec msmpeg4v3_encoder;
0151a6f5
MN
334extern AVCodec wmv1_encoder;
335extern AVCodec wmv2_encoder;
de6d9b64
FB
336
337extern AVCodec h263_decoder;
bf89e6b1 338extern AVCodec mpeg4_decoder;
84afee34
MN
339extern AVCodec msmpeg4v1_decoder;
340extern AVCodec msmpeg4v2_decoder;
341extern AVCodec msmpeg4v3_decoder;
e1a9dbff 342extern AVCodec wmv1_decoder;
0151a6f5 343extern AVCodec wmv2_decoder;
de6d9b64
FB
344extern AVCodec mpeg_decoder;
345extern AVCodec h263i_decoder;
346extern AVCodec rv10_decoder;
be8ffec9 347extern AVCodec svq1_decoder;
4e66ab3b 348extern AVCodec mjpeg_decoder;
4b1f4f23 349extern AVCodec mp2_decoder;
a96b68b7 350extern AVCodec mp3_decoder;
de6d9b64 351
a96b68b7
FB
352/* pcm codecs: PCM_CODEC(id, name) declares name_decoder and name_encoder.
   The id argument is not used by the expansion.
   NOTE(review): the expansion already ends in ';', so the ';' written after
   each invocation below leaves an empty file-scope declaration, which strict
   ISO C compilers warn about. */
353#define PCM_CODEC(id, name) \
354extern AVCodec name ## _decoder; \
355extern AVCodec name ## _encoder;
356
357PCM_CODEC(CODEC_ID_PCM_S16LE, pcm_s16le);
358PCM_CODEC(CODEC_ID_PCM_S16BE, pcm_s16be);
359PCM_CODEC(CODEC_ID_PCM_U16LE, pcm_u16le);
360PCM_CODEC(CODEC_ID_PCM_U16BE, pcm_u16be);
361PCM_CODEC(CODEC_ID_PCM_S8, pcm_s8);
362PCM_CODEC(CODEC_ID_PCM_U8, pcm_u8);
363PCM_CODEC(CODEC_ID_PCM_ALAW, pcm_alaw);
364PCM_CODEC(CODEC_ID_PCM_MULAW, pcm_mulaw);
365
366#undef PCM_CODEC
367
368/* dummy raw video codec */
de6d9b64
FB
369extern AVCodec rawvideo_codec;
370
371/* the following codecs use external GPL libs */
de6d9b64
FB
372extern AVCodec ac3_decoder;
373
374/* resample.c: audio resampling.
   ReSampleContext is only forward-declared here, so it is opaque to users of
   this header.
   NOTE(review): presumably a context comes from audio_resample_init() and is
   released with audio_resample_close(); the meaning of audio_resample()'s int
   result is not visible here - confirm both. */
375
376struct ReSampleContext;
377
378typedef struct ReSampleContext ReSampleContext;
379
380ReSampleContext *audio_resample_init(int output_channels, int input_channels,
381 int output_rate, int input_rate);
382int audio_resample(ReSampleContext *s, short *output, short *input, int nb_samples);
383void audio_resample_close(ReSampleContext *s);
384
385/* image resampling: YUV420 format is assumed!
   ImgReSampleContext is likewise only forward-declared (opaque) here. */
386
387struct ImgReSampleContext;
388
389typedef struct ImgReSampleContext ImgReSampleContext;
390
391ImgReSampleContext *img_resample_init(int output_width, int output_height,
392 int input_width, int input_height);
393void img_resample(ImgReSampleContext *s,
394 AVPicture *output, AVPicture *input);
395
396void img_resample_close(ImgReSampleContext *s);
397
219b06c6
FB
/* AVPicture helpers.
   NOTE(review): pix_fmt is declared as int in these prototypes although
   AVCodecContext.pix_fmt is an enum PixelFormat; presumably PIX_FMT_xxx values
   are expected - confirm. */
398void avpicture_fill(AVPicture *picture, UINT8 *ptr,
399 int pix_fmt, int width, int height);
400int avpicture_get_size(int pix_fmt, int width, int height);
401
402/* convert among pixel formats (from pix_fmt in src to dst_pix_fmt in dst) */
403int img_convert(AVPicture *dst, int dst_pix_fmt,
404 AVPicture *src, int pix_fmt,
405 int width, int height);
406
407/* deinterlace a picture */
408int avpicture_deinterlace(AVPicture *dst, AVPicture *src,
de6d9b64
FB
409 int pix_fmt, int width, int height);
410
411/* external high level API */
412
413extern AVCodec *first_avcodec;
414
156e5023 415/* returns LIBAVCODEC_VERSION_INT constant */
51a49663 416unsigned avcodec_version(void);
8bceb6af 417/* returns LIBAVCODEC_BUILD constant */
51a49663 418unsigned avcodec_build(void);
de6d9b64
FB
419void avcodec_init(void);
420
51a49663
FB
421void avcodec_set_bit_exact(void);
422
de6d9b64
FB
/* note: the parameter is named 'format' but its type is AVCodec */
423void register_avcodec(AVCodec *format);
/* codec lookup, either by enum CodecID or by name.
   NOTE(review): the result for "no match" is not visible here - presumably NULL; confirm */
424AVCodec *avcodec_find_encoder(enum CodecID id);
98f3b098 425AVCodec *avcodec_find_encoder_by_name(const char *name);
de6d9b64
FB
426AVCodec *avcodec_find_decoder(enum CodecID id);
427AVCodec *avcodec_find_decoder_by_name(const char *name);
428void avcodec_string(char *buf, int buf_size, AVCodecContext *enc, int encode);
429
430int avcodec_open(AVCodecContext *avctx, AVCodec *codec);
/* decode: the input buffer (buf, buf_size) is not const-qualified;
   frame_size_ptr / got_picture_ptr are pointers the caller supplies
   (NOTE(review): presumably written by the decoder - confirm) */
431int avcodec_decode_audio(AVCodecContext *avctx, INT16 *samples,
432 int *frame_size_ptr,
433 UINT8 *buf, int buf_size);
434int avcodec_decode_video(AVCodecContext *avctx, AVPicture *picture,
435 int *got_picture_ptr,
436 UINT8 *buf, int buf_size);
/* encode: the input (samples / pict) is const, buf of buf_size bytes is the non-const buffer */
437int avcodec_encode_audio(AVCodecContext *avctx, UINT8 *buf, int buf_size,
438 const short *samples);
439int avcodec_encode_video(AVCodecContext *avctx, UINT8 *buf, int buf_size,
440 const AVPicture *pict);
441
442int avcodec_close(AVCodecContext *avctx);
443
444void avcodec_register_all(void);
a96b68b7 445
1c2a8c7f
MN
446void avcodec_flush_buffers(AVCodecContext *avctx);
447
79e7b305 448#ifdef FF_POSTPROCESS
79e7b305
A
449extern int quant_store[MBR+1][MBC+1]; // [Review] MBR/MBC are #defined inside struct AVCodecContext (96/128 unless MBC was already defined); this global shares its name with the AVCodecContext.quant_store member
450#endif
451
e8f14793
ZK
452
453/**
454 * Interface for the 0.5.0 version
455 *
456 * do not even think about using it for the moment
457 */
458
459typedef struct {
460 /// compressed size used from the given memory buffer
461 int size;
462 /// I/P/B frame type
463 int frame_type;
464} avc_enc_result_t;
465
466/**
467 * Commands
468 * the order cannot be changed once it has been defined
469 */
470typedef enum {
471 // general commands
472 AVC_OPEN_BY_NAME = 0xACA000,
473 AVC_OPEN_BY_CODEC_ID,
474 AVC_OPEN_BY_FOURCC,
475 AVC_CLOSE,
476
477 AVC_FLUSH,
478 // pin - struct { uint8_t* src, uint_t src_size }
479 // pout - struct { AVPicture* img, consumed_bytes, ... }
480 AVC_DECODE,
481 // pin - struct { AVPicture* img, uint8_t* dest, uint_t dest_size }
482 // pout - uint_t used_from_dest_size
483 AVC_ENCODE,
484
485 // query/get video commands
486 AVC_GET_VERSION = 0xACB000,
487 AVC_GET_WIDTH,
488 AVC_GET_HEIGHT,
489 AVC_GET_DELAY,
490 AVC_GET_QUANT_TABLE,
491 // ...
492
493 // query/get audio commands
     // NOTE(review): 0xABC000 breaks the 0xACA000 / 0xACB000 / 0xACD000 / 0xACE000
     // progression of the other groups; 0xACC000 may have been intended - confirm
494 AVC_GET_FRAME_SIZE = 0xABC000,
495
496 // maybe define some simple structures which
497 // might be passed to the user - but they can't
498 // contain any codec specific parts and these
499 // calls are usually necessary only a few times
500
501 // set video commands
502 AVC_SET_WIDTH = 0xACD000,
503 AVC_SET_HEIGHT,
504
505 // set video encoding commands
506 AVC_SET_FRAME_RATE = 0xACD800,
507 AVC_SET_QUALITY,
508 AVC_SET_HURRY_UP,
509
510 // set audio commands
511 AVC_SET_SAMPLE_RATE = 0xACE000,
512 AVC_SET_CHANNELS,
513
514} avc_cmd_t;
515
516/**
517 * \param handle private structure allocated by libavcodec;
518 * for initialization pass NULL - the handle will be returned in pout;
519 * the user is supposed to know nothing about its structure
520 * \param cmd type of operation to be performed
521 * \param pin input parameter
522 * \param pout output parameter
523 *
524 * \returns command status - for query commands it may instead return
525 * the resulting integer value
526 */
527int avcodec(void* handle, avc_cmd_t cmd, void* pin, void* pout);
528
544eb99c
FB
529/* memory helpers; sizes are passed as int.
   av_freep(p) casts p to void ** and forwards it to __av_freep()
   (NOTE(review): presumably so the address of any pointer variable can be
   passed - confirm).
   NOTE(review): identifiers that begin with two underscores, such as
   __av_freep, are reserved for the implementation by the C standard. */
530void *av_malloc(int size);
531void *av_mallocz(int size);
532void av_free(void *ptr);
533void __av_freep(void **ptr);
534#define av_freep(p) __av_freep((void **)(p))
535
a96b68b7 536#endif /* AVCODEC_H */