* Mea culpa: it seems that I broke encoding to 8-bit pcm files. This fixes it.
[libav.git] / libavcodec / avcodec.h
CommitLineData
a96b68b7
FB
1#ifndef AVCODEC_H
2#define AVCODEC_H
3
de6d9b64
FB
4#include "common.h"
5
4b1f4f23
J
/* Library version, as an integer (0.4.6 -> 0x000406) and as a string. */
#define LIBAVCODEC_VERSION_INT 0x000406
#define LIBAVCODEC_VERSION     "0.4.6"
/* Build number, as an integer and as a string; keep both in sync. */
#define LIBAVCODEC_BUILD       4608
#define LIBAVCODEC_BUILD_STR   "4608"
4b1f4f23 10
de6d9b64
FB
/*
 * Codec identifiers.
 * NOTE(review): values are assigned implicitly, so inserting an entry in the
 * middle renumbers every following ID -- presumably new IDs should only be
 * appended; confirm against the project's ABI policy.
 */
enum CodecID {
    CODEC_ID_NONE,
    CODEC_ID_MPEG1VIDEO,
    CODEC_ID_H263,
    CODEC_ID_RV10,
    CODEC_ID_MP2,
    CODEC_ID_MP3LAME,
    CODEC_ID_AC3,
    CODEC_ID_MJPEG,
    CODEC_ID_MPEG4,
    CODEC_ID_RAWVIDEO,
    CODEC_ID_MSMPEG4V1,
    CODEC_ID_MSMPEG4V2,
    CODEC_ID_MSMPEG4V3,
    CODEC_ID_WMV1,
    CODEC_ID_H263P,
    CODEC_ID_H263I,

    /* various pcm "codecs" */
    CODEC_ID_PCM_S16LE,
    CODEC_ID_PCM_S16BE,
    CODEC_ID_PCM_U16LE,
    CODEC_ID_PCM_U16BE,
    CODEC_ID_PCM_S8,
    CODEC_ID_PCM_U8,
    CODEC_ID_PCM_MULAW,
    CODEC_ID_PCM_ALAW,
};
/* CODEC_ID_MSMPEG4 is an alias for the V3 identifier */
#define CODEC_ID_MSMPEG4 CODEC_ID_MSMPEG4V3
de6d9b64
FB
40
/* Kind of stream a codec handles; UNKNOWN is the only negative value. */
enum CodecType {
    CODEC_TYPE_UNKNOWN = -1,
    CODEC_TYPE_VIDEO,
    CODEC_TYPE_AUDIO,
};
46
/* Pixel formats; PIX_FMT_ANY (-1) precedes the concrete formats, which start at 0. */
enum PixelFormat {
    PIX_FMT_ANY = -1,
    PIX_FMT_YUV420P,
    PIX_FMT_YUV422,
    PIX_FMT_RGB24,
    PIX_FMT_BGR24,
    PIX_FMT_YUV422P,
    PIX_FMT_YUV444P,
};
56
a96b68b7
FB
/* currently unused, may be used if 24/32 bit samples are ever supported */
enum SampleFormat {
    SAMPLE_FMT_S16 = 0,         /* signed 16 bits */
};
61
de6d9b64
FB
/* maximum audio frame size, in bytes */
#define AVCODEC_MAX_AUDIO_FRAME_SIZE 18432
64
e4986da9
J
/* motion estimation type, EPZS by default (numbering starts at 1) */
enum Motion_Est_ID {
    ME_ZERO = 1,
    ME_FULL,
    ME_LOG,
    ME_PHODS,
    ME_EPZS,
    ME_X1
};

/* only for ME compatibility with old apps */
extern int motion_estimation_method;

/* ME algos sorted by quality */
static const int Motion_Est_QTab[] = { ME_ZERO, ME_PHODS, ME_LOG,
                                       ME_X1, ME_EPZS, ME_FULL };
de6d9b64 81
9dbcbd92
MN
#define FF_MAX_B_FRAMES 4

/* encoding support */
/* note: not everything is supported yet */

#define CODEC_FLAG_HQ     0x0001  /* high quality (non real time) encoding */
#define CODEC_FLAG_QSCALE 0x0002  /* use fixed qscale */
#define CODEC_FLAG_4MV    0x0004  /* 4 MV per MB allowed */
#define CODEC_FLAG_QPEL   0x0010  /* use qpel MC */
#define CODEC_FLAG_GMC    0x0020  /* use GMC */
#define CODEC_FLAG_TYPE   0x0040  /* fixed I/P frame type, from avctx->key_frame */
/* parent program guarantees that the input for b-frame containing streams is not written to
   for at least s->max_b_frames+1 frames, if this is not set then the input will be copied */
#define CODEC_FLAG_INPUT_PRESERVED 0x0100
#define CODEC_FLAG_PASS1 0x0200   /* use internal 2pass ratecontrol in first pass mode */
#define CODEC_FLAG_PASS2 0x0400   /* use internal 2pass ratecontrol in second pass mode */
#define CODEC_FLAG_EXTERN_HUFF 0x1000 /* use external huffman table (for mjpeg) */

/* codec capabilities */

/* decoder can use draw_horiz_band callback */
#define CODEC_CAP_DRAW_HORIZ_BAND 0x0001

/* frame rates are expressed in units of 1/FRAME_RATE_BASE frames per second */
#define FRAME_RATE_BASE 10000
106
107typedef struct AVCodecContext {
108 int bit_rate;
9cdd6a24 109 int bit_rate_tolerance; /* amount of +- bits (>0)*/
de6d9b64
FB
110 int flags;
111 int sub_id; /* some codecs needs additionnal format info. It is
112 stored there */
e4986da9
J
113
114 int me_method; /* ME algorithm used for video coding */
115
e84c31dc
A
116 /* extra data from parent application to codec, e.g. huffman table
117 for mjpeg */
118 /* the parent should allocate and free this buffer */
119 void *extradata;
120 int extradata_size;
121
de6d9b64
FB
122 /* video only */
123 int frame_rate; /* frames per sec multiplied by FRAME_RATE_BASE */
124 int width, height;
11ce8834 125 int aspect_ratio_info;
2efe097a
MN
126#define FF_ASPECT_SQUARE 1
127#define FF_ASPECT_4_3_625 2
128#define FF_ASPECT_4_3_525 3
129#define FF_ASPECT_16_9_625 4
130#define FF_ASPECT_16_9_525 5
de6d9b64 131 int gop_size; /* 0 = intra only */
bc657ac3 132 enum PixelFormat pix_fmt; /* pixel format, see PIX_FMT_xxx */
c80340a4
J
133 int repeat_pict; /* set this to 1 if you want the decoder
134 to repeat frames for 3:2 pulldown (MPEG-2) */
bf89e6b1
FB
135 /* if non NULL, 'draw_horiz_band' is called by the libavcodec
136 decoder to draw an horizontal band. It improve cache usage. Not
137 all codecs can do that. You must check the codec capabilities
138 before */
139 void (*draw_horiz_band)(struct AVCodecContext *s,
140 UINT8 **src_ptr, int linesize,
141 int y, int width, int height);
142
de6d9b64
FB
143 /* audio only */
144 int sample_rate; /* samples per sec */
145 int channels;
a96b68b7 146 int sample_fmt; /* sample format, currenly unused */
de6d9b64
FB
147
148 /* the following data should not be initialized */
9cd3766f
J
149 int frame_size; /* in samples, initialized when calling 'init' */
150 int frame_number; /* audio or video frame number */
151 int real_pict_num; /* returns the real picture number of
152 previous encoded frame */
153 int key_frame; /* true if the previous compressed frame was
154 a key frame (intra, or seekable) */
155 int pict_type; /* picture type of the previous
156 encoded frame */
157/* FIXME: these should have FF_ */
158#define I_TYPE 1 // Intra
159#define P_TYPE 2 // Predicted
160#define B_TYPE 3 // Bi-dir predicted
161#define S_TYPE 4 // S(GMC)-VOP MPEG4
162
163 int delay; /* number of frames the decoded output
164 will be delayed relative to the encoded input */
2417652e
MN
165 uint8_t *mbskip_table; /* =1 if MB didnt change, is only valid for I/P frames
166 stride= mb_width = (width+15)>>4 */
1ff662cc
MN
167
168 /* encoding parameters */
de6d9b64 169 int quality; /* quality of the previous encoded frame
8b4c7dbc
MN
170 (between 1 (good) and 31 (bad))
171 this is allso used to set the quality in vbr mode
172 and the per frame quality in CODEC_FLAG_TYPE (second pass mode) */
9cdd6a24
MN
173 float qcompress; /* amount of qscale change between easy & hard scenes (0.0-1.0)*/
174 float qblur; /* amount of qscale smoothing over time (0.0-1.0) */
175 int qmin; /* min qscale */
176 int qmax; /* max qscale */
177 int max_qdiff; /* max qscale difference between frames */
9dbcbd92 178 int max_b_frames; /* maximum b frames, the output will be delayed by max_b_frames+1 relative to the input */
8b4c7dbc
MN
179 float b_quant_factor;/* qscale factor between ips and b frames */
180 int rc_strategy;
181 int b_frame_strategy;
9dbcbd92 182
2417652e
MN
183 int hurry_up; /* when set to 1 during decoding, b frames will be skiped
184 when set to 2 idct/dequant will be skipped too */
185
de6d9b64
FB
186 struct AVCodec *codec;
187 void *priv_data;
188
644d98a4
J
189 /* The following data is for RTP friendly coding */
190 /* By now only H.263/H.263+ coder honours this */
191 int rtp_mode; /* 1 for activate RTP friendly-mode */
192 /* highers numbers represent more error-prone */
193 /* enviroments, by now just "1" exist */
194
195 int rtp_payload_size; /* The size of the RTP payload, the coder will */
196 /* do it's best to deliver a chunk with size */
197 /* below rtp_payload_size, the chunk will start */
198 /* with a start code on some codecs like H.263 */
199 /* This doesn't take account of any particular */
200 /* headers inside the transmited RTP payload */
81401c1f
J
201
202
203 /* The RTP callcack: This function is called */
204 /* every time the encoder as a packet to send */
205 /* Depends on the encoder if the data starts */
206 /* with a Start Code (it should) H.263 does */
207 void (*rtp_callback)(void *data, int size, int packet_number);
208
43f1708f
J
209 /* These are for PSNR calculation, if you set get_psnr to 1 */
210 /* after encoding you will have the PSNR on psnr_y/cb/cr */
211 int get_psnr;
212 float psnr_y;
213 float psnr_cb;
214 float psnr_cr;
098eefe1
MN
215
216 /* statistics, used for 2-pass encoding */
217 int mv_bits;
218 int header_bits;
219 int i_tex_bits;
220 int p_tex_bits;
221 int i_count;
222 int p_count;
223 int skip_count;
224 int misc_bits; // cbp, mb_type
225 int frame_bits;
644d98a4 226
de6d9b64 227 /* the following fields are ignored */
bf89e6b1 228 void *opaque; /* can be used to carry app specific stuff */
de6d9b64 229 char codec_name[32];
4a663d80
PG
230 enum CodecType codec_type; /* see CODEC_TYPE_xxx */
231 enum CodecID codec_id; /* see CODEC_ID_xxx */
de6d9b64 232 unsigned int codec_tag; /* codec tag, only used if unknown codec */
5d27890a
NK
233 /*
234 Note: Below are located reserved fields for further usage
235 It requires for ABI !!!
236 If you'll perform some changes then borrow new space from these fields
237 (void * can be safety replaced with struct * ;)
238 P L E A S E ! ! !
239 IMPORTANT: Never change order of already declared fields!!!
240 */
241 unsigned long long int
242 ull_res0,ull_res1,ull_res2,ull_res3,ull_res4,ull_res5,
243 ull_res6,ull_res7,ull_res8,ull_res9,ull_res10,ull_res11,ull_res12;
244 float
245 flt_res0,flt_res1,flt_res2,flt_res3,flt_res4,flt_res5,
246 flt_res6,flt_res7,flt_res8,flt_res9,flt_res10,flt_res11,flt_res12;
247 void
248 *ptr_res0,*ptr_res1,*ptr_res2,*ptr_res3,*ptr_res4,*ptr_res5,
249 *ptr_res6,*ptr_res7,*ptr_res8,*ptr_res9,*ptr_res10,*ptr_res11,*ptr_res12;
250 unsigned long int
251 ul_res0,ul_res1,ul_res2,ul_res3,ul_res4,ul_res5,
252 ul_res6,ul_res7,ul_res8,ul_res9,ul_res10,ul_res11,ul_res12;
253 unsigned int
254 ui_res0,ui_res1,ui_res2,ui_res3,ui_res4,ui_res5,
255 ui_res6,ui_res7,ui_res8,ui_res9,ui_res10,ui_res11,ui_res12;
256 unsigned short int
257 us_res0,us_res1,us_res2,us_res3,us_res4,us_res5,
258 us_res6,us_res7,us_res8,us_res9,us_res10,us_res11,us_res12;
259 unsigned char
260 uc_res0,uc_res1,uc_res2,uc_res3,uc_res4,uc_res5,
261 uc_res6,uc_res7,uc_res8,uc_res9,uc_res10,uc_res11,uc_res12;
de6d9b64
FB
262} AVCodecContext;
263
264typedef struct AVCodec {
265 char *name;
266 int type;
267 int id;
268 int priv_data_size;
269 int (*init)(AVCodecContext *);
270 int (*encode)(AVCodecContext *, UINT8 *buf, int buf_size, void *data);
271 int (*close)(AVCodecContext *);
272 int (*decode)(AVCodecContext *, void *outdata, int *outdata_size,
273 UINT8 *buf, int buf_size);
bf89e6b1 274 int capabilities;
de6d9b64 275 struct AVCodec *next;
5d27890a
NK
276 /*
277 Note: Below are located reserved fields for further usage
278 It requires for ABI !!!
279 If you'll perform some changes then borrow new space from these fields
280 (void * can be safety replaced with struct * ;)
281 P L E A S E ! ! !
282 IMPORTANT: Never change order of already declared fields!!!
283 */
284 unsigned long long int
285 ull_res0,ull_res1,ull_res2,ull_res3,ull_res4,ull_res5,
286 ull_res6,ull_res7,ull_res8,ull_res9,ull_res10,ull_res11,ull_res12;
287 float
288 flt_res0,flt_res1,flt_res2,flt_res3,flt_res4,flt_res5,
289 flt_res6,flt_res7,flt_res8,flt_res9,flt_res10,flt_res11,flt_res12;
290 void
291 *ptr_res0,*ptr_res1,*ptr_res2,*ptr_res3,*ptr_res4,*ptr_res5,
292 *ptr_res6,*ptr_res7,*ptr_res8,*ptr_res9,*ptr_res10,*ptr_res11,*ptr_res12;
de6d9b64
FB
293} AVCodec;
294
295/* three components are given, that's all */
296typedef struct AVPicture {
297 UINT8 *data[3];
298 int linesize[3];
299} AVPicture;
300
301extern AVCodec ac3_encoder;
302extern AVCodec mp2_encoder;
9d36bdc9 303extern AVCodec mp3lame_encoder;
de6d9b64
FB
304extern AVCodec mpeg1video_encoder;
305extern AVCodec h263_encoder;
306extern AVCodec h263p_encoder;
307extern AVCodec rv10_encoder;
308extern AVCodec mjpeg_encoder;
bf89e6b1 309extern AVCodec mpeg4_encoder;
84afee34
MN
310extern AVCodec msmpeg4v1_encoder;
311extern AVCodec msmpeg4v2_encoder;
312extern AVCodec msmpeg4v3_encoder;
de6d9b64
FB
313
314extern AVCodec h263_decoder;
bf89e6b1 315extern AVCodec mpeg4_decoder;
84afee34
MN
316extern AVCodec msmpeg4v1_decoder;
317extern AVCodec msmpeg4v2_decoder;
318extern AVCodec msmpeg4v3_decoder;
e1a9dbff 319extern AVCodec wmv1_decoder;
de6d9b64
FB
320extern AVCodec mpeg_decoder;
321extern AVCodec h263i_decoder;
322extern AVCodec rv10_decoder;
4e66ab3b 323extern AVCodec mjpeg_decoder;
4b1f4f23 324extern AVCodec mp2_decoder;
a96b68b7 325extern AVCodec mp3_decoder;
de6d9b64 326
a96b68b7
FB
327/* pcm codecs */
328#define PCM_CODEC(id, name) \
329extern AVCodec name ## _decoder; \
330extern AVCodec name ## _encoder;
331
332PCM_CODEC(CODEC_ID_PCM_S16LE, pcm_s16le);
333PCM_CODEC(CODEC_ID_PCM_S16BE, pcm_s16be);
334PCM_CODEC(CODEC_ID_PCM_U16LE, pcm_u16le);
335PCM_CODEC(CODEC_ID_PCM_U16BE, pcm_u16be);
336PCM_CODEC(CODEC_ID_PCM_S8, pcm_s8);
337PCM_CODEC(CODEC_ID_PCM_U8, pcm_u8);
338PCM_CODEC(CODEC_ID_PCM_ALAW, pcm_alaw);
339PCM_CODEC(CODEC_ID_PCM_MULAW, pcm_mulaw);
340
341#undef PCM_CODEC
342
343/* dummy raw video codec */
de6d9b64
FB
344extern AVCodec rawvideo_codec;
345
346/* the following codecs use external GPL libs */
de6d9b64
FB
347extern AVCodec ac3_decoder;
348
/* resample.c */

/* Opaque audio resampling context: only the incomplete type is visible here. */
struct ReSampleContext;

typedef struct ReSampleContext ReSampleContext;

ReSampleContext *audio_resample_init(int output_channels, int input_channels,
                                     int output_rate, int input_rate);
int audio_resample(ReSampleContext *s, short *output, short *input, int nb_samples);
void audio_resample_close(ReSampleContext *s);
359
360/* YUV420 format is assumed ! */
361
362struct ImgReSampleContext;
363
364typedef struct ImgReSampleContext ImgReSampleContext;
365
366ImgReSampleContext *img_resample_init(int output_width, int output_height,
367 int input_width, int input_height);
368void img_resample(ImgReSampleContext *s,
369 AVPicture *output, AVPicture *input);
370
371void img_resample_close(ImgReSampleContext *s);
372
219b06c6
FB
373void avpicture_fill(AVPicture *picture, UINT8 *ptr,
374 int pix_fmt, int width, int height);
375int avpicture_get_size(int pix_fmt, int width, int height);
376
377/* convert among pixel formats */
378int img_convert(AVPicture *dst, int dst_pix_fmt,
379 AVPicture *src, int pix_fmt,
380 int width, int height);
381
382/* deinterlace a picture */
383int avpicture_deinterlace(AVPicture *dst, AVPicture *src,
de6d9b64
FB
384 int pix_fmt, int width, int height);
385
386/* external high level API */
387
388extern AVCodec *first_avcodec;
389
156e5023
NK
/* returns LIBAVCODEC_VERSION_INT constant */
unsigned avcodec_version(void);
/* returns LIBAVCODEC_BUILD constant */
unsigned avcodec_build(void);
void avcodec_init(void);
395
396void register_avcodec(AVCodec *format);
397AVCodec *avcodec_find_encoder(enum CodecID id);
98f3b098 398AVCodec *avcodec_find_encoder_by_name(const char *name);
de6d9b64
FB
399AVCodec *avcodec_find_decoder(enum CodecID id);
400AVCodec *avcodec_find_decoder_by_name(const char *name);
401void avcodec_string(char *buf, int buf_size, AVCodecContext *enc, int encode);
402
403int avcodec_open(AVCodecContext *avctx, AVCodec *codec);
404int avcodec_decode_audio(AVCodecContext *avctx, INT16 *samples,
405 int *frame_size_ptr,
406 UINT8 *buf, int buf_size);
407int avcodec_decode_video(AVCodecContext *avctx, AVPicture *picture,
408 int *got_picture_ptr,
409 UINT8 *buf, int buf_size);
410int avcodec_encode_audio(AVCodecContext *avctx, UINT8 *buf, int buf_size,
411 const short *samples);
412int avcodec_encode_video(AVCodecContext *avctx, UINT8 *buf, int buf_size,
413 const AVPicture *pict);
414
415int avcodec_close(AVCodecContext *avctx);
416
417void avcodec_register_all(void);
a96b68b7 418
1c2a8c7f
MN
419void avcodec_flush_buffers(AVCodecContext *avctx);
420
79e7b305
A
#ifdef FF_POSTPROCESS
/* Default dimensions for quant_store. Each is guarded on its own so that
   predefining only one of them still leaves the other defined. */
#ifndef MBC
#define MBC 128
#endif
#ifndef MBR
#define MBR 96
#endif
/* NOTE(review): presumably a per-macroblock quantizer table (rows x columns)
   consumed by the postprocessing code -- confirm against its definition. */
extern int quant_store[MBR+1][MBC+1];
#endif
428
a96b68b7 429#endif /* AVCODEC_H */