build update - avpicture_fill() returns the image size
[libav.git] / libavcodec / avcodec.h
1 #ifndef AVCODEC_H
2 #define AVCODEC_H
3
4 #include "common.h"
5
6 #define LIBAVCODEC_VERSION_INT 0x000406 /* numeric version; the constant returned by avcodec_version() */
7 #define LIBAVCODEC_VERSION "0.4.6" /* the version as a string */
8 #define LIBAVCODEC_BUILD 4654 /* build number; the constant returned by avcodec_build() */
9 #define LIBAVCODEC_BUILD_STR "4654" /* the build number as a string; same digits as LIBAVCODEC_BUILD */
10
11 enum CodecID { /* codec identifiers; see AVCodecContext.codec_id and avcodec_find_encoder()/avcodec_find_decoder() */
12 CODEC_ID_NONE, /* no explicit values are given, so each ID is defined by its position in this list */
13 CODEC_ID_MPEG1VIDEO,
14 CODEC_ID_H263,
15 CODEC_ID_RV10,
16 CODEC_ID_MP2,
17 CODEC_ID_MP3LAME,
18 CODEC_ID_VORBIS,
19 CODEC_ID_AC3,
20 CODEC_ID_MJPEG,
21 CODEC_ID_MJPEGB,
22 CODEC_ID_MPEG4,
23 CODEC_ID_RAWVIDEO,
24 CODEC_ID_MSMPEG4V1,
25 CODEC_ID_MSMPEG4V2,
26 CODEC_ID_MSMPEG4V3,
27 CODEC_ID_WMV1,
28 CODEC_ID_WMV2,
29 CODEC_ID_H263P,
30 CODEC_ID_H263I,
31 CODEC_ID_SVQ1,
32 CODEC_ID_DVVIDEO,
33 CODEC_ID_DVAUDIO,
34 CODEC_ID_WMAV1,
35 CODEC_ID_WMAV2,
36 CODEC_ID_MACE3,
37 CODEC_ID_MACE6,
38 CODEC_ID_HUFFYUV,
39
40 /* various pcm "codecs" */
41 CODEC_ID_PCM_S16LE,
42 CODEC_ID_PCM_S16BE,
43 CODEC_ID_PCM_U16LE,
44 CODEC_ID_PCM_U16BE,
45 CODEC_ID_PCM_S8,
46 CODEC_ID_PCM_U8,
47 CODEC_ID_PCM_MULAW,
48 CODEC_ID_PCM_ALAW,
49
50 /* various adpcm codecs */
51 CODEC_ID_ADPCM_IMA_QT,
52 CODEC_ID_ADPCM_IMA_WAV,
53 CODEC_ID_ADPCM_MS,
54 };
55
56 enum CodecType { /* kind of stream a codec handles; see AVCodecContext.codec_type */
57 CODEC_TYPE_UNKNOWN = -1,
58 CODEC_TYPE_VIDEO, /* follows -1, so this is 0 */
59 CODEC_TYPE_AUDIO, /* 1 */
60 };
61
62 enum PixelFormat { /* pixel formats; see AVCodecContext.pix_fmt */
63 PIX_FMT_YUV420P,
64 PIX_FMT_YUV422,
65 PIX_FMT_RGB24, /* 3 bytes, R is first */
66 PIX_FMT_BGR24, /* 3 bytes, B is first */
67 PIX_FMT_YUV422P,
68 PIX_FMT_YUV444P,
69 PIX_FMT_RGBA32, /* always stored in cpu endianness */
70 PIX_FMT_YUV410P,
71 PIX_FMT_YUV411P,
72 PIX_FMT_RGB565, /* always stored in cpu endianness */
73 PIX_FMT_RGB555, /* always stored in cpu endianness, most significant bit set to 1 */
74 PIX_FMT_GRAY8,
75 PIX_FMT_MONOWHITE, /* 0 is white */
76 PIX_FMT_MONOBLACK, /* 0 is black */
77 PIX_FMT_NB, /* not a format: as the last entry its value equals the number of formats listed above */
78 };
79
80 /* currently unused, may be used if 24/32 bit samples are ever supported */
81 enum SampleFormat {
82 SAMPLE_FMT_S16 = 0, /* signed 16 bits */
83 };
84
85 /* maximum audio frame size, in bytes */
86 #define AVCODEC_MAX_AUDIO_FRAME_SIZE 131072
87
88 /**
89 * Required number of zero bytes at the end of the input bitstream for decoding,
90 * to avoid overreading (and possibly segfaulting).
91 */
92 #define FF_INPUT_BUFFER_PADDING_SIZE 8
93
94 /* motion estimation type, EPZS by default (presumably the values for AVCodecContext.me_method - TODO confirm) */
95 enum Motion_Est_ID {
96 ME_ZERO = 1, /* numbering starts at 1, not 0 */
97 ME_FULL,
98 ME_LOG,
99 ME_PHODS,
100 ME_EPZS,
101 ME_X1
102 };
103
104 typedef struct RcOverride{ /* one ratecontrol override entry; see AVCodecContext.rc_override */
105 int start_frame; /* presumably the first frame the override applies to - TODO confirm */
106 int end_frame; /* presumably the last frame the override applies to - TODO confirm */
107 int qscale; // if this is 0 then quality_factor will be used instead
108 float quality_factor; // only used when qscale is 0 (see above)
109 } RcOverride;
110
111 /* only for ME compatibility with old apps */
112 extern int motion_estimation_method;
113
114 /* ME algos sorted by quality (presumably lowest quality first - TODO confirm); being static, every file including this header gets its own copy */
115 static const int Motion_Est_QTab[] = { ME_ZERO, ME_PHODS, ME_LOG,
116 ME_X1, ME_EPZS, ME_FULL };
117
118
119 #define FF_MAX_B_FRAMES 8 /* presumably the upper limit for AVCodecContext.max_b_frames - TODO confirm */
120
121 /* encoding support
122 these flags can be passed in AVCodecContext.flags before initing
123 Note: not everything is supported yet
124 */
125
126 #define CODEC_FLAG_HQ 0x0001 /* brute force MB-type decision mode (slow) */
127 #define CODEC_FLAG_QSCALE 0x0002 /* use fixed qscale */
128 #define CODEC_FLAG_4MV 0x0004 /* 4 MV per MB allowed */
129 #define CODEC_FLAG_QPEL 0x0010 /* use qpel MC */
130 #define CODEC_FLAG_GMC 0x0020 /* use GMC */
131 #define CODEC_FLAG_PART 0x0080 /* use data partitioning */
132 /* parent program guarantees that the input for b-frame containing streams is not written to
133 for at least s->max_b_frames+1 frames, if this is not set then the input will be copied */
134 #define CODEC_FLAG_INPUT_PRESERVED 0x0100
135 #define CODEC_FLAG_PASS1 0x0200 /* use internal 2pass ratecontrol in first pass mode */
136 #define CODEC_FLAG_PASS2 0x0400 /* use internal 2pass ratecontrol in second pass mode */
137 #define CODEC_FLAG_EXTERN_HUFF 0x1000 /* use external huffman table (for mjpeg) */
138 #define CODEC_FLAG_GRAY 0x2000 /* only decode/encode grayscale */
139 #define CODEC_FLAG_EMU_EDGE 0x4000/* don't draw edges */
140 #define CODEC_FLAG_PSNR 0x8000 /* error[?] variables will be set during encoding */
141 #define CODEC_FLAG_TRUNCATED 0x00010000 /* input bitstream might be truncated at a random location instead
142 of only at frame boundaries */
143 #define CODEC_FLAG_NORMALIZE_AQP 0x00020000 /* normalize adaptive quantization */
144 #define CODEC_FLAG_INTERLACED_DCT 0x00040000 /* use interlaced dct */
145 #define CODEC_FLAG_LOW_DELAY 0x00080000 /* force low delay / will fail on b frames */
146 #define CODEC_FLAG_ALT_SCAN 0x00100000 /* use alternate scan */
147 #define CODEC_FLAG_TRELLIS_QUANT 0x00200000 /* use trellis quantization */
148 #define CODEC_FLAG_GLOBAL_HEADER 0x00400000 /* place global headers in extradata instead of every keyframe */
149
150 /* codec capabilities (bit flags; see AVCodec.capabilities) */
151
152 #define CODEC_CAP_DRAW_HORIZ_BAND 0x0001 /* decoder can use draw_horiz_band callback */
153 #define CODEC_CAP_DR1 0x0002 /* direct rendering method 1 */
154 /* if 'parse_only' field is true, then avcodec_parse_frame() can be
155 used */
156 #define CODEC_CAP_PARSE_ONLY 0x0004
157 #define CODEC_CAP_TRUNCATED 0x0008 /* presumably: codec copes with input truncated as described for CODEC_FLAG_TRUNCATED - TODO confirm */
158
159 #define FRAME_RATE_BASE 10000 /* AVCodecContext.frame_rate is frames per second multiplied by this */
160
161 #define FF_COMMON_FRAME \
162 uint8_t *data[4];\
163 int linesize[4];\
164 /**\
165 * pointer to the first allocated byte of the picture. can be used in get_buffer/release_buffer\
166 * this is not used by lavc unless the default get/release_buffer() is used\
167 * encoding: \
168 * decoding: \
169 */\
170 uint8_t *base[4];\
171 /**\
172 * 1 -> keyframe, 0 -> not\
173 * encoding: set by lavc\
174 * decoding: set by lavc\
175 */\
176 int key_frame;\
177 \
178 /**\
179 * picture type of the frame, see ?_TYPE below (the FF_I_TYPE, FF_P_TYPE, ... defines)\
180 * encoding: set by lavc for coded_picture (and set by user for input)\
181 * decoding: set by lavc\
182 */\
183 int pict_type;\
184 \
185 /**\
186 * presentation timestamp in micro seconds (time when frame should be shown to user)\
187 * if 0 then the frame_rate will be used as reference\
188 * encoding: MUST be set by user\
189 * decoding: set by lavc\
190 */\
191 long long int pts;\
192 \
193 /**\
194 * picture number in bitstream order.\
195 * encoding: set by (left unspecified in the original comment - TODO confirm)\
196 * decoding: set by lavc\
197 */\
198 int coded_picture_number;\
199 /**\
200 * picture number in display order.\
201 * encoding: set by (left unspecified in the original comment - TODO confirm)\
202 * decoding: set by lavc\
203 */\
204 int display_picture_number;\
205 \
206 /**\
207 * quality (between 1 (good) and 31 (bad)) \
208 * encoding: set by lavc for coded_picture (and set by user for input)\
209 * decoding: set by lavc\
210 */\
211 float quality; \
212 \
213 /**\
214 * buffer age (1 -> was last buffer and did not change, 2 -> ..., ...).\
215 * set to something large if the buffer has not been used yet \
216 * encoding: unused\
217 * decoding: MUST be set by get_buffer()\
218 */\
219 int age;\
220 \
221 /**\
222 * is this picture used as reference\
223 * encoding: unused\
224 * decoding: set by lavc (before get_buffer() call)\
225 */\
226 int reference;\
227 \
228 /**\
229 * QP table\
230 * encoding: unused\
231 * decoding: set by lavc\
232 */\
233 int8_t *qscale_table;\
234 /**\
235 * QP store stride\
236 * encoding: unused\
237 * decoding: set by lavc\
238 */\
239 int qstride;\
240 \
241 /**\
242 * mbskip_table[mb]>=1 if MB did not change\
243 * stride= mb_width = (width+15)>>4\
244 * encoding: unused\
245 * decoding: set by lavc\
246 */\
247 uint8_t *mbskip_table;\
248 \
249 /**\
250 * for some private data of the user\
251 * encoding: unused\
252 * decoding: set by user\
253 */\
254 void *opaque;\
255 \
256 /**\
257 * error\
258 * encoding: set by lavc if flags&CODEC_FLAG_PSNR\
259 * decoding: unused\
260 */\
261 uint64_t error[4];\
262 \
263 /**\
264 * type of the buffer (to keep track of who has to dealloc data[*]), see FF_BUFFER_TYPE_*\
265 * encoding: set by the one who allocs it\
266 * decoding: set by the one who allocs it\
267 * Note: user allocated (direct rendering) & internal buffers can not coexist currently\
268 */\
269 int type;\
270
271 #define FF_BUFFER_TYPE_INTERNAL 1 // values for the 'type' field of FF_COMMON_FRAME; presumably a buffer allocated by lavc itself - TODO confirm
272 #define FF_BUFFER_TYPE_USER 2 // Direct rendering buffers
273 #define FF_BUFFER_TYPE_SHARED 4 // input frame for encoding (won't be deallocated)
274
275
276 #define FF_I_TYPE 1 // Intra (these are the ?_TYPE values referred to by the pict_type field)
277 #define FF_P_TYPE 2 // Predicted
278 #define FF_B_TYPE 3 // Bi-dir predicted
279 #define FF_S_TYPE 4 // S(GMC)-VOP MPEG4
280
281 typedef struct AVFrame { /* a frame; its members are exactly those listed in FF_COMMON_FRAME */
282 FF_COMMON_FRAME
283 } AVFrame;
284
285 typedef struct AVCodecContext { /* codec parameters and state; documented fields say who sets them for encoding and for decoding */
286 /**
287 * the average bitrate
288 * encoding: set by user. unused for constant quantizer encoding
289 * decoding: set by lavc. 0 or some bitrate if this info is available in the stream
290 */
291 int bit_rate;
292
293 /**
294 * number of bits the bitstream is allowed to diverge from the reference
295 * the reference can be CBR (for CBR pass1) or VBR (for pass2)
296 * encoding: set by user. unused for constant quantizer encoding
297 * decoding: unused
298 */
299 int bit_rate_tolerance;
300
301 /**
302 * CODEC_FLAG_*
303 * encoding: set by user.
304 * decoding: set by user.
305 */
306 int flags;
307
308 /**
309 * some codecs need additional format info. It is stored here
310 * encoding: set by user.
311 * decoding: set by lavc. (FIXME is this ok?)
312 */
313 int sub_id;
314
315 /**
316 * motion estimation algorithm used for video coding
317 * encoding: MUST be set by user.
318 * decoding: unused
319 */
320 int me_method;
321
322 /**
323 * some codecs need / can use extra-data like huffman tables
324 * mjpeg: huffman tables
325 * rv10: additional flags
326 * mpeg4: global headers (they can be in the bitstream or here)
327 * encoding: set/allocated/freed by lavc.
328 * decoding: set/allocated/freed by user.
329 */
330 void *extradata;
331 int extradata_size;
332
333 /* video only */
334 /**
335 * frames per sec multiplied by FRAME_RATE_BASE
336 * for variable fps this is the precision, so if the timestamps
337 * can be specified in msec precision then this is 1000*FRAME_RATE_BASE
338 * encoding: MUST be set by user
339 * decoding: set by lavc. 0 or the frame_rate if available
340 */
341 int frame_rate;
342
343 /**
344 * encoding: MUST be set by user.
345 * decoding: set by user, some codecs might override / change it during playback
346 */
347 int width, height;
348
349 #define FF_ASPECT_SQUARE 1 /* NOTE(review): no field visible in this header refers to these FF_ASPECT_* codes (aspect_ratio below is a float) */
350 #define FF_ASPECT_4_3_625 2
351 #define FF_ASPECT_4_3_525 3
352 #define FF_ASPECT_16_9_625 4
353 #define FF_ASPECT_16_9_525 5
354 #define FF_ASPECT_EXTENDED 15
355
356 /**
357 * the number of pictures in a group of pictures, or 0 for intra_only
358 * encoding: set by user.
359 * decoding: unused
360 */
361 int gop_size;
362
363 /**
364 * pixel format, see PIX_FMT_xxx
365 * encoding: unused
366 * decoding: set by lavc.
367 */
368 enum PixelFormat pix_fmt;
369
370 int repeat_pict; /* when decoding, this signals how much the picture */
371 /* must be delayed. */
372 /* extra_delay = (repeat_pict / 2) * (1/fps) */
373
374 /**
375 * if non NULL, 'draw_horiz_band' is called by the libavcodec
376 * decoder to draw a horizontal band. It improves cache usage. Not
377 * all codecs can do that. You must check the codec capabilities
378 * before (see CODEC_CAP_DRAW_HORIZ_BAND)
379 * encoding: unused
380 * decoding: set by user.
381 */
382 void (*draw_horiz_band)(struct AVCodecContext *s,
383 UINT8 **src_ptr, int linesize,
384 int y, int width, int height);
385
386 /* audio only */
387 int sample_rate; /* samples per sec */
388 int channels;
389 int sample_fmt; /* sample format, currently unused */
390
391 /* the following data should not be initialized */
392 int frame_size; /* in samples, initialized when calling 'init' */
393 int frame_number; /* audio or video frame number */
394 int real_pict_num; /* returns the real picture number of
395 previous encoded frame */
396
397 /**
398 * number of frames the decoded output will be delayed relative to
399 * the encoded input
400 * encoding: set by lavc.
401 * decoding: unused
402 */
403 int delay;
404
405 /* encoding parameters */
406 float qcompress; /* amount of qscale change between easy & hard scenes (0.0-1.0)*/
407 float qblur; /* amount of qscale smoothing over time (0.0-1.0) */
408
409 /**
410 * minimum quantizer
411 * encoding: set by user.
412 * decoding: unused
413 */
414 int qmin;
415
416 /**
417 * maximum quantizer
418 * encoding: set by user.
419 * decoding: unused
420 */
421 int qmax;
422
423 /**
424 * maximum quantizer difference between frames
425 * encoding: set by user.
426 * decoding: unused
427 */
428 int max_qdiff;
429
430 /**
431 * maximum number of b frames between non b frames
432 * note: the output will be delayed by max_b_frames+1 relative to the input
433 * encoding: set by user.
434 * decoding: unused
435 */
436 int max_b_frames;
437
438 /**
439 * qscale factor between ip and b frames
440 * encoding: set by user.
441 * decoding: unused
442 */
443 float b_quant_factor;
444
445 /** obsolete FIXME remove */
446 int rc_strategy;
447 int b_frame_strategy;
448
449 /**
450 * encoding: unused
451 * decoding: set by user. 1-> skip b frames, 2-> skip idct/dequant too, 5-> skip everything except header
452 */
453 int hurry_up;
454
455 struct AVCodec *codec; /* presumably the codec given to avcodec_open() - TODO confirm */
456
457 void *priv_data; /* presumably codec private data of AVCodec.priv_data_size bytes - TODO confirm */
458
459 /* The following data is for RTP friendly coding */
460 /* By now only H.263/H.263+/MPEG4 coder honours this */
461 int rtp_mode; /* 1 for activate RTP friendly-mode */
462 /* higher numbers represent more error-prone */
463 /* environments, by now just "1" exists */
464
465 int rtp_payload_size; /* The size of the RTP payload, the coder will */
466 /* do its best to deliver a chunk with size */
467 /* below rtp_payload_size, the chunk will start */
468 /* with a start code on some codecs like H.263 */
469 /* This doesn't take account of any particular */
470 /* headers inside the transmitted RTP payload */
471
472
473 /* The RTP callback: This function is called */
474 /* every time the encoder has a packet to send */
475 /* Depends on the encoder if the data starts */
476 /* with a Start Code (it should) H.263 does */
477 void (*rtp_callback)(void *data, int size, int packet_number);
478
479 /* statistics, used for 2-pass encoding */
480 int mv_bits;
481 int header_bits;
482 int i_tex_bits;
483 int p_tex_bits;
484 int i_count;
485 int p_count;
486 int skip_count;
487 int misc_bits;
488
489 /**
490 * number of bits used for the previously encoded frame
491 * encoding: set by lavc
492 * decoding: - for audio - bits_per_sample
493 */
494 int frame_bits;
495
496 /**
497 * private data of the user, can be used to carry app specific stuff
498 * encoding: set by user
499 * decoding: set by user
500 */
501 void *opaque;
502
503 char codec_name[32];
504 enum CodecType codec_type; /* see CODEC_TYPE_xxx */
505 enum CodecID codec_id; /* see CODEC_ID_xxx */
506 unsigned int codec_tag; /* codec tag, only used if unknown codec */
507
508 /**
509 * work around bugs in encoders which sometimes cannot be detected automatically
510 * (value built from the FF_BUG_* defines below)
511 * encoding: unused
512 * decoding: set by user
513 */
514 int workaround_bugs;
515 #define FF_BUG_AUTODETECT 1 //autodetection
516 #define FF_BUG_OLD_MSMPEG4 2
517 #define FF_BUG_XVID_ILACE 4
518 #define FF_BUG_UMP4 8
519 #define FF_BUG_NO_PADDING 16
520 #define FF_BUG_AC_VLC 32
521 #define FF_BUG_QPEL_CHROMA 64
522 #define FF_BUG_STD_QPEL 128
523 //#define FF_BUG_FAKE_SCALABILITY 16 //autodetection should work 100%
524
525 /**
526 * encoding: set by user
527 * decoding: unused
528 */
529 int luma_elim_threshold;
530
531 /**
532 * encoding: set by user
533 * decoding: unused
534 */
535 int chroma_elim_threshold;
536
537 /**
538 * strictly follow the std (MPEG4, ...)
539 * encoding: set by user
540 * decoding: unused
541 */
542 int strict_std_compliance;
543
544 /**
545 * qscale offset between ip and b frames
546 * if > 0 then the last p frame quantizer will be used (q= lastp_q*factor+offset)
547 * if < 0 then normal ratecontrol will be done (q= -normal_q*factor+offset)
548 * encoding: set by user.
549 * decoding: unused
550 */
551 float b_quant_offset;
552
553 /**
554 * error resilience; higher values will detect more errors but may misdetect
555 * some more or less valid parts as errors (see FF_ER_* below)
556 * encoding: unused
557 * decoding: set by user
558 */
559 int error_resilience;
560 #define FF_ER_CAREFULL 1
561 #define FF_ER_COMPLIANT 2
562 #define FF_ER_AGGRESSIVE 3
563 #define FF_ER_VERY_AGGRESSIVE 4
564
565 /**
566 * called at the beginning of each frame to get a buffer for it.
567 * if pic.reference is set then the frame will be read later by lavc
568 * encoding: unused
569 * decoding: set by lavc, user can override
570 */
571 int (*get_buffer)(struct AVCodecContext *c, AVFrame *pic);
572
573 /**
574 * called to release buffers which were allocated with get_buffer.
575 * a released buffer can be reused in get_buffer()
576 * pic.data[*] must be set to NULL
577 * encoding: unused
578 * decoding: set by lavc, user can override
579 */
580 void (*release_buffer)(struct AVCodecContext *c, AVFrame *pic);
581
582 /**
583 * is 1 if the decoded stream contains b frames, 0 otherwise
584 * encoding: unused
585 * decoding: set by lavc
586 */
587 int has_b_frames;
588
589 int block_align; /* used by some WAV based audio codecs */
590
591 int parse_only; /* decoding only: if true, only parsing is done
592 (function avcodec_parse_frame()). The frame
593 data is returned. Only MPEG codecs support this now. */
594
595 /**
596 * 0-> h263 quant 1-> mpeg quant
597 * encoding: set by user.
598 * decoding: unused
599 */
600 int mpeg_quant;
601
602 /**
603 * pass1 encoding statistics output buffer
604 * encoding: set by lavc
605 * decoding: unused
606 */
607 char *stats_out; /* encoding statistics output buffer */
608
609 /**
610 * pass2 encoding statistics input buffer.
611 * concatenated stuff from stats_out of pass1 should be placed here
612 * encoding: allocated/set/freed by user
613 * decoding: unused
614 */
615 char *stats_in;
616
617 /**
618 * ratecontrol qmin qmax limiting method
619 * 0-> clipping, 1-> use a nice continuous function to limit qscale within qmin/qmax
620 * encoding: set by user.
621 * decoding: unused
622 */
623 float rc_qsquish;
624
625 float rc_qmod_amp;
626 int rc_qmod_freq;
627
628 /**
629 * ratecontrol override, see RcOverride
630 * encoding: allocated/set/freed by user.
631 * decoding: unused
632 */
633 RcOverride *rc_override;
634 int rc_override_count;
635
636 /**
637 * rate control equation
638 * encoding: set by user
639 * decoding: unused
640 */
641 char *rc_eq;
642
643 /**
644 * maximum bitrate
645 * encoding: set by user.
646 * decoding: unused
647 */
648 int rc_max_rate;
649
650 /**
651 * minimum bitrate
652 * encoding: set by user.
653 * decoding: unused
654 */
655 int rc_min_rate;
656
657 /**
658 * decoder bitstream buffer size
659 * encoding: set by user.
660 * decoding: unused
661 */
662 int rc_buffer_size;
663 float rc_buffer_aggressivity;
664
665 /**
666 * qscale factor between p and i frames
667 * encoding: set by user.
668 * decoding: unused
669 */
670 float i_quant_factor;
671
672 /**
673 * qscale offset between p and i frames
674 * if > 0 then the last p frame quantizer will be used (q= lastp_q*factor+offset)
675 * if < 0 then normal ratecontrol will be done (q= -normal_q*factor+offset)
676 * encoding: set by user.
677 * decoding: unused
678 */
679 float i_quant_offset;
680
681 /**
682 * initial complexity for pass1 ratecontrol
683 * encoding: set by user.
684 * decoding: unused
685 */
686 float rc_initial_cplx;
687
688 /**
689 * dct algorithm, see FF_DCT_* below
690 * encoding: set by user
691 * decoding: unused
692 */
693 int dct_algo;
694 #define FF_DCT_AUTO 0
695 #define FF_DCT_FASTINT 1
696 #define FF_DCT_INT 2
697 #define FF_DCT_MMX 3
698 #define FF_DCT_MLIB 4
699 #define FF_DCT_ALTIVEC 5
700
701 /**
702 * luminance masking (0-> disabled)
703 * encoding: set by user
704 * decoding: unused
705 */
706 float lumi_masking;
707
708 /**
709 * temporal complexity masking (0-> disabled)
710 * encoding: set by user
711 * decoding: unused
712 */
713 float temporal_cplx_masking;
714
715 /**
716 * spatial complexity masking (0-> disabled)
717 * encoding: set by user
718 * decoding: unused
719 */
720 float spatial_cplx_masking;
721
722 /**
723 * p block masking (0-> disabled)
724 * encoding: set by user
725 * decoding: unused
726 */
727 float p_masking;
728
729 /**
730 * darkness masking (0-> disabled)
731 * encoding: set by user
732 * decoding: unused
733 */
734 float dark_masking;
735
736 /**
737 * fourcc (LSB first, so "ABCD" -> ('D'<<24) + ('C'<<16) + ('B'<<8) + 'A')
738 * this is used to work around some encoder bugs
739 * encoding: unused
740 * decoding: set by user, will be converted to upper case by lavc during init
741 */
742 int fourcc;
743
744 /**
745 * idct algorithm, see FF_IDCT_* below
746 * encoding: set by user
747 * decoding: set by user
748 */
749 int idct_algo;
750 #define FF_IDCT_AUTO 0
751 #define FF_IDCT_INT 1
752 #define FF_IDCT_SIMPLE 2
753 #define FF_IDCT_SIMPLEMMX 3
754 #define FF_IDCT_LIBMPEG2MMX 4
755 #define FF_IDCT_PS2 5
756 #define FF_IDCT_MLIB 6
757 #define FF_IDCT_ARM 7
758 #define FF_IDCT_ALTIVEC 8
759
760 /**
761 * slice count
762 * encoding: set by lavc
763 * decoding: set by user (or 0)
764 */
765 int slice_count;
766 /**
767 * slice offsets in the frame in bytes
768 * encoding: set/allocated by lavc
769 * decoding: set/allocated by user (or NULL)
770 */
771 int *slice_offset;
772
773 /**
774 * error concealment flags (see FF_EC_* below)
775 * encoding: unused
776 * decoding: set by user
777 */
778 int error_concealment;
779 #define FF_EC_GUESS_MVS 1
780 #define FF_EC_DEBLOCK 2
781
782 /**
783 * dsp_mask could be used to disable unwanted
784 * CPU features (e.g. MMX, SSE, ...)
785 */
786 unsigned dsp_mask;
787
788 /**
789 * bits per sample/pixel from the demuxer (needed for huffyuv)
790 * encoding: set by lavc
791 * decoding: set by user
792 */
793 int bits_per_sample;
794
795 /**
796 * prediction method (needed for huffyuv), see FF_PRED_* below
797 * encoding: set by user
798 * decoding: unused
799 */
800 int prediction_method;
801 #define FF_PRED_LEFT 0
802 #define FF_PRED_PLANE 1
803 #define FF_PRED_MEDIAN 2
804
805 /**
806 * aspect ratio. (0 if unknown)
807 * encoding: set by user.
808 * decoding: set by lavc.
809 */
810 float aspect_ratio;
811
812 /**
813 * the picture in the bitstream
814 * encoding: set by lavc
815 * decoding: set by lavc
816 */
817 AVFrame *coded_frame;
818
819 /**
820 * debug (value built from the FF_DEBUG_* defines below)
821 * encoding: set by user.
822 * decoding: set by user.
823 */
824 int debug;
825 #define FF_DEBUG_PICT_INFO 1
826 #define FF_DEBUG_RC 2
827 #define FF_DEBUG_BITSTREAM 4
828 #define FF_DEBUG_MB_TYPE 8
829 #define FF_DEBUG_QP 16
830 #define FF_DEBUG_MV 32
831 #define FF_DEBUG_VIS_MV 0x00000040
832 #define FF_DEBUG_SKIP 0x00000080
833 #define FF_DEBUG_STARTCODE 0x00000100
834 #define FF_DEBUG_PTS 0x00000200
835
836 /**
837 * error
838 * encoding: set by lavc if flags&CODEC_FLAG_PSNR
839 * decoding: unused
840 */
841 uint64_t error[4];
842
843 /**
844 * minimum MB quantizer
845 * encoding: set by user.
846 * decoding: unused
847 */
848 int mb_qmin;
849
850 /**
851 * maximum MB quantizer
852 * encoding: set by user.
853 * decoding: unused
854 */
855 int mb_qmax;
856
857 /**
858 * motion estimation compare function (see FF_CMP_* below)
859 * encoding: set by user.
860 * decoding: unused
861 */
862 int me_cmp;
863 /**
864 * subpixel motion estimation compare function
865 * encoding: set by user.
866 * decoding: unused
867 */
868 int me_sub_cmp;
869 /**
870 * macroblock compare function (not supported yet)
871 * encoding: set by user.
872 * decoding: unused
873 */
874 int mb_cmp;
875 #define FF_CMP_SAD 0
876 #define FF_CMP_SSE 1
877 #define FF_CMP_SATD 2
878 #define FF_CMP_DCT 3
879 #define FF_CMP_PSNR 4
880 #define FF_CMP_BIT 5
881 #define FF_CMP_RD 6
882 #define FF_CMP_ZERO 7
883 #define FF_CMP_CHROMA 256
884
885 /**
886 * ME diamond size & shape
887 * encoding: set by user.
888 * decoding: unused
889 */
890 int dia_size;
891
892 /**
893 * amount of previous MV predictors (2a+1 x 2a+1 square)
894 * encoding: set by user.
895 * decoding: unused
896 */
897 int last_predictor_count;
898
899 /**
900 * pre pass for motion estimation
901 * encoding: set by user.
902 * decoding: unused
903 */
904 int pre_me;
905
906 /**
907 * motion estimation pre pass compare function
908 * encoding: set by user.
909 * decoding: unused
910 */
911 int me_pre_cmp;
912
913 /**
914 * ME pre pass diamond size & shape
915 * encoding: set by user.
916 * decoding: unused
917 */
918 int pre_dia_size;
919
920 /**
921 * subpel ME quality
922 * encoding: set by user.
923 * decoding: unused
924 */
925 int me_subpel_quality;
926
927 } AVCodecContext;
927
928 typedef struct AVCodec { /* description of one codec: identification, entry points and capabilities */
929 const char *name; /* presumably the name matched by avcodec_find_encoder_by_name()/avcodec_find_decoder_by_name() - TODO confirm */
930 int type; /* presumably an enum CodecType value - TODO confirm */
931 int id; /* presumably an enum CodecID value - TODO confirm */
932 int priv_data_size;
933 int (*init)(AVCodecContext *);
934 int (*encode)(AVCodecContext *, UINT8 *buf, int buf_size, void *data);
935 int (*close)(AVCodecContext *);
936 int (*decode)(AVCodecContext *, void *outdata, int *outdata_size,
937 UINT8 *buf, int buf_size);
938 int capabilities; /* presumably a combination of CODEC_CAP_* - TODO confirm */
939 struct AVCodec *next; /* link to another AVCodec; presumably the list that starts at first_avcodec - TODO confirm */
940 } AVCodec;
941
942 /**
943 * a picture with at most four components; each has a data pointer and a linesize.
944 * the last component is alpha
945 */
946 typedef struct AVPicture {
947 UINT8 *data[4];
948 int linesize[4];
949 } AVPicture;
950
951 extern AVCodec ac3_encoder; /* encoders (declared here, defined elsewhere) */
952 extern AVCodec mp2_encoder;
953 extern AVCodec mp3lame_encoder;
954 extern AVCodec oggvorbis_encoder;
955 extern AVCodec mpeg1video_encoder;
956 extern AVCodec h263_encoder;
957 extern AVCodec h263p_encoder;
958 extern AVCodec rv10_encoder;
959 extern AVCodec mjpeg_encoder;
960 extern AVCodec mpeg4_encoder;
961 extern AVCodec msmpeg4v1_encoder;
962 extern AVCodec msmpeg4v2_encoder;
963 extern AVCodec msmpeg4v3_encoder;
964 extern AVCodec wmv1_encoder;
965 extern AVCodec wmv2_encoder;
966 extern AVCodec huffyuv_encoder;
967
968 extern AVCodec h263_decoder; /* decoders (declared here, defined elsewhere) */
969 extern AVCodec mpeg4_decoder;
970 extern AVCodec msmpeg4v1_decoder;
971 extern AVCodec msmpeg4v2_decoder;
972 extern AVCodec msmpeg4v3_decoder;
973 extern AVCodec wmv1_decoder;
974 extern AVCodec wmv2_decoder;
975 extern AVCodec mpeg_decoder;
976 extern AVCodec h263i_decoder;
977 extern AVCodec rv10_decoder;
978 extern AVCodec svq1_decoder;
979 extern AVCodec dvvideo_decoder;
980 extern AVCodec dvaudio_decoder;
981 extern AVCodec wmav1_decoder;
982 extern AVCodec wmav2_decoder;
983 extern AVCodec mjpeg_decoder;
984 extern AVCodec mjpegb_decoder;
985 extern AVCodec mp2_decoder;
986 extern AVCodec mp3_decoder;
987 extern AVCodec mace3_decoder;
988 extern AVCodec mace6_decoder;
989 extern AVCodec huffyuv_decoder;
990 extern AVCodec oggvorbis_decoder;
991
992 /* pcm codecs: PCM_CODEC(id, name) declares name_decoder and name_encoder; the id argument is not used by the expansion */
993 #define PCM_CODEC(id, name) \
994 extern AVCodec name ## _decoder; \
995 extern AVCodec name ## _encoder
996
997 PCM_CODEC(CODEC_ID_PCM_S16LE, pcm_s16le);
998 PCM_CODEC(CODEC_ID_PCM_S16BE, pcm_s16be);
999 PCM_CODEC(CODEC_ID_PCM_U16LE, pcm_u16le);
1000 PCM_CODEC(CODEC_ID_PCM_U16BE, pcm_u16be);
1001 PCM_CODEC(CODEC_ID_PCM_S8, pcm_s8);
1002 PCM_CODEC(CODEC_ID_PCM_U8, pcm_u8);
1003 PCM_CODEC(CODEC_ID_PCM_ALAW, pcm_alaw);
1004 PCM_CODEC(CODEC_ID_PCM_MULAW, pcm_mulaw);
1005
1006 /* adpcm codecs (declared with the same macro) */
1007
1008 PCM_CODEC(CODEC_ID_ADPCM_IMA_QT, adpcm_ima_qt);
1009 PCM_CODEC(CODEC_ID_ADPCM_IMA_WAV, adpcm_ima_wav);
1010 PCM_CODEC(CODEC_ID_ADPCM_MS, adpcm_ms);
1011
1012 #undef PCM_CODEC
1013
1014 /* dummy raw video codec (one AVCodec object, not an _encoder/_decoder pair) */
1015 extern AVCodec rawvideo_codec;
1016
1017 /* the following codecs use external GPL libs */
1018 extern AVCodec ac3_decoder;
1019
1020 /* audio resampling (resample.c) */
1021
1022 struct ReSampleContext; /* opaque here: only declared, never defined in this header */
1023
1024 typedef struct ReSampleContext ReSampleContext;
1025
1026 ReSampleContext *audio_resample_init(int output_channels, int input_channels,
1027 int output_rate, int input_rate);
1028 int audio_resample(ReSampleContext *s, short *output, short *input, int nb_samples); /* presumably returns the number of output samples - TODO confirm */
1029 void audio_resample_close(ReSampleContext *s);
1030
1031 /* image resampling; YUV420 format is assumed ! */
1032
1033 struct ImgReSampleContext; /* opaque here: only declared, never defined in this header */
1034
1035 typedef struct ImgReSampleContext ImgReSampleContext;
1036
1037 ImgReSampleContext *img_resample_init(int output_width, int output_height,
1038 int input_width, int input_height);
1039
1040 ImgReSampleContext *img_resample_full_init(int owidth, int oheight,
1041 int iwidth, int iheight,
1042 int topBand, int bottomBand,
1043 int leftBand, int rightBand); /* the *Band arguments are presumably borders cropped from the input - TODO confirm */
1044
1045 void img_resample(ImgReSampleContext *s,
1046 AVPicture *output, AVPicture *input);
1047
1048 void img_resample_close(ImgReSampleContext *s);
1049
1050 int avpicture_fill(AVPicture *picture, UINT8 *ptr,
1051 int pix_fmt, int width, int height); /* returns the image size */
1052 int avpicture_get_size(int pix_fmt, int width, int height);
1053 void avcodec_get_chroma_sub_sample(int pix_fmt, int *h_shift, int *v_shift); /* results are written through h_shift and v_shift */
1054 const char *avcodec_get_pix_fmt_name(int pix_fmt);
1055
1056 /* convert among pixel formats */
1057 int img_convert(AVPicture *dst, int dst_pix_fmt,
1058 AVPicture *src, int pix_fmt,
1059 int width, int height);
1060
1061 /* deinterlace a picture */
1062 int avpicture_deinterlace(AVPicture *dst, AVPicture *src,
1063 int pix_fmt, int width, int height);
1064
1065 /* external high level API */
1066
1067 extern AVCodec *first_avcodec; /* presumably the head of the list linked through AVCodec.next - TODO confirm */
1068
1069 /* returns LIBAVCODEC_VERSION_INT constant */
1070 unsigned avcodec_version(void);
1071 /* returns LIBAVCODEC_BUILD constant */
1072 unsigned avcodec_build(void);
1073 void avcodec_init(void);
1074
1075 void avcodec_set_bit_exact(void);
1076
1077 void register_avcodec(AVCodec *format);
1078 AVCodec *avcodec_find_encoder(enum CodecID id);
1079 AVCodec *avcodec_find_encoder_by_name(const char *name);
1080 AVCodec *avcodec_find_decoder(enum CodecID id);
1081 AVCodec *avcodec_find_decoder_by_name(const char *name);
1082 void avcodec_string(char *buf, int buf_size, AVCodecContext *enc, int encode);
1083
1084 void avcodec_get_context_defaults(AVCodecContext *s);
1085 AVCodecContext *avcodec_alloc_context(void);
1086 AVFrame *avcodec_alloc_frame(void);
1087
1088 int avcodec_default_get_buffer(AVCodecContext *s, AVFrame *pic); /* signature matches AVCodecContext.get_buffer */
1089 void avcodec_default_release_buffer(AVCodecContext *s, AVFrame *pic); /* signature matches AVCodecContext.release_buffer */
1090
1091 int avcodec_open(AVCodecContext *avctx, AVCodec *codec);
1092 int avcodec_decode_audio(AVCodecContext *avctx, INT16 *samples,
1093 int *frame_size_ptr,
1094 UINT8 *buf, int buf_size);
1095 int avcodec_decode_video(AVCodecContext *avctx, AVFrame *picture,
1096 int *got_picture_ptr,
1097 UINT8 *buf, int buf_size);
1098 int avcodec_parse_frame(AVCodecContext *avctx, UINT8 **pdata,
1099 int *data_size_ptr,
1100 UINT8 *buf, int buf_size); /* see AVCodecContext.parse_only and CODEC_CAP_PARSE_ONLY */
1101 int avcodec_encode_audio(AVCodecContext *avctx, UINT8 *buf, int buf_size,
1102 const short *samples);
1103 int avcodec_encode_video(AVCodecContext *avctx, UINT8 *buf, int buf_size,
1104 const AVFrame *pict);
1105
1106 int avcodec_close(AVCodecContext *avctx);
1107
1108 void avcodec_register_all(void);
1109
1110 void avcodec_flush_buffers(AVCodecContext *avctx);
1111
1112 typedef struct {
1113 /** option's name with default value */
1114 const char* name;
1115 /** English text help */
1116 const char* help;
1117 /** type of variable (one of the FF_CONF_TYPE_* values below, possibly with flag bits) */
1118 int type;
1119 #define FF_CONF_TYPE_BOOL 1 // boolean - true,1,on (or simply presence)
1120 #define FF_CONF_TYPE_DOUBLE 2 // double
1121 #define FF_CONF_TYPE_INT 3 // integer
1122 #define FF_CONF_TYPE_STRING 4 // string (finished with \0)
1123 #define FF_CONF_TYPE_MASK 0x1f // mask for types - upper bits are various flags
1124 #define FF_CONF_TYPE_EXPERT 0x20 // flag for expert option
1125 #define FF_CONF_TYPE_FLAG (FF_CONF_TYPE_BOOL | 0x40)
1126 #define FF_CONF_TYPE_RCOVERIDE (FF_CONF_TYPE_STRING | 0x80)
1127 /** where the parsed value should be stored */
1128 void* val;
1129 /** min value (min == max -> no limits) */
1130 double min;
1131 /** maximum value for double/int */
1132 double max;
1133 /** default bool [0,1]/double/int value */
1134 double defval;
1135 /**
1136 * default string value (with optional semicolon delimited extra option-list
1137 * i.e. option1;option2;option3)
1138 * defval might select other than the first argument as default
1139 */
1140 const char* defstr;
1141 /** char* list of supported codecs (e.g. ",msmpeg4,h263,"); NULL - everything */
1142 const char* supported;
1143 } avc_config_t;
1144
1145 void avcodec_getopt(AVCodecContext* avctx, char* str, avc_config_t** config);
1146
1147 /**
1148 * Interface for 0.5.0 version
1149 *
1150 * do not even think about its usage for the moment
1151 */
1152
1153 typedef struct {
1154 /// compressed size used from given memory buffer
1155 int size;
1156 /// I/P/B frame type
1157 int frame_type;
1158 } avc_enc_result_t;
1159
1160 /**
1161 * Commands
1162 * order can't be changed - once it was defined
1163 */
1164 typedef enum {
1165 // general commands
1166 AVC_OPEN_BY_NAME = 0xACA000,
1167 AVC_OPEN_BY_CODEC_ID,
1168 AVC_OPEN_BY_FOURCC,
1169 AVC_CLOSE,
1170
1171 AVC_FLUSH,
1172 // pin - struct { uint8_t* src, uint_t src_size }
1173 // pout - struct { AVPicture* img, consumed_bytes, }
1174 AVC_DECODE,
1175 // pin - struct { AVPicture* img, uint8_t* dest, uint_t dest_size }
1176 // pout - uint_t used_from_dest_size
1177 AVC_ENCODE,
1178
1179 // query/get video commands
1180 AVC_GET_VERSION = 0xACB000,
1181 AVC_GET_WIDTH,
1182 AVC_GET_HEIGHT,
1183 AVC_GET_DELAY,
1184 AVC_GET_QUANT_TABLE,
1185 // ...
1186
1187 // query/get audio commands
1188 AVC_GET_FRAME_SIZE = 0xABC000, // NOTE(review): breaks the 0xACA000/0xACB000/0xACD000 pattern - possibly a typo for 0xACC000; value is part of the interface, do not change without checking users
1189
1190 // maybe define some simple structure which
1191 // might be passed to the user - but they can't
1192 // contain any codec specific parts and these
1193 // calls are usually necessary only a few times
1194
1195 // set video commands
1196 AVC_SET_WIDTH = 0xACD000,
1197 AVC_SET_HEIGHT,
1198
1199 // set video encoding commands
1200 AVC_SET_FRAME_RATE = 0xACD800,
1201 AVC_SET_QUALITY,
1202 AVC_SET_HURRY_UP,
1203
1204 // set audio commands
1205 AVC_SET_SAMPLE_RATE = 0xACE000,
1206 AVC_SET_CHANNELS,
1207
1208 } avc_cmd_t;
1209
1210 /**
1211 * \param handle allocated private structure by libavcodec
1212 * for initialization pass NULL - will be returned in pout
1213 * user is supposed to know nothing about its structure
1214 * \param cmd type of operation to be performed (see avc_cmd_t)
1215 * \param pin input parameter
1216 * \param pout output parameter
1217 *
1218 * \returns command status - for a query command it might instead return
1219 * the resulting integer value
1220 */
1221 int avcodec(void* handle, avc_cmd_t cmd, void* pin, void* pout);
1222
1223 /* memory */
1224 void *av_malloc(unsigned int size);
1225 void *av_mallocz(unsigned int size);
1226 void av_free(void *ptr);
1227 void __av_freep(void **ptr);
1228 #define av_freep(p) __av_freep((void **)(p)) /* casts p to void ** so a pointer to any pointer type can be passed */
1229 /* for static data only */
1230 /* call av_free_static to release all statically allocated tables */
1231 void av_free_static(void);
1232 void *__av_mallocz_static(void** location, unsigned int size);
1233 #define av_mallocz_static(p, s) __av_mallocz_static((void **)(p), s) /* same cast as av_freep, applied to the location argument */
1234
1235 #endif /* AVCODEC_H */