support for DV aspect ratio and erroneous audio patch by (Dan Dennedy (dan at dennedy...
[libav.git] / libavcodec / mpegvideo.h
CommitLineData
de6d9b64
FB
1/*
2 * Generic DCT based hybrid video encoder
ff4ec49e 3 * Copyright (c) 2000, 2001, 2002 Fabrice Bellard.
de6d9b64 4 *
ff4ec49e
FB
5 * This library is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU Lesser General Public
7 * License as published by the Free Software Foundation; either
8 * version 2 of the License, or (at your option) any later version.
de6d9b64 9 *
ff4ec49e 10 * This library is distributed in the hope that it will be useful,
de6d9b64 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
ff4ec49e
FB
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * Lesser General Public License for more details.
de6d9b64 14 *
ff4ec49e
FB
15 * You should have received a copy of the GNU Lesser General Public
16 * License along with this library; if not, write to the Free Software
17 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
de6d9b64
FB
18 */
19
983e3246
MN
20/**
21 * @file mpegvideo.h
22 * mpegvideo header.
23 */
24
cd4af68a
ZK
25#ifndef AVCODEC_MPEGVIDEO_H
26#define AVCODEC_MPEGVIDEO_H
27
5c91a675
ZK
28#include "dsputil.h"
29
#define FRAME_SKIPED 100 ///< return value for header parsers if frame is not coded
eec1c6b9 31
de6d9b64
FB
/**
 * Output format identifiers.
 * Enumerators take the implicit values 0, 1, 2 in declaration order.
 */
enum OutputFormat {
    FMT_MPEG1,
    FMT_H263,
    FMT_MJPEG,
};
37
1e491e29
MN
#define EDGE_WIDTH 16

#define MPEG_BUF_SIZE (16 * 1024)

#define QMAT_SHIFT_MMX 16
#define QMAT_SHIFT 22

#define MAX_FCODE 7
#define MAX_MV 2048

#define MAX_PICTURE_COUNT 15

#define ME_MAP_SIZE 64
#define ME_MAP_SHIFT 3
#define ME_MAP_MV_BITS 11

/* run length table */
#define MAX_RUN    64
#define MAX_LEVEL  64

/* picture types, aliases of the FF_*_TYPE constants defined outside this header */
#define I_TYPE FF_I_TYPE  ///< Intra
#define P_TYPE FF_P_TYPE  ///< Predicted
#define B_TYPE FF_B_TYPE  ///< Bi-dir predicted
#define S_TYPE FF_S_TYPE  ///< S(GMC)-VOP MPEG4
140cb663 62
9cdd6a24
MN
/**
 * Predictor state: three double precision values.
 * NOTE(review): the exact update rule lives outside this header (the
 * rate control context keeps an array of these) - confirm there.
 */
typedef struct Predictor{
    double coeff;
    double count;
    double decay;
} Predictor;
68
8b4c7dbc
MN
/**
 * One rate control record (RateControlContext holds an array of these
 * together with its entry count).
 */
typedef struct RateControlEntry{
    int pict_type;
    float qscale;
    int mv_bits;
    int i_tex_bits;
    int p_tex_bits;
    int misc_bits;
    uint64_t expected_bits;
    int new_pict_type;
    float new_qscale;
    int mc_mb_var_sum;
    int mb_var_sum;
    int i_count;
    int f_code;
    int b_code;
}RateControlEntry;
85
277f4827
MN
86/**
87 * rate control context.
88 */
8b4c7dbc
MN
89typedef struct RateControlContext{
90 FILE *stats_file;
277f4827 91 int num_entries; ///< number of RateControlEntries
8b4c7dbc 92 RateControlEntry *entry;
277f4827 93 int buffer_index; ///< amount of bits in the video/audio buffer
3aa102be 94 Predictor pred[5];
277f4827
MN
95 double short_term_qsum; ///< sum of recent qscales
96 double short_term_qcount; ///< count of recent qscales
97 double pass1_rc_eq_output_sum;///< sum of the output of the rc equation, this is used for normalization
98 double pass1_wanted_bits; ///< bits which should have been outputed by the pass1 code (including complexity init)
3aa102be 99 double last_qscale;
277f4827 100 double last_qscale_for[5]; ///< last qscale for a specific pict type, used for max_diff & ipb factor stuff
3aa102be
MN
101 int last_mc_mb_var_sum;
102 int last_mb_var_sum;
0c1a9eda
ZK
103 uint64_t i_cplx_sum[5];
104 uint64_t p_cplx_sum[5];
105 uint64_t mv_bits_sum[5];
106 uint64_t qscale_sum[5];
3aa102be 107 int frame_count[5];
947ac25a 108 int last_non_b_pict_type;
8b4c7dbc
MN
109}RateControlContext;
110
277f4827
MN
/**
 * Scantable.
 */
typedef struct ScanTable{
    const uint8_t *scantable;
    uint8_t permutated[64];
    uint8_t raster_end[64];
#ifdef ARCH_POWERPC
                /** Used by dct_quantise_altivec to find last-non-zero */
    uint8_t __align8 inverse[64];
#endif
} ScanTable;
123
277f4827
MN
124/**
125 * Picture.
126 */
1e491e29 127typedef struct Picture{
492cd3a9 128 FF_COMMON_FRAME
1e491e29 129
277f4827
MN
130 int mb_var_sum; ///< sum of MB variance for current frame
131 int mc_mb_var_sum; ///< motion compensated MB variance for current frame
132 uint16_t *mb_var; ///< Table for MB variances
133 uint16_t *mc_mb_var; ///< Table for motion compensated MB variances
134 uint8_t *mb_mean; ///< Table for MB luminance
135 int32_t *mb_cmp_score; ///< Table for MB cmp scores, for mb decission
0d1e9246 136 int b_frame_score; /* */
1e491e29
MN
137} Picture;
138
/**
 * Parser state: a byte buffer with its size plus index/state bookkeeping.
 * NOTE(review): the field semantics are defined by the code that fills
 * this structure, which is not visible in this header - confirm there.
 */
typedef struct ParseContext{
    uint8_t *buffer;
    int index;
    int last_index;
    int buffer_size;
    int state;
    int frame_start_found;
} ParseContext;
147
1457ab52
MN
148struct MpegEncContext;
149
277f4827
MN
150/**
151 * Motion estimation context.
152 */
1457ab52 153typedef struct MotionEstContext{
277f4827
MN
154 int skip; ///< set if ME is skiped for the current MB
155 int co_located_mv[4][2]; ///< mv from last p frame for direct mode ME
1457ab52 156 int direct_basis_mv[4][2];
277f4827
MN
157 uint8_t *scratchpad; ///< data area for the me algo, so that the ME doesnt need to malloc/free
158 uint32_t *map; ///< map to avoid duplicate evaluations
159 uint32_t *score_map; ///< map to store the scores
1457ab52 160 int map_generation;
826f429a 161 int pre_penalty_factor;
1457ab52
MN
162 int penalty_factor;
163 int sub_penalty_factor;
67725183 164 int mb_penalty_factor;
277f4827 165 int pre_pass; ///< = 1 for the pre pass
826f429a 166 int dia_size;
30952237 167 uint8_t (*mv_penalty)[MAX_MV*2+1]; ///< amount of bits needed to encode a MV
1457ab52
MN
168 int (*sub_motion_search)(struct MpegEncContext * s,
169 int *mx_ptr, int *my_ptr, int dmin,
170 int xmin, int ymin, int xmax, int ymax,
171 int pred_x, int pred_y, Picture *ref_picture,
30952237 172 int n, int size, uint8_t * const mv_penalty);
1457ab52
MN
173 int (*motion_search[7])(struct MpegEncContext * s, int block,
174 int *mx_ptr, int *my_ptr,
175 int P[10][2], int pred_x, int pred_y,
826f429a 176 int xmin, int ymin, int xmax, int ymax, Picture *ref_picture, int16_t (*last_mv)[2],
30952237 177 int ref_mv_scale, uint8_t * const mv_penalty);
826f429a
MN
178 int (*pre_motion_search)(struct MpegEncContext * s, int block,
179 int *mx_ptr, int *my_ptr,
180 int P[10][2], int pred_x, int pred_y,
b07a5980 181 int xmin, int ymin, int xmax, int ymax, Picture *ref_picture, int16_t (*last_mv)[2],
30952237 182 int ref_mv_scale, uint8_t * const mv_penalty);
67725183 183 int (*get_mb_score)(struct MpegEncContext * s, int mx, int my, int pred_x, int pred_y, Picture *ref_picture,
30952237 184 uint8_t * const mv_penalty);
1457ab52
MN
185}MotionEstContext;
186
277f4827
MN
187/**
188 * MpegEncContext.
189 */
de6d9b64 190typedef struct MpegEncContext {
58f26ba9 191 struct AVCodecContext *avctx;
de6d9b64 192 /* the following parameters must be initialized before encoding */
277f4827 193 int width, height;///< picture size. must be a multiple of 16
de6d9b64 194 int gop_size;
277f4827
MN
195 int intra_only; ///< if true, only intra pictures are generated
196 int bit_rate; ///< wanted bit rate
197 int bit_rate_tolerance; ///< amount of +- bits (>0)
198 enum OutputFormat out_format; ///< output format
199 int h263_pred; ///< use mpeg4/h263 ac/dc predictions
d7e9533a
MN
200
201/* the following codec id fields are deprecated in favor of codec_id */
277f4827
MN
202 int h263_plus; ///< h263 plus headers
203 int h263_rv10; ///< use RV10 variation for H263
204 int h263_msmpeg4; ///< generate MSMPEG4 compatible stream (deprecated, use msmpeg4_version instead)
205 int h263_intel; ///< use I263 intel h263 header
d7e9533a
MN
206
207 int codec_id; /* see CODEC_ID_xxx */
277f4827
MN
208 int fixed_qscale; ///< fixed qscale if non zero
209 float qcompress; ///< amount of qscale change between easy & hard scenes (0.0-1.0)
210 float qblur; ///< amount of qscale smoothing over time (0.0-1.0)
277f4827
MN
211 int max_qdiff; ///< max qscale difference between frames
212 int encoding; ///< true if we are encoding (vs decoding)
213 int flags; ///< AVCodecContext.flags (HQ, MV4, ...)
214 int max_b_frames; ///< max number of b-frames for encoding
8b4c7dbc 215 int b_frame_strategy;
7f2fe444
MN
216 int luma_elim_threshold;
217 int chroma_elim_threshold;
277f4827
MN
218 int strict_std_compliance; ///< strictly follow the std (MPEG4, ...)
219 int workaround_bugs; ///< workaround bugs in encoders which cannot be detected automatically
de6d9b64
FB
220 /* the following fields are managed internally by the encoder */
221
277f4827 222 /** bit output */
de6d9b64
FB
223 PutBitContext pb;
224
225 /* sequence parameters */
226 int context_initialized;
9dbcbd92 227 int input_picture_number;
de6d9b64 228 int picture_number;
277f4827
MN
229 int picture_in_gop_number; ///< 0-> first pic in gop, ...
230 int b_frames_since_non_b; ///< used for encoding, relative to not yet reordered input
231 int mb_width, mb_height; ///< number of MBs horizontally & vertically
232 int h_edge_pos, v_edge_pos;///< horizontal / vertical position of the right/bottom edge (pixel replicateion)
233 int mb_num; ///< number of MBs of a picture
234 int linesize; ///< line size, in bytes, may be different from width
235 int uvlinesize; ///< line size, for chroma in bytes, may be different from width
236 Picture picture[MAX_PICTURE_COUNT]; ///< main picture buffer
237 Picture *input_picture[MAX_PICTURE_COUNT]; ///< next pictures on display order for encoding
238 Picture *reordered_input_picture[MAX_PICTURE_COUNT]; ///< pointer to the next pictures in codedorder for encoding
b536d0aa
MN
239
240 /**
241 * copy of the previous picture structure.
242 * note, linesize & data, might not match the previous picture (for field pictures)
243 */
244 Picture last_picture;
245
246 /**
247 * copy of the next picture structure.
248 * note, linesize & data, might not match the next picture (for field pictures)
249 */
250 Picture next_picture;
251
252 /**
253 * copy of the source picture structure for encoding.
254 * note, linesize & data, might not match the source picture (for field pictures)
255 */
256 Picture new_picture;
257
258 /**
259 * copy of the current picture structure.
260 * note, linesize & data, might not match the current picture (for field pictures)
261 */
277f4827 262 Picture current_picture; ///< buffer to store the decompressed current picture
b536d0aa
MN
263
264 Picture *last_picture_ptr; ///< pointer to the previous picture.
265 Picture *next_picture_ptr; ///< pointer to the next picture (for bidir pred)
266 Picture *new_picture_ptr; ///< pointer to the source picture for encoding
267 Picture *current_picture_ptr; ///< pointer to the current picture
277f4827
MN
268 int last_dc[3]; ///< last DC values for MPEG1
269 int16_t *dc_val[3]; ///< used for mpeg4 DC prediction, all 3 arrays must be continuous
de6d9b64 270 int y_dc_scale, c_dc_scale;
277f4827
MN
271 uint8_t *y_dc_scale_table; ///< qscale -> y_dc_scale table
272 uint8_t *c_dc_scale_table; ///< qscale -> c_dc_scale table
273 uint8_t *coded_block; ///< used for coded block pattern prediction (msmpeg4v3, wmv1)
274 int16_t (*ac_val[3])[16]; ///< used for for mpeg4 AC prediction, all 3 arrays must be continuous
de6d9b64 275 int ac_pred;
277f4827 276 uint8_t *prev_pict_types; ///< previous picture types in bitstream order, used for mb skip
f943e138 277#define PREV_PICT_TYPES_BUFFER_SIZE 256
277f4827
MN
278 int mb_skiped; ///< MUST BE SET only during DECODING
279 uint8_t *mbskip_table; /**< used to avoid copy if macroblock skipped (for black regions for example)
9dbcbd92 280 and used for b-frame encoding & decoding (contains skip table of next P Frame) */
277f4827
MN
281 uint8_t *mbintra_table; ///< used to avoid setting {ac, dc, cbp}-pred stuff to zero on inter MB decoding
282 uint8_t *cbp_table; ///< used to store cbp, ac_pred for partitioned decoding
283 uint8_t *pred_dir_table; ///< used to store pred_dir for partitioned decoding
f7b47594 284 uint8_t *allocated_edge_emu_buffer;
277f4827 285 uint8_t *edge_emu_buffer; ///< points into the middle of allocated_edge_emu_buffer
de6d9b64 286
277f4827
MN
287 int qscale; ///< QP
288 float frame_qscale; ///< qscale from the frame level rc FIXME remove
289 int adaptive_quant; ///< use adaptive quantization
290 int dquant; ///< qscale difference to prev qscale
291 int pict_type; ///< I_TYPE, P_TYPE, B_TYPE, ...
3aa102be 292 int last_pict_type;
277f4827 293 int last_non_b_pict_type; ///< used for mpeg4 gmc b-frames & ratecontrol
de6d9b64
FB
294 int frame_rate_index;
295 /* motion compensation */
277f4827
MN
296 int unrestricted_mv; ///< mv can point outside of the coded picture
297 int h263_long_vectors; ///< use horrible h263v1 long vector mode
298
299 DSPContext dsp; ///< pointers for accelerated dsp fucntions
300 int f_code; ///< forward MV resolution
301 int b_code; ///< backward MV resolution for B Frames (mpeg4)
302 int16_t (*motion_val)[2]; ///< used for MV prediction (4MV per MB)
303 int16_t (*p_mv_table)[2]; ///< MV table (1MV per MB) p-frame encoding
304 int16_t (*b_forw_mv_table)[2]; ///< MV table (1MV per MB) forward mode b-frame encoding
305 int16_t (*b_back_mv_table)[2]; ///< MV table (1MV per MB) backward mode b-frame encoding
306 int16_t (*b_bidir_forw_mv_table)[2]; ///< MV table (1MV per MB) bidir mode b-frame encoding
307 int16_t (*b_bidir_back_mv_table)[2]; ///< MV table (1MV per MB) bidir mode b-frame encoding
308 int16_t (*b_direct_mv_table)[2]; ///< MV table (1MV per MB) direct mode b-frame encoding
309 int me_method; ///< ME algorithm
1fb4890b 310 int scene_change_score;
de6d9b64
FB
311 int mv_dir;
312#define MV_DIR_BACKWARD 1
313#define MV_DIR_FORWARD 2
277f4827 314#define MV_DIRECT 4 ///< bidirectional mode where the difference equals the MV of the last P/S/I-Frame (mpeg4)
de6d9b64 315 int mv_type;
277f4827
MN
316#define MV_TYPE_16X16 0 ///< 1 vector for the whole mb
317#define MV_TYPE_8X8 1 ///< 4 vectors (h263, mpeg4 4MV)
318#define MV_TYPE_16X8 2 ///< 2 vectors, one per 16x8 block
319#define MV_TYPE_FIELD 3 ///< 2 vectors, one per field
320#define MV_TYPE_DMV 4 ///< 2 vectors, special mpeg2 Dual Prime Vectors
321 /**motion vectors for a macroblock
de6d9b64
FB
322 first coordinate : 0 = forward 1 = backward
323 second " : depend on type
324 third " : 0 = x, 1 = y
325 */
326 int mv[2][4][2];
327 int field_select[2][2];
277f4827
MN
328 int last_mv[2][2][2]; ///< last MV, used for MV prediction in MPEG1 & B-frame MPEG4
329 uint8_t *fcode_tab; ///< smallest fcode needed for each MV
1457ab52
MN
330
331 MotionEstContext me;
de6d9b64 332
277f4827 333 int no_rounding; /**< apply no rounding to motion compensation (MPEG4, msmpeg4, ...)
91029be7 334 for b-frames rounding mode is allways 0 */
de6d9b64 335
277f4827 336 int hurry_up; /**< when set to 1 during decoding, b frames will be skiped
2417652e 337 when set to 2 idct/dequant will be skipped too */
c5d309f2 338
de6d9b64
FB
339 /* macroblock layer */
340 int mb_x, mb_y;
9b8709d1 341 int mb_skip_run;
de6d9b64 342 int mb_intra;
277f4827 343 uint8_t *mb_type; ///< Table for MB type
ba6802de
MN
344#define MB_TYPE_INTRA 0x01
345#define MB_TYPE_INTER 0x02
346#define MB_TYPE_INTER4V 0x04
347#define MB_TYPE_SKIPED 0x08
7f2fe444
MN
348#define MB_TYPE_GMC 0x10
349
ba6802de
MN
350#define MB_TYPE_DIRECT 0x10
351#define MB_TYPE_FORWARD 0x20
9dbcbd92 352#define MB_TYPE_BACKWARD 0x40
ba6802de 353#define MB_TYPE_BIDIR 0x80
4278e7a6 354
277f4827 355 int block_index[6]; ///< index to current MB in block based arrays with edges
4278e7a6
MN
356 int block_wrap[6];
357
277f4827 358 /** matrix transmitted in the bitstream */
0c1a9eda
ZK
359 uint16_t intra_matrix[64];
360 uint16_t chroma_intra_matrix[64];
361 uint16_t inter_matrix[64];
362 uint16_t chroma_inter_matrix[64];
1984f635 363#define QUANT_BIAS_SHIFT 8
277f4827
MN
364 int intra_quant_bias; ///< bias for the quantizer
365 int inter_quant_bias; ///< bias for the quantizer
366 int min_qcoeff; ///< minimum encodable coefficient
367 int max_qcoeff; ///< maximum encodable coefficient
368 int ac_esc_length; ///< num of bits needed to encode the longest esc
477ab036
MN
369 uint8_t *intra_ac_vlc_length;
370 uint8_t *intra_ac_vlc_last_length;
371 uint8_t *inter_ac_vlc_length;
372 uint8_t *inter_ac_vlc_last_length;
67725183
MN
373 uint8_t *luma_dc_vlc_length;
374 uint8_t *chroma_dc_vlc_length;
c442d75c 375#define UNI_AC_ENC_INDEX(run,level) ((run)*128 + (level))
477ab036 376
277f4827 377 /** precomputed matrix (combine qscale and DCT renorm) */
05c4072b
MN
378 int __align8 q_intra_matrix[32][64];
379 int __align8 q_inter_matrix[32][64];
277f4827 380 /** identical to the above but for MMX & these are not permutated */
0c1a9eda
ZK
381 uint16_t __align8 q_intra_matrix16[32][64];
382 uint16_t __align8 q_inter_matrix16[32][64];
383 uint16_t __align8 q_intra_matrix16_bias[32][64];
384 uint16_t __align8 q_inter_matrix16_bias[32][64];
277f4827 385 int block_last_index[6]; ///< last non zero coefficient in block
2ad1516a 386 /* scantables */
05c4072b 387 ScanTable __align8 intra_scantable;
2ad1516a
MN
388 ScanTable intra_h_scantable;
389 ScanTable intra_v_scantable;
277f4827 390 ScanTable inter_scantable; ///< if inter == intra then intra should be used to reduce tha cache usage
de6d9b64 391
277f4827 392 void *opaque; ///< private data for the user
de6d9b64
FB
393
394 /* bit rate control */
9dbcbd92 395 int I_frame_bits; //FIXME used in mpeg12 ...
0c1a9eda
ZK
396 int64_t wanted_bits;
397 int64_t total_bits;
277f4827
MN
398 int frame_bits; ///< bits used for the current frame
399 RateControlContext rc_context; ///< contains stuff only accessed in ratecontrol.c
9cdd6a24 400
098eefe1
MN
401 /* statistics, used for 2-pass encoding */
402 int mv_bits;
403 int header_bits;
404 int i_tex_bits;
405 int p_tex_bits;
406 int i_count;
66370d3f
MN
407 int f_count;
408 int b_count;
098eefe1 409 int skip_count;
277f4827
MN
410 int misc_bits; ///< cbp, mb_type
411 int last_bits; ///< temp var used for calculating the above vars
7f2fe444
MN
412
413 /* error concealment / resync */
277f4827
MN
414 uint8_t *error_status_table; ///< table of the error status of each MB
415#define VP_START 1 ///< current MB is the first after a resync marker
4d2858de
MN
416#define AC_ERROR 2
417#define DC_ERROR 4
418#define MV_ERROR 8
419#define AC_END 16
420#define DC_END 32
421#define MV_END 64
422//FIXME some prefix?
423
277f4827
MN
424 int resync_mb_x; ///< x position of last resync marker
425 int resync_mb_y; ///< y position of last resync marker
426 GetBitContext last_resync_gb; ///< used to search for the next resync marker
427 int mb_num_left; ///< number of MBs left in this video packet (for partitioned Slices only)
428 int next_p_frame_damaged; ///< set if the next p frame is damaged, to avoid showing trashed b frames
7f2fe444 429 int error_resilience;
d7425f59
MN
430
431 ParseContext parse_context;
098eefe1 432
102d3908
J
433 /* H.263 specific */
434 int gob_number;
644d98a4 435 int gob_index;
d140623f 436
544286b3 437 /* H.263+ specific */
277f4827
MN
438 int umvplus; ///< == H263+ && unrestricted_mv
439 int h263_aic; ///< Advanded INTRA Coding (AIC)
440 int h263_aic_dir; ///< AIC direction: 0 = left, 1 = top
544286b3 441
de6d9b64 442 /* mpeg4 specific */
6f91bcd1 443 int time_increment_resolution;
277f4827 444 int time_increment_bits; ///< number of bits to represent the fractional part of time
9dbcbd92 445 int last_time_base;
277f4827
MN
446 int time_base; ///< time in seconds of last I,P,S Frame
447 int64_t time; ///< time of current frame
0c1a9eda 448 int64_t last_non_b_time;
277f4827
MN
449 uint16_t pp_time; ///< time distance between the last 2 p,s,i frames
450 uint16_t pb_time; ///< time distance between the last b and p,s,i frame
0c1a9eda 451 uint16_t pp_field_time;
277f4827 452 uint16_t pb_field_time; ///< like above, just for interlaced
1a565432
FB
453 int shape;
454 int vol_sprite_usage;
cc9ba006
MN
455 int sprite_width;
456 int sprite_height;
457 int sprite_left;
458 int sprite_top;
459 int sprite_brightness_change;
73c8e514 460 int num_sprite_warping_points;
44eb4951 461 int real_sprite_warping_points;
277f4827
MN
462 int sprite_offset[2][2]; ///< sprite offset[isChroma][isMVY]
463 int sprite_delta[2][2]; ///< sprite_delta [isY][isMVY]
464 int sprite_shift[2]; ///< sprite shift [isChroma]
73c8e514 465 int mcsel;
1a565432 466 int quant_precision;
277f4827 467 int quarter_sample; ///< 1->qpel, 0->half pel ME/MC
cc9ba006 468 int scalability;
0fd90455
MN
469 int hierachy_type;
470 int enhancement_type;
cc9ba006
MN
471 int new_pred;
472 int reduced_res_vop;
473 int aspect_ratio_info;
e769f053
AB
474 int aspected_width;
475 int aspected_height;
cc9ba006
MN
476 int sprite_warping_accuracy;
477 int low_latency_sprite;
277f4827
MN
478 int data_partitioning; ///< data partitioning flag from header
479 int partitioned_frame; ///< is current frame partitioned
480 int rvlc; ///< reversible vlc
481 int resync_marker; ///< could this stream contain resync markers
482 int low_delay; ///< no reordering needed / has no b-frames
1ff662cc 483 int vo_type;
277f4827
MN
484 int vol_control_parameters; ///< does the stream contain the low_delay flag, used to workaround buggy encoders
485 PutBitContext tex_pb; ///< used for data partitioned VOPs
486 PutBitContext pb2; ///< used for data partitioned VOPs
7f2fe444
MN
487#define PB_BUFFER_SIZE 1024*256
488 uint8_t *tex_pb_buffer;
489 uint8_t *pb2_buffer;
d930ef19 490 int mpeg_quant;
bea669e5
MN
491#define CO_LOCATED_TYPE_4MV 1
492#define CO_LOCATED_TYPE_FIELDMV 2
277f4827
MN
493 int8_t *co_located_type_table; ///< 4mv & field_mv info for next b frame
494 int16_t (*field_mv_table)[2][2]; ///< used for interlaced b frame decoding
495 int8_t (*field_select_table)[2]; ///< wtf, no really another table for interlaced b frames
496 int t_frame; ///< time distance of first I -> B, used for interlaced b frames
497 int padding_bug_score; ///< used to detect the VERY common padding bug in MPEG4
44eb4951
MN
498
499 /* divx specific, used to workaround (many) bugs in divx5 */
500 int divx_version;
501 int divx_build;
d5a21172 502 int divx_packed;
eec1c6b9 503#define BITSTREAM_BUFFER_SIZE 1024*256
0c1a9eda 504 uint8_t *bitstream_buffer; //Divx 5.01 puts several frames in a single one, this is used to reorder them
eec1c6b9
MN
505 int bitstream_buffer_size;
506
7da71a5c
MN
507 int xvid_build;
508
4d2858de
MN
509 /* lavc specific stuff, used to workaround bugs in libavcodec */
510 int ffmpeg_version;
511 int lavc_build;
512
de6d9b64 513 /* RV10 specific */
277f4827 514 int rv10_version; ///< RV10 version: 0 or 3
de6d9b64
FB
515 int rv10_first_dc_coded[3];
516
517 /* MJPEG specific */
518 struct MJpegContext *mjpeg_ctx;
277f4827
MN
519 int mjpeg_vsample[3]; ///< vertical sampling factors, default = {2, 1, 1}
520 int mjpeg_hsample[3]; ///< horizontal sampling factors, default = {2, 1, 1}
521 int mjpeg_write_tables; ///< do we want to have quantisation- and huffmantables in the jpeg file ?
522 int mjpeg_data_only_frames; ///< frames only with SOI, SOS and EOI markers
de6d9b64
FB
523
524 /* MSMPEG4 specific */
525 int mv_table_index;
526 int rl_table_index;
527 int rl_chroma_table_index;
528 int dc_table_index;
529 int use_skip_mb_code;
277f4827
MN
530 int slice_height; ///< in macroblocks
531 int first_slice_line; ///< used in mpeg4 too to handle resync markers
ae40484c 532 int flipflop_rounding;
277f4827 533 int msmpeg4_version; ///< 0=not msmpeg4, 1=mp41, 2=mp42, 3=mp43/divx3 4=wmv1/7 5=wmv2/8
0151a6f5
MN
534 int per_mb_rl_table;
535 int esc3_level_length;
536 int esc3_run_length;
277f4827 537 /** [mb_intra][isChroma][level][run][last] */
6b460aa3 538 int (*ac_stats)[2][MAX_LEVEL+1][MAX_RUN+1][2];
de0f2f4c 539 int inter_intra_pred;
1457ab52 540 int mspel;
0151a6f5 541
de6d9b64
FB
542 /* decompression specific */
543 GetBitContext gb;
544
1e491e29 545 /* Mpeg1 specific */
277f4827
MN
546 int fake_picture_number; ///< picture number at the bitstream frame rate
547 int gop_picture_number; ///< index of the first picture of a GOP based on fake_pic_num & mpeg1 specific
548 int last_mv_dir; ///< last mv_dir, used for b frame encoding
1e491e29 549
de6d9b64
FB
550 /* MPEG2 specific - I wish I had not to support this mess. */
551 int progressive_sequence;
552 int mpeg_f_code[2][2];
553 int picture_structure;
554/* picture type */
555#define PICT_TOP_FIELD 1
556#define PICT_BOTTOM_FIELD 2
557#define PICT_FRAME 3
558
559 int intra_dc_precision;
560 int frame_pred_frame_dct;
561 int top_field_first;
562 int concealment_motion_vectors;
563 int q_scale_type;
564 int intra_vlc_format;
565 int alternate_scan;
566 int repeat_first_field;
567 int chroma_420_type;
568 int progressive_frame;
569 int mpeg2;
570 int full_pel[2];
571 int interlaced_dct;
de6d9b64 572 int first_slice;
dfb476cb 573 int first_field;
644d98a4
J
574
575 /* RTP specific */
81401c1f 576 /* These are explained on avcodec.h */
644d98a4
J
577 int rtp_mode;
578 int rtp_payload_size;
81401c1f 579 void (*rtp_callback)(void *data, int size, int packet_number);
0c1a9eda 580 uint8_t *ptr_lastgob;
644d98a4 581
277f4827 582 DCTELEM (*block)[64]; ///< points to one of the following blocks
91029be7 583 DCTELEM blocks[2][6][64] __align8; // for HQ mode we need to keep the best block
4d2858de
MN
584 int (*decode_mb)(struct MpegEncContext *s, DCTELEM block[6][64]); // used by some codecs to avoid a switch()
585#define SLICE_OK 0
586#define SLICE_ERROR -1
587#define SLICE_END -2 //end marker found
588#define SLICE_NOEND -3 //no end marker or error found but mb count exceeded
589
9dbf1ddd 590 void (*dct_unquantize_mpeg1)(struct MpegEncContext *s,
67309e49 591 DCTELEM *block/*align 16*/, int n, int qscale);
9dbf1ddd 592 void (*dct_unquantize_mpeg2)(struct MpegEncContext *s,
67309e49 593 DCTELEM *block/*align 16*/, int n, int qscale);
3bf43d42 594 void (*dct_unquantize_h263)(struct MpegEncContext *s,
67309e49 595 DCTELEM *block/*align 16*/, int n, int qscale);
3bf43d42 596 void (*dct_unquantize)(struct MpegEncContext *s, // unquantizer to use (mpeg4 can use both)
67309e49
MN
597 DCTELEM *block/*align 16*/, int n, int qscale);
598 int (*dct_quantize)(struct MpegEncContext *s, DCTELEM *block/*align 16*/, int n, int qscale, int *overflow);
3a87ac94 599 int (*fast_dct_quantize)(struct MpegEncContext *s, DCTELEM *block/*align 16*/, int n, int qscale, int *overflow);
de6d9b64
FB
600} MpegEncContext;
601
4d2858de 602
defdfc9a 603int DCT_common_init(MpegEncContext *s);
de6d9b64
FB
604int MPV_common_init(MpegEncContext *s);
605void MPV_common_end(MpegEncContext *s);
606void MPV_decode_mb(MpegEncContext *s, DCTELEM block[6][64]);
d6db1c9c 607int MPV_frame_start(MpegEncContext *s, AVCodecContext *avctx);
de6d9b64 608void MPV_frame_end(MpegEncContext *s);
1457ab52
MN
609int MPV_encode_init(AVCodecContext *avctx);
610int MPV_encode_end(AVCodecContext *avctx);
611int MPV_encode_picture(AVCodecContext *avctx, unsigned char *buf, int buf_size, void *data);
21af69f7
FB
612#ifdef HAVE_MMX
613void MPV_common_init_mmx(MpegEncContext *s);
614#endif
e0580f8c
FH
615#ifdef ARCH_ALPHA
616void MPV_common_init_axp(MpegEncContext *s);
617#endif
c7e07931
MO
618#ifdef HAVE_MLIB
619void MPV_common_init_mlib(MpegEncContext *s);
620#endif
5917d17c
LS
621#ifdef HAVE_MMI
622void MPV_common_init_mmi(MpegEncContext *s);
623#endif
83f238cb 624#ifdef ARCH_ARMV4L
d43b10ec 625void MPV_common_init_armv4l(MpegEncContext *s);
83f238cb 626#endif
05c4072b
MN
627#ifdef ARCH_POWERPC
628void MPV_common_init_ppc(MpegEncContext *s);
629#endif
0c1a9eda 630extern void (*draw_edges)(uint8_t *buf, int wrap, int width, int height, int w);
0c1a9eda 631void ff_copy_bits(PutBitContext *pb, uint8_t *src, int length);
7f2fe444 632void ff_clean_intra_table_entries(MpegEncContext *s);
0c1a9eda 633void ff_init_scantable(MpegEncContext *s, ScanTable *st, const uint8_t *src_scantable);
640950c7 634void ff_draw_horiz_band(MpegEncContext *s, int y, int h);
0c1a9eda 635void ff_emulated_edge_mc(MpegEncContext *s, uint8_t *src, int linesize, int block_w, int block_h,
1457ab52 636 int src_x, int src_y, int w, int h);
59b571c1 637char ff_get_pict_type_char(int pict_type);
b7a22d84 638int ff_combine_frame( MpegEncContext *s, int next, uint8_t **buf, int *buf_size);
59b571c1 639
46b4feec
MN
640void ff_er_frame_start(MpegEncContext *s);
641void ff_er_frame_end(MpegEncContext *s);
642void ff_er_add_slice(MpegEncContext *s, int startx, int starty, int endx, int endy, int status);
643
644
a33c7159 645extern enum PixelFormat ff_yuv420p_list[2];
de6d9b64 646
4d2858de
MN
647static inline void ff_init_block_index(MpegEncContext *s){
648 s->block_index[0]= s->block_wrap[0]*(s->mb_y*2 + 1) - 1 + s->mb_x*2;
649 s->block_index[1]= s->block_wrap[0]*(s->mb_y*2 + 1) + s->mb_x*2;
650 s->block_index[2]= s->block_wrap[0]*(s->mb_y*2 + 2) - 1 + s->mb_x*2;
651 s->block_index[3]= s->block_wrap[0]*(s->mb_y*2 + 2) + s->mb_x*2;
652 s->block_index[4]= s->block_wrap[4]*(s->mb_y + 1) + s->block_wrap[0]*(s->mb_height*2 + 2) + s->mb_x;
653 s->block_index[5]= s->block_wrap[4]*(s->mb_y + 1 + s->mb_height + 2) + s->block_wrap[0]*(s->mb_height*2 + 2) + s->mb_x;
654}
655
656static inline void ff_update_block_index(MpegEncContext *s){
657 s->block_index[0]+=2;
658 s->block_index[1]+=2;
659 s->block_index[2]+=2;
660 s->block_index[3]+=2;
661 s->block_index[4]++;
662 s->block_index[5]++;
663}
664
4d2a4834
MN
665static inline int get_bits_diff(MpegEncContext *s){
666 const int bits= get_bit_count(&s->pb);
667 const int last= s->last_bits;
668
669 s->last_bits = bits;
670
671 return bits - last;
672}
4d2858de 673
de6d9b64 674/* motion_est.c */
9dbcbd92
MN
675void ff_estimate_p_frame_motion(MpegEncContext * s,
676 int mb_x, int mb_y);
677void ff_estimate_b_frame_motion(MpegEncContext * s,
678 int mb_x, int mb_y);
679int ff_get_best_fcode(MpegEncContext * s, int16_t (*mv_table)[2], int type);
680void ff_fix_long_p_mvs(MpegEncContext * s);
681void ff_fix_long_b_mvs(MpegEncContext * s, int16_t (*mv_table)[2], int f_code, int type);
1457ab52 682void ff_init_me(MpegEncContext *s);
f5fb6b34 683int ff_pre_estimate_p_frame_motion(MpegEncContext * s, int mb_x, int mb_y);
de6d9b64 684
4d2858de 685
de6d9b64 686/* mpeg12.c */
0c1a9eda
ZK
687extern const int16_t ff_mpeg1_default_intra_matrix[64];
688extern const int16_t ff_mpeg1_default_non_intra_matrix[64];
689extern uint8_t ff_mpeg1_dc_scale_table[128];
de6d9b64
FB
690
691void mpeg1_encode_picture_header(MpegEncContext *s, int picture_number);
692void mpeg1_encode_mb(MpegEncContext *s,
693 DCTELEM block[6][64],
694 int motion_x, int motion_y);
0151a6f5 695void ff_mpeg1_encode_init(MpegEncContext *s);
9b8709d1
MN
696void ff_mpeg1_encode_slice_header(MpegEncContext *s);
697void ff_mpeg1_clean_buffers(MpegEncContext *s);
de6d9b64 698
4d2858de 699
277f4827 700/** RLTable. */
de6d9b64 701typedef struct RLTable {
277f4827
MN
702 int n; ///< number of entries of table_vlc minus 1
703 int last; ///< number of values for last = 0
0c1a9eda
ZK
704 const uint16_t (*table_vlc)[2];
705 const int8_t *table_run;
706 const int8_t *table_level;
277f4827
MN
707 uint8_t *index_run[2]; ///< encoding only
708 int8_t *max_level[2]; ///< encoding & decoding
709 int8_t *max_run[2]; ///< encoding & decoding
710 VLC vlc; ///< decoding only deprected FIXME remove
711 RL_VLC_ELEM *rl_vlc[32]; ///< decoding only
de6d9b64
FB
712} RLTable;
713
714void init_rl(RLTable *rl);
715void init_vlc_rl(RLTable *rl);
716
3232bc88 717static inline int get_rl_index(const RLTable *rl, int last, int run, int level)
de6d9b64
FB
718{
719 int index;
720 index = rl->index_run[last][run];
721 if (index >= rl->n)
722 return rl->n;
723 if (level > rl->max_level[last][run])
724 return rl->n;
725 return index + level - 1;
726}
727
0c1a9eda
ZK
728extern uint8_t ff_mpeg4_y_dc_scale_table[32];
729extern uint8_t ff_mpeg4_c_dc_scale_table[32];
730extern const int16_t ff_mpeg4_default_intra_matrix[64];
731extern const int16_t ff_mpeg4_default_non_intra_matrix[64];
1457ab52
MN
732int ff_h263_decode_init(AVCodecContext *avctx);
733int ff_h263_decode_frame(AVCodecContext *avctx,
734 void *data, int *data_size,
0c1a9eda 735 uint8_t *buf, int buf_size);
1457ab52 736int ff_h263_decode_end(AVCodecContext *avctx);
de6d9b64
FB
737void h263_encode_mb(MpegEncContext *s,
738 DCTELEM block[6][64],
739 int motion_x, int motion_y);
d6231b9e
MN
740void mpeg4_encode_mb(MpegEncContext *s,
741 DCTELEM block[6][64],
742 int motion_x, int motion_y);
de6d9b64 743void h263_encode_picture_header(MpegEncContext *s, int picture_number);
644d98a4 744int h263_encode_gob_header(MpegEncContext * s, int mb_line);
0c1a9eda 745int16_t *h263_pred_motion(MpegEncContext * s, int block,
de6d9b64 746 int *px, int *py);
0e15384d 747void mpeg4_pred_ac(MpegEncContext * s, DCTELEM *block, int n,
de6d9b64 748 int dir);
91029be7 749void ff_set_mpeg4_time(MpegEncContext * s, int picture_number);
de6d9b64 750void mpeg4_encode_picture_header(MpegEncContext *s, int picture_number);
45870f57 751void h263_encode_init(MpegEncContext *s);
de6d9b64
FB
752void h263_decode_init_vlc(MpegEncContext *s);
753int h263_decode_picture_header(MpegEncContext *s);
4d2858de 754int ff_h263_decode_gob_header(MpegEncContext *s);
b704e742
MN
755int ff_mpeg4_decode_picture_header(MpegEncContext * s, GetBitContext *gb);
756
757
de6d9b64 758int intel_h263_decode_picture_header(MpegEncContext *s);
4d2858de
MN
759int ff_h263_decode_mb(MpegEncContext *s,
760 DCTELEM block[6][64]);
de6d9b64 761int h263_get_picture_format(int width, int height);
7f2fe444
MN
762void ff_mpeg4_encode_video_packet_header(MpegEncContext *s);
763void ff_mpeg4_clean_buffers(MpegEncContext *s);
764void ff_mpeg4_stuffing(PutBitContext * pbc);
765void ff_mpeg4_init_partitions(MpegEncContext *s);
766void ff_mpeg4_merge_partitions(MpegEncContext *s);
c5d309f2 767void ff_clean_mpeg4_qscales(MpegEncContext *s);
9e4c6948 768void ff_clean_h263_qscales(MpegEncContext *s);
4d2858de
MN
769int ff_mpeg4_decode_partitions(MpegEncContext *s);
770int ff_mpeg4_get_video_packet_prefix_length(MpegEncContext *s);
771int ff_h263_resync(MpegEncContext *s);
772int ff_h263_get_gob_height(MpegEncContext *s);
1457ab52 773void ff_mpeg4_set_direct_mv(MpegEncContext *s, int mx, int my);
/*
 * Declared without 'inline': an inline declaration of a function with
 * external linkage requires a definition in the same translation unit
 * (C99 6.7.4), which a header-only prototype cannot provide to its includers.
 * The definition may still be marked inline where it is implemented.
 */
int ff_h263_round_chroma(int x);


777/* rv10.c */
778void rv10_encode_picture_header(MpegEncContext *s, int picture_number);
779int rv_decode_dc(MpegEncContext *s, int n);
780
4d2858de 781
de6d9b64
FB
782/* msmpeg4.c */
783void msmpeg4_encode_picture_header(MpegEncContext * s, int picture_number);
ae40484c 784void msmpeg4_encode_ext_header(MpegEncContext * s);
de6d9b64
FB
785void msmpeg4_encode_mb(MpegEncContext * s,
786 DCTELEM block[6][64],
787 int motion_x, int motion_y);
de6d9b64 788int msmpeg4_decode_picture_header(MpegEncContext * s);
ae40484c 789int msmpeg4_decode_ext_header(MpegEncContext * s, int buf_size);
0151a6f5
MN
790int ff_msmpeg4_decode_init(MpegEncContext *s);
791void ff_msmpeg4_encode_init(MpegEncContext *s);
1457ab52
MN
792int ff_wmv2_decode_picture_header(MpegEncContext * s);
793void ff_wmv2_add_mb(MpegEncContext *s, DCTELEM block[6][64], uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr);
794void ff_mspel_motion(MpegEncContext *s,
0c1a9eda
ZK
795 uint8_t *dest_y, uint8_t *dest_cb, uint8_t *dest_cr,
796 uint8_t **ref_picture, op_pixels_func (*pix_op)[4],
1457ab52
MN
797 int motion_x, int motion_y, int h);
798int ff_wmv2_encode_picture_header(MpegEncContext * s, int picture_number);
799void ff_wmv2_encode_mb(MpegEncContext * s,
800 DCTELEM block[6][64],
801 int motion_x, int motion_y);
de6d9b64 802
4d2858de 803/* mjpegenc.c */
de6d9b64
FB
804int mjpeg_init(MpegEncContext *s);
805void mjpeg_close(MpegEncContext *s);
806void mjpeg_encode_mb(MpegEncContext *s,
807 DCTELEM block[6][64]);
808void mjpeg_picture_header(MpegEncContext *s);
809void mjpeg_picture_trailer(MpegEncContext *s);
8b4c7dbc 810
4d2858de 811
8b4c7dbc
MN
812/* rate control */
813int ff_rate_control_init(MpegEncContext *s);
c5d309f2 814float ff_rate_estimate_qscale(MpegEncContext *s);
8b4c7dbc
MN
815void ff_write_pass1_stats(MpegEncContext *s);
816void ff_rate_control_uninit(MpegEncContext *s);
5c91a675
ZK
817double ff_eval(char *s, double *const_value, const char **const_name,
818 double (**func1)(void *, double), const char **func1_name,
3aa102be
MN
819 double (**func2)(void *, double, double), char **func2_name,
820 void *opaque);
821
8b4c7dbc 822
cd4af68a 823#endif /* AVCODEC_MPEGVIDEO_H */