libx264: Add support for the MPEG2 encoder
[libav.git] / libavcodec / libx264.c
1 /*
2 * H.264 encoding using the x264 library
3 * Copyright (C) 2005 Mans Rullgard <mans@mansr.com>
4 *
5 * This file is part of Libav.
6 *
7 * Libav is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
11 *
12 * Libav is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
16 *
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with Libav; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20 */
21
22 #include "libavutil/internal.h"
23 #include "libavutil/opt.h"
24 #include "libavutil/mem.h"
25 #include "libavutil/pixdesc.h"
26 #include "libavutil/stereo3d.h"
27 #include "avcodec.h"
28 #include "internal.h"
29
30 #if defined(_MSC_VER)
31 #define X264_API_IMPORTS 1
32 #endif
33
34 #include <x264.h>
35 #include <float.h>
36 #include <math.h>
37 #include <stdio.h>
38 #include <stdlib.h>
39 #include <string.h>
40
41 typedef struct X264Context {
42 AVClass *class;
43 x264_param_t params;
44 x264_t *enc;
45 x264_picture_t pic;
46 uint8_t *sei;
47 int sei_size;
48 char *preset;
49 char *tune;
50 char *profile;
51 int fastfirstpass;
52 float crf;
53 float crf_max;
54 int cqp;
55 int aq_mode;
56 float aq_strength;
57 char *psy_rd;
58 int psy;
59 int rc_lookahead;
60 int weightp;
61 int weightb;
62 int ssim;
63 int intra_refresh;
64 int bluray_compat;
65 int b_bias;
66 int b_pyramid;
67 int mixed_refs;
68 int dct8x8;
69 int fast_pskip;
70 int aud;
71 int mbtree;
72 char *deblock;
73 float cplxblur;
74 char *partitions;
75 int direct_pred;
76 int slice_max_size;
77 char *stats;
78 int nal_hrd;
79 char *x264_params;
80 } X264Context;
81
82 static void X264_log(void *p, int level, const char *fmt, va_list args)
83 {
84 static const int level_map[] = {
85 [X264_LOG_ERROR] = AV_LOG_ERROR,
86 [X264_LOG_WARNING] = AV_LOG_WARNING,
87 [X264_LOG_INFO] = AV_LOG_INFO,
88 [X264_LOG_DEBUG] = AV_LOG_DEBUG
89 };
90
91 if (level < 0 || level > X264_LOG_DEBUG)
92 return;
93
94 av_vlog(p, level_map[level], fmt, args);
95 }
96
97
98 static int encode_nals(AVCodecContext *ctx, AVPacket *pkt,
99 x264_nal_t *nals, int nnal)
100 {
101 X264Context *x4 = ctx->priv_data;
102 uint8_t *p;
103 int i, size = x4->sei_size, ret;
104
105 if (!nnal)
106 return 0;
107
108 for (i = 0; i < nnal; i++)
109 size += nals[i].i_payload;
110
111 if ((ret = ff_alloc_packet(pkt, size)) < 0)
112 return ret;
113
114 p = pkt->data;
115
116 /* Write the SEI as part of the first frame. */
117 if (x4->sei_size > 0 && nnal > 0) {
118 memcpy(p, x4->sei, x4->sei_size);
119 p += x4->sei_size;
120 x4->sei_size = 0;
121 }
122
123 for (i = 0; i < nnal; i++){
124 memcpy(p, nals[i].p_payload, nals[i].i_payload);
125 p += nals[i].i_payload;
126 }
127
128 return 1;
129 }
130
131 static void reconfig_encoder(AVCodecContext *ctx, const AVFrame *frame)
132 {
133 X264Context *x4 = ctx->priv_data;
134 AVFrameSideData *side_data;
135
136
137 if (x4->params.b_tff != frame->top_field_first) {
138 x4->params.b_tff = frame->top_field_first;
139 x264_encoder_reconfig(x4->enc, &x4->params);
140 }
141 if (x4->params.vui.i_sar_height != ctx->sample_aspect_ratio.den ||
142 x4->params.vui.i_sar_width != ctx->sample_aspect_ratio.num) {
143 x4->params.vui.i_sar_height = ctx->sample_aspect_ratio.den;
144 x4->params.vui.i_sar_width = ctx->sample_aspect_ratio.num;
145 x264_encoder_reconfig(x4->enc, &x4->params);
146 }
147
148 if (x4->params.rc.i_vbv_buffer_size != ctx->rc_buffer_size / 1000 ||
149 x4->params.rc.i_vbv_max_bitrate != ctx->rc_max_rate / 1000) {
150 x4->params.rc.i_vbv_buffer_size = ctx->rc_buffer_size / 1000;
151 x4->params.rc.i_vbv_max_bitrate = ctx->rc_max_rate / 1000;
152 x264_encoder_reconfig(x4->enc, &x4->params);
153 }
154
155 if (x4->params.rc.i_rc_method == X264_RC_ABR &&
156 x4->params.rc.i_bitrate != ctx->bit_rate / 1000) {
157 x4->params.rc.i_bitrate = ctx->bit_rate / 1000;
158 x264_encoder_reconfig(x4->enc, &x4->params);
159 }
160
161 if (x4->crf >= 0 &&
162 x4->params.rc.i_rc_method == X264_RC_CRF &&
163 x4->params.rc.f_rf_constant != x4->crf) {
164 x4->params.rc.f_rf_constant = x4->crf;
165 x264_encoder_reconfig(x4->enc, &x4->params);
166 }
167
168 if (x4->params.rc.i_rc_method == X264_RC_CQP &&
169 x4->params.rc.i_qp_constant != x4->cqp) {
170 x4->params.rc.i_qp_constant = x4->cqp;
171 x264_encoder_reconfig(x4->enc, &x4->params);
172 }
173
174 if (x4->crf_max >= 0 &&
175 x4->params.rc.f_rf_constant_max != x4->crf_max) {
176 x4->params.rc.f_rf_constant_max = x4->crf_max;
177 x264_encoder_reconfig(x4->enc, &x4->params);
178 }
179
180 side_data = av_frame_get_side_data(frame, AV_FRAME_DATA_STEREO3D);
181 if (side_data) {
182 AVStereo3D *stereo = (AVStereo3D *)side_data->data;
183 int fpa_type;
184
185 switch (stereo->type) {
186 case AV_STEREO3D_CHECKERBOARD:
187 fpa_type = 0;
188 break;
189 case AV_STEREO3D_COLUMNS:
190 fpa_type = 1;
191 break;
192 case AV_STEREO3D_LINES:
193 fpa_type = 2;
194 break;
195 case AV_STEREO3D_SIDEBYSIDE:
196 fpa_type = 3;
197 break;
198 case AV_STEREO3D_TOPBOTTOM:
199 fpa_type = 4;
200 break;
201 case AV_STEREO3D_FRAMESEQUENCE:
202 fpa_type = 5;
203 break;
204 default:
205 fpa_type = -1;
206 break;
207 }
208
209 if (fpa_type != x4->params.i_frame_packing) {
210 x4->params.i_frame_packing = fpa_type;
211 x264_encoder_reconfig(x4->enc, &x4->params);
212 }
213 }
214 }
215
216 static int X264_frame(AVCodecContext *ctx, AVPacket *pkt, const AVFrame *frame,
217 int *got_packet)
218 {
219 X264Context *x4 = ctx->priv_data;
220 x264_nal_t *nal;
221 int nnal, i, ret;
222 x264_picture_t pic_out;
223
224 x264_picture_init( &x4->pic );
225 x4->pic.img.i_csp = x4->params.i_csp;
226 if (x264_bit_depth > 8)
227 x4->pic.img.i_csp |= X264_CSP_HIGH_DEPTH;
228 x4->pic.img.i_plane = 3;
229
230 if (frame) {
231 for (i = 0; i < 3; i++) {
232 x4->pic.img.plane[i] = frame->data[i];
233 x4->pic.img.i_stride[i] = frame->linesize[i];
234 }
235
236 x4->pic.i_pts = frame->pts;
237 x4->pic.i_type =
238 frame->pict_type == AV_PICTURE_TYPE_I ? X264_TYPE_KEYFRAME :
239 frame->pict_type == AV_PICTURE_TYPE_P ? X264_TYPE_P :
240 frame->pict_type == AV_PICTURE_TYPE_B ? X264_TYPE_B :
241 X264_TYPE_AUTO;
242 reconfig_encoder(ctx, frame);
243 }
244 do {
245 if (x264_encoder_encode(x4->enc, &nal, &nnal, frame? &x4->pic: NULL, &pic_out) < 0)
246 return AVERROR_UNKNOWN;
247
248 ret = encode_nals(ctx, pkt, nal, nnal);
249 if (ret < 0)
250 return ret;
251 } while (!ret && !frame && x264_encoder_delayed_frames(x4->enc));
252
253 pkt->pts = pic_out.i_pts;
254 pkt->dts = pic_out.i_dts;
255
256 switch (pic_out.i_type) {
257 case X264_TYPE_IDR:
258 case X264_TYPE_I:
259 ctx->coded_frame->pict_type = AV_PICTURE_TYPE_I;
260 break;
261 case X264_TYPE_P:
262 ctx->coded_frame->pict_type = AV_PICTURE_TYPE_P;
263 break;
264 case X264_TYPE_B:
265 case X264_TYPE_BREF:
266 ctx->coded_frame->pict_type = AV_PICTURE_TYPE_B;
267 break;
268 }
269
270 pkt->flags |= AV_PKT_FLAG_KEY*pic_out.b_keyframe;
271 if (ret)
272 ctx->coded_frame->quality = (pic_out.i_qpplus1 - 1) * FF_QP2LAMBDA;
273
274 *got_packet = ret;
275 return 0;
276 }
277
278 static av_cold int X264_close(AVCodecContext *avctx)
279 {
280 X264Context *x4 = avctx->priv_data;
281
282 av_freep(&avctx->extradata);
283 av_freep(&x4->sei);
284
285 if (x4->enc) {
286 x264_encoder_close(x4->enc);
287 x4->enc = NULL;
288 }
289
290 av_frame_free(&avctx->coded_frame);
291
292 return 0;
293 }
294
295 static int convert_pix_fmt(enum AVPixelFormat pix_fmt)
296 {
297 switch (pix_fmt) {
298 case AV_PIX_FMT_YUV420P:
299 case AV_PIX_FMT_YUVJ420P:
300 case AV_PIX_FMT_YUV420P9:
301 case AV_PIX_FMT_YUV420P10: return X264_CSP_I420;
302 case AV_PIX_FMT_YUV422P:
303 case AV_PIX_FMT_YUVJ422P:
304 case AV_PIX_FMT_YUV422P10: return X264_CSP_I422;
305 case AV_PIX_FMT_YUV444P:
306 case AV_PIX_FMT_YUVJ444P:
307 case AV_PIX_FMT_YUV444P9:
308 case AV_PIX_FMT_YUV444P10: return X264_CSP_I444;
309 case AV_PIX_FMT_NV12: return X264_CSP_NV12;
310 case AV_PIX_FMT_NV16:
311 case AV_PIX_FMT_NV20: return X264_CSP_NV16;
312 };
313 return 0;
314 }
315
/*
 * Hand the string option x4->var (if set) to x264_param_parse() under the
 * x264 option name `name`. On a parse error, log it and return
 * AVERROR(EINVAL) from the enclosing function.
 *
 * Expects `x4` and `avctx` to be in scope at the point of use. Wrapped in
 * do { } while (0) so the expansion is a single statement and cannot
 * capture a following `else`.
 */
#define PARSE_X264_OPT(name, var)\
    do {\
        if (x4->var && x264_param_parse(&x4->params, name, x4->var) < 0) {\
            av_log(avctx, AV_LOG_ERROR, "Error parsing option '%s' with value '%s'.\n", name, x4->var);\
            return AVERROR(EINVAL);\
        }\
    } while (0)
321
322 static av_cold int X264_init(AVCodecContext *avctx)
323 {
324 X264Context *x4 = avctx->priv_data;
325
326 #if CONFIG_LIBX262_ENCODER
327 if (avctx->codec_id == AV_CODEC_ID_MPEG2VIDEO) {
328 x4->params.b_mpeg2 = 1;
329 x264_param_default_mpeg2(&x4->params);
330 } else
331 #else
332 x264_param_default(&x4->params);
333 #endif
334
335 x4->params.b_deblocking_filter = avctx->flags & CODEC_FLAG_LOOP_FILTER;
336
337 if (x4->preset || x4->tune)
338 if (x264_param_default_preset(&x4->params, x4->preset, x4->tune) < 0) {
339 av_log(avctx, AV_LOG_ERROR, "Error setting preset/tune %s/%s.\n", x4->preset, x4->tune);
340 return AVERROR(EINVAL);
341 }
342
343 if (avctx->level > 0)
344 x4->params.i_level_idc = avctx->level;
345
346 x4->params.pf_log = X264_log;
347 x4->params.p_log_private = avctx;
348 x4->params.i_log_level = X264_LOG_DEBUG;
349 x4->params.i_csp = convert_pix_fmt(avctx->pix_fmt);
350
351 if (avctx->bit_rate) {
352 x4->params.rc.i_bitrate = avctx->bit_rate / 1000;
353 x4->params.rc.i_rc_method = X264_RC_ABR;
354 }
355 x4->params.rc.i_vbv_buffer_size = avctx->rc_buffer_size / 1000;
356 x4->params.rc.i_vbv_max_bitrate = avctx->rc_max_rate / 1000;
357 x4->params.rc.b_stat_write = avctx->flags & CODEC_FLAG_PASS1;
358 if (avctx->flags & CODEC_FLAG_PASS2) {
359 x4->params.rc.b_stat_read = 1;
360 } else {
361 if (x4->crf >= 0) {
362 x4->params.rc.i_rc_method = X264_RC_CRF;
363 x4->params.rc.f_rf_constant = x4->crf;
364 } else if (x4->cqp >= 0) {
365 x4->params.rc.i_rc_method = X264_RC_CQP;
366 x4->params.rc.i_qp_constant = x4->cqp;
367 }
368
369 if (x4->crf_max >= 0)
370 x4->params.rc.f_rf_constant_max = x4->crf_max;
371 }
372
373 if (avctx->rc_buffer_size && avctx->rc_initial_buffer_occupancy > 0 &&
374 (avctx->rc_initial_buffer_occupancy <= avctx->rc_buffer_size)) {
375 x4->params.rc.f_vbv_buffer_init =
376 (float)avctx->rc_initial_buffer_occupancy / avctx->rc_buffer_size;
377 }
378
379 if (avctx->i_quant_factor > 0)
380 x4->params.rc.f_ip_factor = 1 / fabs(avctx->i_quant_factor);
381 x4->params.rc.f_pb_factor = avctx->b_quant_factor;
382 x4->params.analyse.i_chroma_qp_offset = avctx->chromaoffset;
383
384 if (avctx->me_method == ME_EPZS)
385 x4->params.analyse.i_me_method = X264_ME_DIA;
386 else if (avctx->me_method == ME_HEX)
387 x4->params.analyse.i_me_method = X264_ME_HEX;
388 else if (avctx->me_method == ME_UMH)
389 x4->params.analyse.i_me_method = X264_ME_UMH;
390 else if (avctx->me_method == ME_FULL)
391 x4->params.analyse.i_me_method = X264_ME_ESA;
392 else if (avctx->me_method == ME_TESA)
393 x4->params.analyse.i_me_method = X264_ME_TESA;
394
395 if (avctx->gop_size >= 0)
396 x4->params.i_keyint_max = avctx->gop_size;
397 if (avctx->max_b_frames >= 0)
398 x4->params.i_bframe = avctx->max_b_frames;
399 if (avctx->scenechange_threshold >= 0)
400 x4->params.i_scenecut_threshold = avctx->scenechange_threshold;
401 if (avctx->qmin >= 0)
402 x4->params.rc.i_qp_min = avctx->qmin;
403 if (avctx->qmax >= 0)
404 x4->params.rc.i_qp_max = avctx->qmax;
405 if (avctx->max_qdiff >= 0)
406 x4->params.rc.i_qp_step = avctx->max_qdiff;
407 if (avctx->qblur >= 0)
408 x4->params.rc.f_qblur = avctx->qblur; /* temporally blur quants */
409 if (avctx->qcompress >= 0)
410 x4->params.rc.f_qcompress = avctx->qcompress; /* 0.0 => cbr, 1.0 => constant qp */
411 if (avctx->refs >= 0)
412 x4->params.i_frame_reference = avctx->refs;
413 if (avctx->trellis >= 0)
414 x4->params.analyse.i_trellis = avctx->trellis;
415 if (avctx->me_range >= 0)
416 x4->params.analyse.i_me_range = avctx->me_range;
417 if (avctx->noise_reduction >= 0)
418 x4->params.analyse.i_noise_reduction = avctx->noise_reduction;
419 if (avctx->me_subpel_quality >= 0)
420 x4->params.analyse.i_subpel_refine = avctx->me_subpel_quality;
421 if (avctx->b_frame_strategy >= 0)
422 x4->params.i_bframe_adaptive = avctx->b_frame_strategy;
423 if (avctx->keyint_min >= 0)
424 x4->params.i_keyint_min = avctx->keyint_min;
425 if (avctx->coder_type >= 0)
426 x4->params.b_cabac = avctx->coder_type == FF_CODER_TYPE_AC;
427 if (avctx->me_cmp >= 0)
428 x4->params.analyse.b_chroma_me = avctx->me_cmp & FF_CMP_CHROMA;
429
430 if (x4->aq_mode >= 0)
431 x4->params.rc.i_aq_mode = x4->aq_mode;
432 if (x4->aq_strength >= 0)
433 x4->params.rc.f_aq_strength = x4->aq_strength;
434 PARSE_X264_OPT("psy-rd", psy_rd);
435 PARSE_X264_OPT("deblock", deblock);
436 PARSE_X264_OPT("partitions", partitions);
437 PARSE_X264_OPT("stats", stats);
438 if (x4->psy >= 0)
439 x4->params.analyse.b_psy = x4->psy;
440 if (x4->rc_lookahead >= 0)
441 x4->params.rc.i_lookahead = x4->rc_lookahead;
442 if (x4->weightp >= 0)
443 x4->params.analyse.i_weighted_pred = x4->weightp;
444 if (x4->weightb >= 0)
445 x4->params.analyse.b_weighted_bipred = x4->weightb;
446 if (x4->cplxblur >= 0)
447 x4->params.rc.f_complexity_blur = x4->cplxblur;
448
449 if (x4->ssim >= 0)
450 x4->params.analyse.b_ssim = x4->ssim;
451 if (x4->intra_refresh >= 0)
452 x4->params.b_intra_refresh = x4->intra_refresh;
453 if (x4->bluray_compat >= 0) {
454 x4->params.b_bluray_compat = x4->bluray_compat;
455 x4->params.b_vfr_input = 0;
456 }
457 if (x4->b_bias != INT_MIN)
458 x4->params.i_bframe_bias = x4->b_bias;
459 if (x4->b_pyramid >= 0)
460 x4->params.i_bframe_pyramid = x4->b_pyramid;
461 if (x4->mixed_refs >= 0)
462 x4->params.analyse.b_mixed_references = x4->mixed_refs;
463 if (x4->dct8x8 >= 0)
464 x4->params.analyse.b_transform_8x8 = x4->dct8x8;
465 if (x4->fast_pskip >= 0)
466 x4->params.analyse.b_fast_pskip = x4->fast_pskip;
467 if (x4->aud >= 0)
468 x4->params.b_aud = x4->aud;
469 if (x4->mbtree >= 0)
470 x4->params.rc.b_mb_tree = x4->mbtree;
471 if (x4->direct_pred >= 0)
472 x4->params.analyse.i_direct_mv_pred = x4->direct_pred;
473
474 if (x4->slice_max_size >= 0)
475 x4->params.i_slice_max_size = x4->slice_max_size;
476
477 if (x4->fastfirstpass)
478 x264_param_apply_fastfirstpass(&x4->params);
479
480 if (x4->nal_hrd >= 0)
481 x4->params.i_nal_hrd = x4->nal_hrd;
482
483 if (x4->profile)
484 if (x264_param_apply_profile(&x4->params, x4->profile) < 0) {
485 av_log(avctx, AV_LOG_ERROR, "Error setting profile %s.\n", x4->profile);
486 return AVERROR(EINVAL);
487 }
488
489 x4->params.i_width = avctx->width;
490 x4->params.i_height = avctx->height;
491 x4->params.vui.i_sar_width = avctx->sample_aspect_ratio.num;
492 x4->params.vui.i_sar_height = avctx->sample_aspect_ratio.den;
493 x4->params.i_fps_num = x4->params.i_timebase_den = avctx->time_base.den;
494 x4->params.i_fps_den = x4->params.i_timebase_num = avctx->time_base.num;
495
496 x4->params.analyse.b_psnr = avctx->flags & CODEC_FLAG_PSNR;
497
498 x4->params.i_threads = avctx->thread_count;
499 if (avctx->thread_type)
500 x4->params.b_sliced_threads = avctx->thread_type == FF_THREAD_SLICE;
501
502 x4->params.b_interlaced = avctx->flags & CODEC_FLAG_INTERLACED_DCT;
503
504 x4->params.b_open_gop = !(avctx->flags & CODEC_FLAG_CLOSED_GOP);
505
506 x4->params.i_slice_count = avctx->slices;
507
508 x4->params.vui.b_fullrange = avctx->pix_fmt == AV_PIX_FMT_YUVJ420P ||
509 avctx->pix_fmt == AV_PIX_FMT_YUVJ422P ||
510 avctx->pix_fmt == AV_PIX_FMT_YUVJ444P ||
511 avctx->color_range == AVCOL_RANGE_JPEG;
512
513 // x264 validates the values internally
514 x4->params.vui.i_colorprim = avctx->color_primaries;
515 x4->params.vui.i_transfer = avctx->color_trc;
516 x4->params.vui.i_colmatrix = avctx->colorspace;
517
518 if (avctx->flags & CODEC_FLAG_GLOBAL_HEADER)
519 x4->params.b_repeat_headers = 0;
520
521 if (x4->x264_params) {
522 AVDictionary *dict = NULL;
523 AVDictionaryEntry *en = NULL;
524
525 if (!av_dict_parse_string(&dict, x4->x264_params, "=", ":", 0)) {
526 while ((en = av_dict_get(dict, "", en, AV_DICT_IGNORE_SUFFIX))) {
527 if (x264_param_parse(&x4->params, en->key, en->value) < 0)
528 av_log(avctx, AV_LOG_WARNING,
529 "Error parsing option '%s = %s'.\n",
530 en->key, en->value);
531 }
532
533 av_dict_free(&dict);
534 }
535 }
536
537 // update AVCodecContext with x264 parameters
538 avctx->has_b_frames = x4->params.i_bframe ?
539 x4->params.i_bframe_pyramid ? 2 : 1 : 0;
540 if (avctx->max_b_frames < 0)
541 avctx->max_b_frames = 0;
542
543 avctx->bit_rate = x4->params.rc.i_bitrate*1000;
544
545 x4->enc = x264_encoder_open(&x4->params);
546 if (!x4->enc)
547 return AVERROR_UNKNOWN;
548
549 avctx->coded_frame = av_frame_alloc();
550 if (!avctx->coded_frame)
551 return AVERROR(ENOMEM);
552
553 if (avctx->flags & CODEC_FLAG_GLOBAL_HEADER) {
554 x264_nal_t *nal;
555 uint8_t *p;
556 int nnal, s, i;
557
558 s = x264_encoder_headers(x4->enc, &nal, &nnal);
559 avctx->extradata = p = av_malloc(s);
560 if (!p)
561 return AVERROR(ENOMEM);
562
563 for (i = 0; i < nnal; i++) {
564 /* Don't put the SEI in extradata. */
565 if (nal[i].i_type == NAL_SEI) {
566 av_log(avctx, AV_LOG_INFO, "%s\n", nal[i].p_payload+25);
567 x4->sei_size = nal[i].i_payload;
568 x4->sei = av_malloc(x4->sei_size);
569 if (!x4->sei)
570 return AVERROR(ENOMEM);
571 memcpy(x4->sei, nal[i].p_payload, nal[i].i_payload);
572 continue;
573 }
574 memcpy(p, nal[i].p_payload, nal[i].i_payload);
575 p += nal[i].i_payload;
576 }
577 avctx->extradata_size = p - avctx->extradata;
578 }
579
580 return 0;
581 }
582
583 static const enum AVPixelFormat pix_fmts_8bit[] = {
584 AV_PIX_FMT_YUV420P,
585 AV_PIX_FMT_YUVJ420P,
586 AV_PIX_FMT_YUV422P,
587 AV_PIX_FMT_YUVJ422P,
588 AV_PIX_FMT_YUV444P,
589 AV_PIX_FMT_YUVJ444P,
590 AV_PIX_FMT_NV12,
591 AV_PIX_FMT_NV16,
592 AV_PIX_FMT_NONE
593 };
594 static const enum AVPixelFormat pix_fmts_9bit[] = {
595 AV_PIX_FMT_YUV420P9,
596 AV_PIX_FMT_YUV444P9,
597 AV_PIX_FMT_NONE
598 };
599 static const enum AVPixelFormat pix_fmts_10bit[] = {
600 AV_PIX_FMT_YUV420P10,
601 AV_PIX_FMT_YUV422P10,
602 AV_PIX_FMT_YUV444P10,
603 AV_PIX_FMT_NV20,
604 AV_PIX_FMT_NONE
605 };
606
607 static av_cold void X264_init_static(AVCodec *codec)
608 {
609 if (x264_bit_depth == 8)
610 codec->pix_fmts = pix_fmts_8bit;
611 else if (x264_bit_depth == 9)
612 codec->pix_fmts = pix_fmts_9bit;
613 else if (x264_bit_depth == 10)
614 codec->pix_fmts = pix_fmts_10bit;
615 }
616
617 #define OFFSET(x) offsetof(X264Context, x)
618 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
619 static const AVOption options[] = {
620 { "preset", "Set the encoding preset (cf. x264 --fullhelp)", OFFSET(preset), AV_OPT_TYPE_STRING, { .str = "medium" }, 0, 0, VE},
621 { "tune", "Tune the encoding params (cf. x264 --fullhelp)", OFFSET(tune), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
622 { "profile", "Set profile restrictions (cf. x264 --fullhelp) ", OFFSET(profile), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
623 { "fastfirstpass", "Use fast settings when encoding first pass", OFFSET(fastfirstpass), AV_OPT_TYPE_INT, { .i64 = 1 }, 0, 1, VE},
624 { "crf", "Select the quality for constant quality mode", OFFSET(crf), AV_OPT_TYPE_FLOAT, {.dbl = -1 }, -1, FLT_MAX, VE },
625 { "crf_max", "In CRF mode, prevents VBV from lowering quality beyond this point.",OFFSET(crf_max), AV_OPT_TYPE_FLOAT, {.dbl = -1 }, -1, FLT_MAX, VE },
626 { "qp", "Constant quantization parameter rate control method",OFFSET(cqp), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE },
627 { "aq-mode", "AQ method", OFFSET(aq_mode), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "aq_mode"},
628 { "none", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_AQ_NONE}, INT_MIN, INT_MAX, VE, "aq_mode" },
629 { "variance", "Variance AQ (complexity mask)", 0, AV_OPT_TYPE_CONST, {.i64 = X264_AQ_VARIANCE}, INT_MIN, INT_MAX, VE, "aq_mode" },
630 { "autovariance", "Auto-variance AQ (experimental)", 0, AV_OPT_TYPE_CONST, {.i64 = X264_AQ_AUTOVARIANCE}, INT_MIN, INT_MAX, VE, "aq_mode" },
631 { "aq-strength", "AQ strength. Reduces blocking and blurring in flat and textured areas.", OFFSET(aq_strength), AV_OPT_TYPE_FLOAT, {.dbl = -1}, -1, FLT_MAX, VE},
632 { "psy", "Use psychovisual optimizations.", OFFSET(psy), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
633 { "psy-rd", "Strength of psychovisual optimization, in <psy-rd>:<psy-trellis> format.", OFFSET(psy_rd), AV_OPT_TYPE_STRING, {0 }, 0, 0, VE},
634 { "rc-lookahead", "Number of frames to look ahead for frametype and ratecontrol", OFFSET(rc_lookahead), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE },
635 { "weightb", "Weighted prediction for B-frames.", OFFSET(weightb), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
636 { "weightp", "Weighted prediction analysis method.", OFFSET(weightp), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "weightp" },
637 { "none", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_WEIGHTP_NONE}, INT_MIN, INT_MAX, VE, "weightp" },
638 { "simple", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_WEIGHTP_SIMPLE}, INT_MIN, INT_MAX, VE, "weightp" },
639 { "smart", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_WEIGHTP_SMART}, INT_MIN, INT_MAX, VE, "weightp" },
640 { "ssim", "Calculate and print SSIM stats.", OFFSET(ssim), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
641 { "intra-refresh", "Use Periodic Intra Refresh instead of IDR frames.",OFFSET(intra_refresh),AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
642 { "bluray-compat", "Bluray compatibility workarounds.", OFFSET(bluray_compat) ,AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
643 { "b-bias", "Influences how often B-frames are used", OFFSET(b_bias), AV_OPT_TYPE_INT, { .i64 = INT_MIN}, INT_MIN, INT_MAX, VE },
644 { "b-pyramid", "Keep some B-frames as references.", OFFSET(b_pyramid), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "b_pyramid" },
645 { "none", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_B_PYRAMID_NONE}, INT_MIN, INT_MAX, VE, "b_pyramid" },
646 { "strict", "Strictly hierarchical pyramid", 0, AV_OPT_TYPE_CONST, {.i64 = X264_B_PYRAMID_STRICT}, INT_MIN, INT_MAX, VE, "b_pyramid" },
647 { "normal", "Non-strict (not Blu-ray compatible)", 0, AV_OPT_TYPE_CONST, {.i64 = X264_B_PYRAMID_NORMAL}, INT_MIN, INT_MAX, VE, "b_pyramid" },
648 { "mixed-refs", "One reference per partition, as opposed to one reference per macroblock", OFFSET(mixed_refs), AV_OPT_TYPE_INT, { .i64 = -1}, -1, 1, VE },
649 { "8x8dct", "High profile 8x8 transform.", OFFSET(dct8x8), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE},
650 { "fast-pskip", NULL, OFFSET(fast_pskip), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE},
651 { "aud", "Use access unit delimiters.", OFFSET(aud), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE},
652 { "mbtree", "Use macroblock tree ratecontrol.", OFFSET(mbtree), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE},
653 { "deblock", "Loop filter parameters, in <alpha:beta> form.", OFFSET(deblock), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
654 { "cplxblur", "Reduce fluctuations in QP (before curve compression)", OFFSET(cplxblur), AV_OPT_TYPE_FLOAT, {.dbl = -1 }, -1, FLT_MAX, VE},
655 { "partitions", "A comma-separated list of partitions to consider. "
656 "Possible values: p8x8, p4x4, b8x8, i8x8, i4x4, none, all", OFFSET(partitions), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
657 { "direct-pred", "Direct MV prediction mode", OFFSET(direct_pred), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "direct-pred" },
658 { "none", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_NONE }, 0, 0, VE, "direct-pred" },
659 { "spatial", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_SPATIAL }, 0, 0, VE, "direct-pred" },
660 { "temporal", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_TEMPORAL }, 0, 0, VE, "direct-pred" },
661 { "auto", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_AUTO }, 0, 0, VE, "direct-pred" },
662 { "slice-max-size","Limit the size of each slice in bytes", OFFSET(slice_max_size),AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE },
663 { "stats", "Filename for 2 pass stats", OFFSET(stats), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE },
664 { "nal-hrd", "Signal HRD information (requires vbv-bufsize; "
665 "cbr not allowed in .mp4)", OFFSET(nal_hrd), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "nal-hrd" },
666 { "none", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_NAL_HRD_NONE}, INT_MIN, INT_MAX, VE, "nal-hrd" },
667 { "vbr", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_NAL_HRD_VBR}, INT_MIN, INT_MAX, VE, "nal-hrd" },
668 { "cbr", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_NAL_HRD_CBR}, INT_MIN, INT_MAX, VE, "nal-hrd" },
669 { "x264-params", "Override the x264 configuration using a :-separated list of key=value parameters", OFFSET(x264_params), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE },
670 { NULL },
671 };
672
673 static const AVCodecDefault x264_defaults[] = {
674 { "b", "0" },
675 { "bf", "-1" },
676 { "g", "-1" },
677 { "i_qfactor", "-1" },
678 { "qmin", "-1" },
679 { "qmax", "-1" },
680 { "qdiff", "-1" },
681 { "qblur", "-1" },
682 { "qcomp", "-1" },
683 { "refs", "-1" },
684 { "sc_threshold", "-1" },
685 { "trellis", "-1" },
686 { "nr", "-1" },
687 { "me_range", "-1" },
688 { "me_method", "-1" },
689 { "subq", "-1" },
690 { "b_strategy", "-1" },
691 { "keyint_min", "-1" },
692 { "coder", "-1" },
693 { "cmp", "-1" },
694 { "threads", AV_STRINGIFY(X264_THREADS_AUTO) },
695 { "thread_type", "0" },
696 { "flags", "+cgop" },
697 { "rc_init_occupancy","-1" },
698 { NULL },
699 };
700
#if CONFIG_LIBX264_ENCODER
/* AVClass exposing the private option table for the H.264 wrapper. */
static const AVClass class = {
    .class_name = "libx264",
    .item_name  = av_default_item_name,
    .option     = options,
    .version    = LIBAVUTIL_VERSION_INT,
};

/* H.264 encoder registration; the supported pixel formats are filled in
 * at runtime by X264_init_static(). */
AVCodec ff_libx264_encoder = {
    .name             = "libx264",
    .long_name        = NULL_IF_CONFIG_SMALL("libx264 H.264 / AVC / MPEG-4 AVC / MPEG-4 part 10"),
    .type             = AVMEDIA_TYPE_VIDEO,
    .id               = AV_CODEC_ID_H264,
    .priv_data_size   = sizeof(X264Context),
    .init             = X264_init,
    .encode2          = X264_frame,
    .close            = X264_close,
    .capabilities     = CODEC_CAP_DELAY | CODEC_CAP_AUTO_THREADS,
    .priv_class       = &class,
    .defaults         = x264_defaults,
    .init_static_data = X264_init_static,
    .caps_internal    = FF_CODEC_CAP_INIT_THREADSAFE |
                        FF_CODEC_CAP_INIT_CLEANUP,
};
#endif /* CONFIG_LIBX264_ENCODER */
726
#if CONFIG_LIBX262_ENCODER
/* AVClass exposing the private option table for the MPEG-2 wrapper. */
static const AVClass X262_class = {
    .class_name = "libx262",
    .item_name  = av_default_item_name,
    .option     = options,
    .version    = LIBAVUTIL_VERSION_INT,
};

/* MPEG-2 encoder registration; shares init/encode/close with the H.264
 * wrapper and always advertises the 8-bit pixel format list. */
AVCodec ff_libx262_encoder = {
    .name           = "libx262",
    .long_name      = NULL_IF_CONFIG_SMALL("libx262 MPEG2VIDEO"),
    .type           = AVMEDIA_TYPE_VIDEO,
    .id             = AV_CODEC_ID_MPEG2VIDEO,
    .priv_data_size = sizeof(X264Context),
    .init           = X264_init,
    .encode2        = X264_frame,
    .close          = X264_close,
    .capabilities   = CODEC_CAP_DELAY | CODEC_CAP_AUTO_THREADS,
    .priv_class     = &X262_class,
    .defaults       = x264_defaults,
    .pix_fmts       = pix_fmts_8bit,
    .caps_internal  = FF_CODEC_CAP_INIT_THREADSAFE |
                      FF_CODEC_CAP_INIT_CLEANUP,
};
#endif /* CONFIG_LIBX262_ENCODER */