Libav
libx264.c
Go to the documentation of this file.
1 /*
2  * H.264 encoding using the x264 library
3  * Copyright (C) 2005 Mans Rullgard <mans@mansr.com>
4  *
5  * This file is part of Libav.
6  *
7  * Libav is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * Libav is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with Libav; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include "libavutil/internal.h"
23 #include "libavutil/opt.h"
24 #include "libavutil/mem.h"
25 #include "libavutil/pixdesc.h"
26 #include "libavutil/stereo3d.h"
27 #include "avcodec.h"
28 #include "internal.h"
29 
30 #if defined(_MSC_VER)
31 #define X264_API_IMPORTS 1
32 #endif
33 
34 #include <x264.h>
35 #include <float.h>
36 #include <math.h>
37 #include <stdio.h>
38 #include <stdlib.h>
39 #include <string.h>
40 
41 typedef struct X264Context {
42  AVClass *class;
43  x264_param_t params;
44  x264_t *enc;
45  x264_picture_t pic;
47  int sei_size;
48  char *preset;
49  char *tune;
50  char *profile;
52  float crf;
53  float crf_max;
54  int cqp;
55  int aq_mode;
56  float aq_strength;
57  char *psy_rd;
58  int psy;
60  int weightp;
61  int weightb;
62  int ssim;
65  int b_bias;
66  int b_pyramid;
68  int dct8x8;
70  int aud;
71  int mbtree;
72  char *deblock;
73  float cplxblur;
74  char *partitions;
77  char *stats;
78  int nal_hrd;
79  char *x264_params;
80 } X264Context;
81 
82 static void X264_log(void *p, int level, const char *fmt, va_list args)
83 {
84  static const int level_map[] = {
85  [X264_LOG_ERROR] = AV_LOG_ERROR,
86  [X264_LOG_WARNING] = AV_LOG_WARNING,
87  [X264_LOG_INFO] = AV_LOG_INFO,
88  [X264_LOG_DEBUG] = AV_LOG_DEBUG
89  };
90 
91  if (level < 0 || level > X264_LOG_DEBUG)
92  return;
93 
94  av_vlog(p, level_map[level], fmt, args);
95 }
96 
97 
98 static int encode_nals(AVCodecContext *ctx, AVPacket *pkt,
99  x264_nal_t *nals, int nnal)
100 {
101  X264Context *x4 = ctx->priv_data;
102  uint8_t *p;
103  int i, size = x4->sei_size, ret;
104 
105  if (!nnal)
106  return 0;
107 
108  for (i = 0; i < nnal; i++)
109  size += nals[i].i_payload;
110 
111  if ((ret = ff_alloc_packet(pkt, size)) < 0)
112  return ret;
113 
114  p = pkt->data;
115 
116  /* Write the SEI as part of the first frame. */
117  if (x4->sei_size > 0 && nnal > 0) {
118  memcpy(p, x4->sei, x4->sei_size);
119  p += x4->sei_size;
120  x4->sei_size = 0;
121  }
122 
123  for (i = 0; i < nnal; i++){
124  memcpy(p, nals[i].p_payload, nals[i].i_payload);
125  p += nals[i].i_payload;
126  }
127 
128  return 1;
129 }
130 
131 static int X264_frame(AVCodecContext *ctx, AVPacket *pkt, const AVFrame *frame,
132  int *got_packet)
133 {
134  X264Context *x4 = ctx->priv_data;
135  x264_nal_t *nal;
136  int nnal, i, ret;
137  x264_picture_t pic_out;
138  AVFrameSideData *side_data;
139 
140  x264_picture_init( &x4->pic );
141  x4->pic.img.i_csp = x4->params.i_csp;
142  if (x264_bit_depth > 8)
143  x4->pic.img.i_csp |= X264_CSP_HIGH_DEPTH;
144  x4->pic.img.i_plane = 3;
145 
146  if (frame) {
147  for (i = 0; i < 3; i++) {
148  x4->pic.img.plane[i] = frame->data[i];
149  x4->pic.img.i_stride[i] = frame->linesize[i];
150  }
151 
152  x4->pic.i_pts = frame->pts;
153  x4->pic.i_type =
154  frame->pict_type == AV_PICTURE_TYPE_I ? X264_TYPE_KEYFRAME :
155  frame->pict_type == AV_PICTURE_TYPE_P ? X264_TYPE_P :
156  frame->pict_type == AV_PICTURE_TYPE_B ? X264_TYPE_B :
157  X264_TYPE_AUTO;
158  if (x4->params.b_tff != frame->top_field_first) {
159  x4->params.b_tff = frame->top_field_first;
160  x264_encoder_reconfig(x4->enc, &x4->params);
161  }
162  if (x4->params.vui.i_sar_height != ctx->sample_aspect_ratio.den ||
163  x4->params.vui.i_sar_width != ctx->sample_aspect_ratio.num) {
164  x4->params.vui.i_sar_height = ctx->sample_aspect_ratio.den;
165  x4->params.vui.i_sar_width = ctx->sample_aspect_ratio.num;
166  x264_encoder_reconfig(x4->enc, &x4->params);
167  }
168 
170  if (side_data) {
171  AVStereo3D *stereo = (AVStereo3D *)side_data->data;
172  int fpa_type;
173 
174  switch (stereo->type) {
176  fpa_type = 0;
177  break;
178  case AV_STEREO3D_LINES:
179  fpa_type = 1;
180  break;
181  case AV_STEREO3D_COLUMNS:
182  fpa_type = 2;
183  break;
185  fpa_type = 3;
186  break;
188  fpa_type = 4;
189  break;
191  fpa_type = 5;
192  break;
193  default:
194  fpa_type = -1;
195  break;
196  }
197 
198  if (fpa_type != x4->params.i_frame_packing) {
199  x4->params.i_frame_packing = fpa_type;
200  x264_encoder_reconfig(x4->enc, &x4->params);
201  }
202  }
203  }
204  do {
205  if (x264_encoder_encode(x4->enc, &nal, &nnal, frame? &x4->pic: NULL, &pic_out) < 0)
206  return -1;
207 
208  ret = encode_nals(ctx, pkt, nal, nnal);
209  if (ret < 0)
210  return -1;
211  } while (!ret && !frame && x264_encoder_delayed_frames(x4->enc));
212 
213  pkt->pts = pic_out.i_pts;
214  pkt->dts = pic_out.i_dts;
215 
216  switch (pic_out.i_type) {
217  case X264_TYPE_IDR:
218  case X264_TYPE_I:
220  break;
221  case X264_TYPE_P:
223  break;
224  case X264_TYPE_B:
225  case X264_TYPE_BREF:
227  break;
228  }
229 
230  pkt->flags |= AV_PKT_FLAG_KEY*pic_out.b_keyframe;
231  if (ret)
232  ctx->coded_frame->quality = (pic_out.i_qpplus1 - 1) * FF_QP2LAMBDA;
233 
234  *got_packet = ret;
235  return 0;
236 }
237 
239 {
240  X264Context *x4 = avctx->priv_data;
241 
242  av_freep(&avctx->extradata);
243  av_free(x4->sei);
244 
245  if (x4->enc)
246  x264_encoder_close(x4->enc);
247 
248  av_frame_free(&avctx->coded_frame);
249 
250  return 0;
251 }
252 
254 {
255  switch (pix_fmt) {
256  case AV_PIX_FMT_YUV420P:
257  case AV_PIX_FMT_YUVJ420P:
258  case AV_PIX_FMT_YUV420P9:
259  case AV_PIX_FMT_YUV420P10: return X264_CSP_I420;
260  case AV_PIX_FMT_YUV422P:
261  case AV_PIX_FMT_YUV422P10: return X264_CSP_I422;
262  case AV_PIX_FMT_YUV444P:
263  case AV_PIX_FMT_YUV444P9:
264  case AV_PIX_FMT_YUV444P10: return X264_CSP_I444;
265  case AV_PIX_FMT_NV12: return X264_CSP_NV12;
266  case AV_PIX_FMT_NV16:
267  case AV_PIX_FMT_NV20: return X264_CSP_NV16;
268  };
269  return 0;
270 }
271 
/*
 * Feed the string option x4->var, when set, to x264_param_parse() under the
 * x264 option name `name`. On a parse error the macro logs the failure and
 * returns AVERROR(EINVAL) from the enclosing function, so it may only be
 * used where `x4` and `avctx` are in scope and such a return is valid.
 * Wrapped in do/while(0) so it behaves as one statement after if/else.
 */
#define PARSE_X264_OPT(name, var)\
    do {\
        if (x4->var && x264_param_parse(&x4->params, name, x4->var) < 0) {\
            av_log(avctx, AV_LOG_ERROR, "Error parsing option '%s' with value '%s'.\n", name, x4->var);\
            return AVERROR(EINVAL);\
        }\
    } while (0)
277 
278 static av_cold int X264_init(AVCodecContext *avctx)
279 {
280  X264Context *x4 = avctx->priv_data;
281 
282  x264_param_default(&x4->params);
283 
284  x4->params.b_deblocking_filter = avctx->flags & CODEC_FLAG_LOOP_FILTER;
285 
286  if (x4->preset || x4->tune)
287  if (x264_param_default_preset(&x4->params, x4->preset, x4->tune) < 0) {
288  av_log(avctx, AV_LOG_ERROR, "Error setting preset/tune %s/%s.\n", x4->preset, x4->tune);
289  return AVERROR(EINVAL);
290  }
291 
292  if (avctx->level > 0)
293  x4->params.i_level_idc = avctx->level;
294 
295  x4->params.pf_log = X264_log;
296  x4->params.p_log_private = avctx;
297  x4->params.i_log_level = X264_LOG_DEBUG;
298  x4->params.i_csp = convert_pix_fmt(avctx->pix_fmt);
299 
300  if (avctx->bit_rate) {
301  x4->params.rc.i_bitrate = avctx->bit_rate / 1000;
302  x4->params.rc.i_rc_method = X264_RC_ABR;
303  }
304  x4->params.rc.i_vbv_buffer_size = avctx->rc_buffer_size / 1000;
305  x4->params.rc.i_vbv_max_bitrate = avctx->rc_max_rate / 1000;
306  x4->params.rc.b_stat_write = avctx->flags & CODEC_FLAG_PASS1;
307  if (avctx->flags & CODEC_FLAG_PASS2) {
308  x4->params.rc.b_stat_read = 1;
309  } else {
310  if (x4->crf >= 0) {
311  x4->params.rc.i_rc_method = X264_RC_CRF;
312  x4->params.rc.f_rf_constant = x4->crf;
313  } else if (x4->cqp >= 0) {
314  x4->params.rc.i_rc_method = X264_RC_CQP;
315  x4->params.rc.i_qp_constant = x4->cqp;
316  }
317 
318  if (x4->crf_max >= 0)
319  x4->params.rc.f_rf_constant_max = x4->crf_max;
320  }
321 
322  if (avctx->rc_buffer_size && avctx->rc_initial_buffer_occupancy > 0 &&
323  (avctx->rc_initial_buffer_occupancy <= avctx->rc_buffer_size)) {
324  x4->params.rc.f_vbv_buffer_init =
325  (float)avctx->rc_initial_buffer_occupancy / avctx->rc_buffer_size;
326  }
327 
328  if (avctx->i_quant_factor > 0)
329  x4->params.rc.f_ip_factor = 1 / fabs(avctx->i_quant_factor);
330  x4->params.rc.f_pb_factor = avctx->b_quant_factor;
331  x4->params.analyse.i_chroma_qp_offset = avctx->chromaoffset;
332 
333  if (avctx->me_method == ME_EPZS)
334  x4->params.analyse.i_me_method = X264_ME_DIA;
335  else if (avctx->me_method == ME_HEX)
336  x4->params.analyse.i_me_method = X264_ME_HEX;
337  else if (avctx->me_method == ME_UMH)
338  x4->params.analyse.i_me_method = X264_ME_UMH;
339  else if (avctx->me_method == ME_FULL)
340  x4->params.analyse.i_me_method = X264_ME_ESA;
341  else if (avctx->me_method == ME_TESA)
342  x4->params.analyse.i_me_method = X264_ME_TESA;
343 
344  if (avctx->gop_size >= 0)
345  x4->params.i_keyint_max = avctx->gop_size;
346  if (avctx->max_b_frames >= 0)
347  x4->params.i_bframe = avctx->max_b_frames;
348  if (avctx->scenechange_threshold >= 0)
349  x4->params.i_scenecut_threshold = avctx->scenechange_threshold;
350  if (avctx->qmin >= 0)
351  x4->params.rc.i_qp_min = avctx->qmin;
352  if (avctx->qmax >= 0)
353  x4->params.rc.i_qp_max = avctx->qmax;
354  if (avctx->max_qdiff >= 0)
355  x4->params.rc.i_qp_step = avctx->max_qdiff;
356  if (avctx->qblur >= 0)
357  x4->params.rc.f_qblur = avctx->qblur; /* temporally blur quants */
358  if (avctx->qcompress >= 0)
359  x4->params.rc.f_qcompress = avctx->qcompress; /* 0.0 => cbr, 1.0 => constant qp */
360  if (avctx->refs >= 0)
361  x4->params.i_frame_reference = avctx->refs;
362  if (avctx->trellis >= 0)
363  x4->params.analyse.i_trellis = avctx->trellis;
364  if (avctx->me_range >= 0)
365  x4->params.analyse.i_me_range = avctx->me_range;
366  if (avctx->noise_reduction >= 0)
367  x4->params.analyse.i_noise_reduction = avctx->noise_reduction;
368  if (avctx->me_subpel_quality >= 0)
369  x4->params.analyse.i_subpel_refine = avctx->me_subpel_quality;
370  if (avctx->b_frame_strategy >= 0)
371  x4->params.i_bframe_adaptive = avctx->b_frame_strategy;
372  if (avctx->keyint_min >= 0)
373  x4->params.i_keyint_min = avctx->keyint_min;
374  if (avctx->coder_type >= 0)
375  x4->params.b_cabac = avctx->coder_type == FF_CODER_TYPE_AC;
376  if (avctx->me_cmp >= 0)
377  x4->params.analyse.b_chroma_me = avctx->me_cmp & FF_CMP_CHROMA;
378 
379  if (x4->aq_mode >= 0)
380  x4->params.rc.i_aq_mode = x4->aq_mode;
381  if (x4->aq_strength >= 0)
382  x4->params.rc.f_aq_strength = x4->aq_strength;
383  PARSE_X264_OPT("psy-rd", psy_rd);
384  PARSE_X264_OPT("deblock", deblock);
385  PARSE_X264_OPT("partitions", partitions);
386  PARSE_X264_OPT("stats", stats);
387  if (x4->psy >= 0)
388  x4->params.analyse.b_psy = x4->psy;
389  if (x4->rc_lookahead >= 0)
390  x4->params.rc.i_lookahead = x4->rc_lookahead;
391  if (x4->weightp >= 0)
392  x4->params.analyse.i_weighted_pred = x4->weightp;
393  if (x4->weightb >= 0)
394  x4->params.analyse.b_weighted_bipred = x4->weightb;
395  if (x4->cplxblur >= 0)
396  x4->params.rc.f_complexity_blur = x4->cplxblur;
397 
398  if (x4->ssim >= 0)
399  x4->params.analyse.b_ssim = x4->ssim;
400  if (x4->intra_refresh >= 0)
401  x4->params.b_intra_refresh = x4->intra_refresh;
402  if (x4->bluray_compat >= 0) {
403  x4->params.b_bluray_compat = x4->bluray_compat;
404  x4->params.b_vfr_input = 0;
405  }
406  if (x4->b_bias != INT_MIN)
407  x4->params.i_bframe_bias = x4->b_bias;
408  if (x4->b_pyramid >= 0)
409  x4->params.i_bframe_pyramid = x4->b_pyramid;
410  if (x4->mixed_refs >= 0)
411  x4->params.analyse.b_mixed_references = x4->mixed_refs;
412  if (x4->dct8x8 >= 0)
413  x4->params.analyse.b_transform_8x8 = x4->dct8x8;
414  if (x4->fast_pskip >= 0)
415  x4->params.analyse.b_fast_pskip = x4->fast_pskip;
416  if (x4->aud >= 0)
417  x4->params.b_aud = x4->aud;
418  if (x4->mbtree >= 0)
419  x4->params.rc.b_mb_tree = x4->mbtree;
420  if (x4->direct_pred >= 0)
421  x4->params.analyse.i_direct_mv_pred = x4->direct_pred;
422 
423  if (x4->slice_max_size >= 0)
424  x4->params.i_slice_max_size = x4->slice_max_size;
425 
426  if (x4->fastfirstpass)
427  x264_param_apply_fastfirstpass(&x4->params);
428 
429  if (x4->nal_hrd >= 0)
430  x4->params.i_nal_hrd = x4->nal_hrd;
431 
432  if (x4->profile)
433  if (x264_param_apply_profile(&x4->params, x4->profile) < 0) {
434  av_log(avctx, AV_LOG_ERROR, "Error setting profile %s.\n", x4->profile);
435  return AVERROR(EINVAL);
436  }
437 
438  x4->params.i_width = avctx->width;
439  x4->params.i_height = avctx->height;
440  x4->params.vui.i_sar_width = avctx->sample_aspect_ratio.num;
441  x4->params.vui.i_sar_height = avctx->sample_aspect_ratio.den;
442  x4->params.i_fps_num = x4->params.i_timebase_den = avctx->time_base.den;
443  x4->params.i_fps_den = x4->params.i_timebase_num = avctx->time_base.num;
444 
445  x4->params.analyse.b_psnr = avctx->flags & CODEC_FLAG_PSNR;
446 
447  x4->params.i_threads = avctx->thread_count;
448  if (avctx->thread_type)
449  x4->params.b_sliced_threads = avctx->thread_type == FF_THREAD_SLICE;
450 
451  x4->params.b_interlaced = avctx->flags & CODEC_FLAG_INTERLACED_DCT;
452 
453  x4->params.b_open_gop = !(avctx->flags & CODEC_FLAG_CLOSED_GOP);
454 
455  x4->params.i_slice_count = avctx->slices;
456 
457  x4->params.vui.b_fullrange = avctx->pix_fmt == AV_PIX_FMT_YUVJ420P;
458 
459  if (avctx->flags & CODEC_FLAG_GLOBAL_HEADER)
460  x4->params.b_repeat_headers = 0;
461 
462  if (x4->x264_params) {
463  AVDictionary *dict = NULL;
464  AVDictionaryEntry *en = NULL;
465 
466  if (!av_dict_parse_string(&dict, x4->x264_params, "=", ":", 0)) {
467  while ((en = av_dict_get(dict, "", en, AV_DICT_IGNORE_SUFFIX))) {
468  if (x264_param_parse(&x4->params, en->key, en->value) < 0)
469  av_log(avctx, AV_LOG_WARNING,
470  "Error parsing option '%s = %s'.\n",
471  en->key, en->value);
472  }
473 
474  av_dict_free(&dict);
475  }
476  }
477 
478  // update AVCodecContext with x264 parameters
479  avctx->has_b_frames = x4->params.i_bframe ?
480  x4->params.i_bframe_pyramid ? 2 : 1 : 0;
481  if (avctx->max_b_frames < 0)
482  avctx->max_b_frames = 0;
483 
484  avctx->bit_rate = x4->params.rc.i_bitrate*1000;
485 
486  x4->enc = x264_encoder_open(&x4->params);
487  if (!x4->enc)
488  return -1;
489 
490  avctx->coded_frame = av_frame_alloc();
491  if (!avctx->coded_frame)
492  return AVERROR(ENOMEM);
493 
494  if (avctx->flags & CODEC_FLAG_GLOBAL_HEADER) {
495  x264_nal_t *nal;
496  uint8_t *p;
497  int nnal, s, i;
498 
499  s = x264_encoder_headers(x4->enc, &nal, &nnal);
500  avctx->extradata = p = av_malloc(s);
501 
502  for (i = 0; i < nnal; i++) {
503  /* Don't put the SEI in extradata. */
504  if (nal[i].i_type == NAL_SEI) {
505  av_log(avctx, AV_LOG_INFO, "%s\n", nal[i].p_payload+25);
506  x4->sei_size = nal[i].i_payload;
507  x4->sei = av_malloc(x4->sei_size);
508  memcpy(x4->sei, nal[i].p_payload, nal[i].i_payload);
509  continue;
510  }
511  memcpy(p, nal[i].p_payload, nal[i].i_payload);
512  p += nal[i].i_payload;
513  }
514  avctx->extradata_size = p - avctx->extradata;
515  }
516 
517  return 0;
518 }
519 
520 static const enum AVPixelFormat pix_fmts_8bit[] = {
528 };
529 static const enum AVPixelFormat pix_fmts_9bit[] = {
533 };
534 static const enum AVPixelFormat pix_fmts_10bit[] = {
540 };
541 
542 static av_cold void X264_init_static(AVCodec *codec)
543 {
544  if (x264_bit_depth == 8)
545  codec->pix_fmts = pix_fmts_8bit;
546  else if (x264_bit_depth == 9)
547  codec->pix_fmts = pix_fmts_9bit;
548  else if (x264_bit_depth == 10)
549  codec->pix_fmts = pix_fmts_10bit;
550 }
551 
552 #define OFFSET(x) offsetof(X264Context, x)
553 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
554 static const AVOption options[] = {
555  { "preset", "Set the encoding preset (cf. x264 --fullhelp)", OFFSET(preset), AV_OPT_TYPE_STRING, { .str = "medium" }, 0, 0, VE},
556  { "tune", "Tune the encoding params (cf. x264 --fullhelp)", OFFSET(tune), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
557  { "profile", "Set profile restrictions (cf. x264 --fullhelp) ", OFFSET(profile), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
558  { "fastfirstpass", "Use fast settings when encoding first pass", OFFSET(fastfirstpass), AV_OPT_TYPE_INT, { .i64 = 1 }, 0, 1, VE},
559  { "crf", "Select the quality for constant quality mode", OFFSET(crf), AV_OPT_TYPE_FLOAT, {.dbl = -1 }, -1, FLT_MAX, VE },
560  { "crf_max", "In CRF mode, prevents VBV from lowering quality beyond this point.",OFFSET(crf_max), AV_OPT_TYPE_FLOAT, {.dbl = -1 }, -1, FLT_MAX, VE },
561  { "qp", "Constant quantization parameter rate control method",OFFSET(cqp), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE },
562  { "aq-mode", "AQ method", OFFSET(aq_mode), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "aq_mode"},
563  { "none", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_AQ_NONE}, INT_MIN, INT_MAX, VE, "aq_mode" },
564  { "variance", "Variance AQ (complexity mask)", 0, AV_OPT_TYPE_CONST, {.i64 = X264_AQ_VARIANCE}, INT_MIN, INT_MAX, VE, "aq_mode" },
565  { "autovariance", "Auto-variance AQ (experimental)", 0, AV_OPT_TYPE_CONST, {.i64 = X264_AQ_AUTOVARIANCE}, INT_MIN, INT_MAX, VE, "aq_mode" },
566  { "aq-strength", "AQ strength. Reduces blocking and blurring in flat and textured areas.", OFFSET(aq_strength), AV_OPT_TYPE_FLOAT, {.dbl = -1}, -1, FLT_MAX, VE},
567  { "psy", "Use psychovisual optimizations.", OFFSET(psy), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
568  { "psy-rd", "Strength of psychovisual optimization, in <psy-rd>:<psy-trellis> format.", OFFSET(psy_rd), AV_OPT_TYPE_STRING, {0 }, 0, 0, VE},
569  { "rc-lookahead", "Number of frames to look ahead for frametype and ratecontrol", OFFSET(rc_lookahead), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE },
570  { "weightb", "Weighted prediction for B-frames.", OFFSET(weightb), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
571  { "weightp", "Weighted prediction analysis method.", OFFSET(weightp), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "weightp" },
572  { "none", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_WEIGHTP_NONE}, INT_MIN, INT_MAX, VE, "weightp" },
573  { "simple", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_WEIGHTP_SIMPLE}, INT_MIN, INT_MAX, VE, "weightp" },
574  { "smart", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_WEIGHTP_SMART}, INT_MIN, INT_MAX, VE, "weightp" },
575  { "ssim", "Calculate and print SSIM stats.", OFFSET(ssim), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
576  { "intra-refresh", "Use Periodic Intra Refresh instead of IDR frames.",OFFSET(intra_refresh),AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
577  { "bluray-compat", "Bluray compatibility workarounds.", OFFSET(bluray_compat) ,AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
578  { "b-bias", "Influences how often B-frames are used", OFFSET(b_bias), AV_OPT_TYPE_INT, { .i64 = INT_MIN}, INT_MIN, INT_MAX, VE },
579  { "b-pyramid", "Keep some B-frames as references.", OFFSET(b_pyramid), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "b_pyramid" },
580  { "none", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_B_PYRAMID_NONE}, INT_MIN, INT_MAX, VE, "b_pyramid" },
581  { "strict", "Strictly hierarchical pyramid", 0, AV_OPT_TYPE_CONST, {.i64 = X264_B_PYRAMID_STRICT}, INT_MIN, INT_MAX, VE, "b_pyramid" },
582  { "normal", "Non-strict (not Blu-ray compatible)", 0, AV_OPT_TYPE_CONST, {.i64 = X264_B_PYRAMID_NORMAL}, INT_MIN, INT_MAX, VE, "b_pyramid" },
583  { "mixed-refs", "One reference per partition, as opposed to one reference per macroblock", OFFSET(mixed_refs), AV_OPT_TYPE_INT, { .i64 = -1}, -1, 1, VE },
584  { "8x8dct", "High profile 8x8 transform.", OFFSET(dct8x8), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE},
585  { "fast-pskip", NULL, OFFSET(fast_pskip), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE},
586  { "aud", "Use access unit delimiters.", OFFSET(aud), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE},
587  { "mbtree", "Use macroblock tree ratecontrol.", OFFSET(mbtree), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE},
588  { "deblock", "Loop filter parameters, in <alpha:beta> form.", OFFSET(deblock), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
589  { "cplxblur", "Reduce fluctuations in QP (before curve compression)", OFFSET(cplxblur), AV_OPT_TYPE_FLOAT, {.dbl = -1 }, -1, FLT_MAX, VE},
590  { "partitions", "A comma-separated list of partitions to consider. "
591  "Possible values: p8x8, p4x4, b8x8, i8x8, i4x4, none, all", OFFSET(partitions), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
592  { "direct-pred", "Direct MV prediction mode", OFFSET(direct_pred), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "direct-pred" },
593  { "none", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_NONE }, 0, 0, VE, "direct-pred" },
594  { "spatial", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_SPATIAL }, 0, 0, VE, "direct-pred" },
595  { "temporal", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_TEMPORAL }, 0, 0, VE, "direct-pred" },
596  { "auto", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_AUTO }, 0, 0, VE, "direct-pred" },
597  { "slice-max-size","Limit the size of each slice in bytes", OFFSET(slice_max_size),AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE },
598  { "stats", "Filename for 2 pass stats", OFFSET(stats), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE },
599  { "nal-hrd", "Signal HRD information (requires vbv-bufsize; "
600  "cbr not allowed in .mp4)", OFFSET(nal_hrd), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "nal-hrd" },
601  { "none", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_NAL_HRD_NONE}, INT_MIN, INT_MAX, VE, "nal-hrd" },
602  { "vbr", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_NAL_HRD_VBR}, INT_MIN, INT_MAX, VE, "nal-hrd" },
603  { "cbr", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_NAL_HRD_CBR}, INT_MIN, INT_MAX, VE, "nal-hrd" },
604  { "x264-params", "Override the x264 configuration using a :-separated list of key=value parameters", OFFSET(x264_params), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE },
605  { NULL },
606 };
607 
608 static const AVClass class = {
609  .class_name = "libx264",
610  .item_name = av_default_item_name,
611  .option = options,
613 };
614 
615 static const AVCodecDefault x264_defaults[] = {
616  { "b", "0" },
617  { "bf", "-1" },
618  { "g", "-1" },
619  { "i_qfactor", "-1" },
620  { "qmin", "-1" },
621  { "qmax", "-1" },
622  { "qdiff", "-1" },
623  { "qblur", "-1" },
624  { "qcomp", "-1" },
625  { "refs", "-1" },
626  { "sc_threshold", "-1" },
627  { "trellis", "-1" },
628  { "nr", "-1" },
629  { "me_range", "-1" },
630  { "me_method", "-1" },
631  { "subq", "-1" },
632  { "b_strategy", "-1" },
633  { "keyint_min", "-1" },
634  { "coder", "-1" },
635  { "cmp", "-1" },
636  { "threads", AV_STRINGIFY(X264_THREADS_AUTO) },
637  { "thread_type", "0" },
638  { "flags", "+cgop" },
639  { "rc_init_occupancy","-1" },
640  { NULL },
641 };
642 
644  .name = "libx264",
645  .long_name = NULL_IF_CONFIG_SMALL("libx264 H.264 / AVC / MPEG-4 AVC / MPEG-4 part 10"),
646  .type = AVMEDIA_TYPE_VIDEO,
647  .id = AV_CODEC_ID_H264,
648  .priv_data_size = sizeof(X264Context),
649  .init = X264_init,
650  .encode2 = X264_frame,
651  .close = X264_close,
652  .capabilities = CODEC_CAP_DELAY | CODEC_CAP_AUTO_THREADS,
653  .priv_class = &class,
654  .defaults = x264_defaults,
655  .init_static_data = X264_init_static,
656 };
static int convert_pix_fmt(enum AVPixelFormat pix_fmt)
Definition: libx264.c:253
void * av_malloc(size_t size)
Allocate a block of size bytes with alignment suitable for all memory accesses (including vectors if ...
Definition: mem.c:62
Views are packed per line, as if interlaced.
Definition: stereo3d.h:94
char * partitions
Definition: libx264.c:74
int size
This structure describes decoded (raw) audio or video data.
Definition: frame.h:107
int dct8x8
Definition: libx264.c:68
AVOption.
Definition: opt.h:233
Views are alternated temporally.
Definition: stereo3d.h:63
#define CODEC_FLAG_PASS2
Use internal 2pass ratecontrol in second pass mode.
Definition: avcodec.h:669
AVCodec ff_libx264_encoder
Definition: libx264.c:643
float qblur
amount of qscale smoothing over time (0.0-1.0)
Definition: avcodec.h:2054
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:70
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:129
memory handling functions
#define CODEC_FLAG_PASS1
Use internal 2pass ratecontrol in first pass mode.
Definition: avcodec.h:668
AVFrame * coded_frame
the picture in the bitstream
Definition: avcodec.h:2506
int max_b_frames
maximum number of B-frames between non-B-frames Note: The output will be delayed by max_b_frames+1 re...
Definition: avcodec.h:1302
int rc_initial_buffer_occupancy
Number of bits which should be loaded into the rc buffer before decoding starts.
Definition: avcodec.h:2152
int num
numerator
Definition: rational.h:44
enhanced predictive zonal search
Definition: avcodec.h:528
AVRational sample_aspect_ratio
sample aspect ratio (0 if unknown) That is the width of a pixel divided by the height of the pixel...
Definition: avcodec.h:1422
enum AVPixelFormat pix_fmt
Pixel format, see AV_PIX_FMT_xxx.
Definition: avcodec.h:1247
int bluray_compat
Definition: libx264.c:64
static void X264_log(void *p, int level, const char *fmt, va_list args)
Definition: libx264.c:82
AVDictionaryEntry * av_dict_get(AVDictionary *m, const char *key, const AVDictionaryEntry *prev, int flags)
Get a dictionary entry with matching key.
Definition: dict.c:39
AVCodec.
Definition: avcodec.h:2755
static av_cold int X264_init(AVCodecContext *avctx)
Definition: libx264.c:278
int scenechange_threshold
scene change detection threshold 0 is default, larger means fewer detected scene changes.
Definition: avcodec.h:1596
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented...
Definition: avcodec.h:1173
void av_freep(void *arg)
Free a memory block which has been allocated with av_malloc(z)() or av_realloc() and set the pointer ...
Definition: mem.c:198
AVFrameSideData * av_frame_get_side_data(const AVFrame *frame, enum AVFrameSideDataType type)
Definition: frame.c:469
x264_param_t params
Definition: libx264.c:43
#define CODEC_FLAG_PSNR
error[?] variables will be set during encoding.
Definition: avcodec.h:678
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
Definition: log.h:38
uint8_t
#define av_cold
Definition: attributes.h:66
AVFrame * av_frame_alloc(void)
Allocate an AVFrame and set its fields to default values.
Definition: frame.c:43
AVOptions.
Stereo 3D type: this structure describes how two videos are packed within a single video surface...
Definition: stereo3d.h:120
int me_range
maximum motion estimation search range in subpel units If 0 then no limit.
Definition: avcodec.h:1529
#define CODEC_FLAG_GLOBAL_HEADER
Place global headers in extradata instead of every keyframe.
Definition: avcodec.h:684
float b_quant_factor
qscale factor between IP and B-frames If > 0 then the last P-frame quantizer will be used (q= lastp_q...
Definition: avcodec.h:1311
int64_t pts
Presentation timestamp in time_base units (time when frame should be shown to user).
Definition: frame.h:183
uint8_t * extradata
some codecs need / can use extradata like Huffman tables.
Definition: avcodec.h:1162
int me_cmp
motion estimation comparison function
Definition: avcodec.h:1429
int coder_type
coder type
Definition: avcodec.h:2164
uint8_t * data
Definition: avcodec.h:973
int b_pyramid
Definition: libx264.c:66
x264_picture_t pic
Definition: libx264.c:45
float cplxblur
Definition: libx264.c:73
#define FF_CMP_CHROMA
Definition: avcodec.h:1461
char * stats
Definition: libx264.c:77
int intra_refresh
Definition: libx264.c:63
#define AV_PIX_FMT_NV20
Definition: pixfmt.h:246
int rc_lookahead
Definition: libx264.c:59
hexagon based search
Definition: avcodec.h:530
#define AV_PKT_FLAG_KEY
The packet contains a keyframe.
Definition: avcodec.h:1023
int chromaoffset
chroma qp offset from luma
Definition: avcodec.h:1704
#define CODEC_FLAG_LOOP_FILTER
loop filter
Definition: avcodec.h:688
static enum AVPixelFormat pix_fmts_10bit[]
Definition: libx264.c:534
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:123
int has_b_frames
Size of the frame reordering buffer in the decoder.
Definition: avcodec.h:1332
void av_free(void *ptr)
Free a memory block which has been allocated with av_malloc(z)() or av_realloc(). ...
Definition: mem.c:186
static const AVCodecDefault defaults[]
Definition: libspeexenc.c:345
#define CODEC_CAP_DELAY
Encoder or decoder requires flushing with NULL input at the end in order to give the complete and cor...
Definition: avcodec.h:740
#define AVERROR(e)
Definition: error.h:43
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
Definition: frame.c:55
int qmax
maximum quantizer
Definition: avcodec.h:2068
char * profile
Definition: libx264.c:50
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
Definition: internal.h:142
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
Definition: log.h:144
int fastfirstpass
Definition: libx264.c:51
void av_dict_free(AVDictionary **pm)
Free all the memory allocated for an AVDictionary struct and all keys and values. ...
Definition: dict.c:159
int flags
CODEC_FLAG_*.
Definition: avcodec.h:1142
planar YUV 4:2:0, 12bpp, 1 plane for Y and 1 plane for the UV components, which are interleaved (firs...
Definition: pixfmt.h:92
int rc_max_rate
maximum bitrate
Definition: avcodec.h:2115
void av_log(void *avcl, int level, const char *fmt,...)
Definition: log.c:148
int mbtree
Definition: libx264.c:71
const char * name
Name of the codec implementation.
Definition: avcodec.h:2762
float i_quant_factor
qscale factor between P and I-frames If > 0 then the last p frame quantizer will be used (q= lastp_q*...
Definition: avcodec.h:1348
#define AV_PIX_FMT_YUV444P10
Definition: pixfmt.h:226
char * deblock
Definition: libx264.c:72
transformed exhaustive search algorithm
Definition: avcodec.h:532
int flags
A combination of AV_PKT_FLAG values.
Definition: avcodec.h:979
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Definition: pixfmt.h:69
int rc_buffer_size
decoder bitstream buffer size
Definition: avcodec.h:2093
common internal API header
char * psy_rd
Definition: libx264.c:57
int refs
number of reference frames
Definition: avcodec.h:1697
static enum AVPixelFormat pix_fmts_9bit[]
Definition: libx264.c:529
#define PARSE_X264_OPT(name, var)
Definition: libx264.c:272
int bit_rate
the average bitrate
Definition: avcodec.h:1112
enum AVPixelFormat * pix_fmts
array of supported pixel formats, or NULL if unknown, array is terminated by -1
Definition: avcodec.h:2776
enum AVPictureType pict_type
Picture type of the frame.
Definition: frame.h:168
planar YUV 4:2:0, 12bpp, full scale (JPEG), deprecated in favor of PIX_FMT_YUV420P and setting color_...
Definition: pixfmt.h:77
int width
picture width / height.
Definition: avcodec.h:1217
int cqp
Definition: libx264.c:54
x264_t * enc
Definition: libx264.c:44
#define CODEC_CAP_AUTO_THREADS
Codec supports avctx->thread_count == 0 (auto).
Definition: avcodec.h:794
int b_frame_strategy
Definition: avcodec.h:1317
#define FF_THREAD_SLICE
Decode more than one part of a single frame at once.
Definition: avcodec.h:2526
int level
level
Definition: avcodec.h:2679
int quality
quality (between 1 (good) and FF_LAMBDA_MAX (bad))
Definition: frame.h:207
int ff_alloc_packet(AVPacket *avpkt, int size)
Check AVPacket size and/or allocate data.
Definition: utils.c:1125
#define CODEC_FLAG_INTERLACED_DCT
Use interlaced DCT.
Definition: avcodec.h:682
int slice_max_size
Definition: libx264.c:76
int nal_hrd
Definition: libx264.c:78
int max_qdiff
maximum quantizer difference between frames
Definition: avcodec.h:2075
enum AVPixelFormat pix_fmt
Definition: movenc.c:821
int weightp
Definition: libx264.c:60
#define AV_PIX_FMT_YUV444P9
Definition: pixfmt.h:223
LIBAVUTIL_VERSION_INT
Definition: eval.c:55
char * x264_params
Definition: libx264.c:79
int thread_count
thread count is used to decide how many independent tasks should be passed to execute() ...
Definition: avcodec.h:2514
static enum AVPixelFormat pix_fmts_8bit[]
Definition: libx264.c:520
static const AVCodecDefault x264_defaults[]
Definition: libx264.c:615
int av_dict_parse_string(AVDictionary **pm, const char *str, const char *key_val_sep, const char *pairs_sep, int flags)
Parse the key/value pairs list and add to a dictionary.
Definition: dict.c:136
NULL
Definition: eval.c:55
enum AVStereo3DType type
How views are packed within the video.
Definition: stereo3d.h:124
#define AV_LOG_INFO
Standard information.
Definition: log.h:134
Libavcodec external API header.
static av_cold int X264_close(AVCodecContext *avctx)
Definition: libx264.c:238
int linesize[AV_NUM_DATA_POINTERS]
For video, size in bytes of each picture line.
Definition: frame.h:125
av_default_item_name
Definition: dnxhdenc.c:45
main external API structure.
Definition: avcodec.h:1054
static void close(AVCodecParserContext *s)
Definition: h264_parser.c:489
static const AVOption options[]
Definition: libx264.c:554
int qmin
minimum quantizer
Definition: avcodec.h:2061
uint8_t * data
Definition: frame.h:76
#define FF_CODER_TYPE_AC
Definition: avcodec.h:2155
int extradata_size
Definition: avcodec.h:1163
#define AV_PIX_FMT_YUV420P10
Definition: pixfmt.h:224
float crf
Definition: libx264.c:52
int aq_mode
Definition: libx264.c:55
int aud
Definition: libx264.c:70
#define AV_STRINGIFY(s)
Definition: macros.h:36
Describe the class of an AVClass context structure.
Definition: log.h:33
uint8_t * sei
Definition: libx264.c:46
void av_vlog(void *avcl, int level, const char *fmt, va_list vl)
Send the specified message to the log if the level is less than or equal to the current av_log_level...
Definition: log.c:160
int psy
Definition: libx264.c:58
#define AV_PIX_FMT_YUV420P9
Definition: pixfmt.h:221
float qcompress
amount of qscale change between easy & hard scenes (0.0-1.0)
Definition: avcodec.h:2053
int sei_size
Definition: libx264.c:47
#define CODEC_FLAG_CLOSED_GOP
Definition: avcodec.h:690
char * preset
Definition: libx264.c:48
Views are on top of each other.
Definition: stereo3d.h:52
#define AV_PIX_FMT_YUV422P10
Definition: pixfmt.h:225
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: frame.h:113
uint8_t level
Definition: svq3.c:143
int b_bias
Definition: libx264.c:65
int fast_pskip
Definition: libx264.c:69
int noise_reduction
noise reduction strength
Definition: avcodec.h:1603
Views are next to each other.
Definition: stereo3d.h:42
int gop_size
the number of pictures in a group of pictures, or 0 for intra_only
Definition: avcodec.h:1238
static av_cold void X264_init_static(AVCodec *codec)
Definition: libx264.c:542
int mixed_refs
Definition: libx264.c:67
char * tune
Definition: libx264.c:49
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:65
#define VE
Definition: libx264.c:553
int weightb
Definition: libx264.c:61
float aq_strength
Definition: libx264.c:56
common internal API header.
Bi-dir predicted.
Definition: avutil.h:255
char * key
Definition: dict.h:75
int den
denominator
Definition: rational.h:45
interleaved chroma YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Definition: pixfmt.h:190
static av_cold int init(AVCodecParserContext *s)
Definition: h264_parser.c:498
int trellis
trellis RD quantization
Definition: avcodec.h:2220
int slices
Number of slices.
Definition: avcodec.h:1770
void * priv_data
Definition: avcodec.h:1090
Definition: h264.h:107
char * value
Definition: dict.h:76
int top_field_first
If the content is interlaced, is top field displayed first.
Definition: frame.h:297
uneven multi-hexagon search
Definition: avcodec.h:531
Views are packed in a checkerboard-like structure per pixel.
Definition: stereo3d.h:73
Views are packed per column.
Definition: stereo3d.h:104
int ssim
Definition: libx264.c:62
#define FF_QP2LAMBDA
factor to convert from H.263 QP to lambda
Definition: avutil.h:207
int64_t dts
Decompression timestamp in AVStream->time_base units; the time at which the packet is decompressed...
Definition: avcodec.h:972
float crf_max
Definition: libx264.c:53
#define OFFSET(x)
Definition: libx264.c:552
int direct_pred
Definition: libx264.c:75
#define AV_DICT_IGNORE_SUFFIX
Definition: dict.h:62
static int X264_frame(AVCodecContext *ctx, AVPacket *pkt, const AVFrame *frame, int *got_packet)
Definition: libx264.c:131
int me_method
Motion estimation algorithm used for video coding.
Definition: avcodec.h:1256
Stereoscopic 3D metadata.
Definition: frame.h:62
AVPixelFormat
Pixel format.
Definition: pixfmt.h:63
This structure stores compressed data.
Definition: avcodec.h:950
int me_subpel_quality
subpel ME quality
Definition: avcodec.h:1503
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will b...
Definition: avcodec.h:966
Predicted.
Definition: avutil.h:254
int thread_type
Which multithreading methods to use.
Definition: avcodec.h:2524
int keyint_min
minimum GOP size
Definition: avcodec.h:1690
static int encode_nals(AVCodecContext *ctx, AVPacket *pkt, x264_nal_t *nals, int nnal)
Definition: libx264.c:98