libx264.c
Go to the documentation of this file.
1 /*
2  * H.264 encoding using the x264 library
3  * Copyright (C) 2005 Mans Rullgard <mans@mansr.com>
4  *
5  * This file is part of Libav.
6  *
7  * Libav is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * Libav is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with Libav; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include "libavutil/internal.h"
23 #include "libavutil/opt.h"
24 #include "libavutil/mem.h"
25 #include "libavutil/pixdesc.h"
26 #include "avcodec.h"
27 #include "internal.h"
28 #include <x264.h>
29 #include <float.h>
30 #include <math.h>
31 #include <stdio.h>
32 #include <stdlib.h>
33 #include <string.h>
34 
35 typedef struct X264Context {
36  AVClass *class;
37  x264_param_t params;
38  x264_t *enc;
39  x264_picture_t pic;
41  int sei_size;
43  char *preset;
44  char *tune;
45  char *profile;
47  float crf;
48  float crf_max;
49  int cqp;
50  int aq_mode;
51  float aq_strength;
52  char *psy_rd;
53  int psy;
55  int weightp;
56  int weightb;
57  int ssim;
59  int b_bias;
60  int b_pyramid;
62  int dct8x8;
64  int aud;
65  int mbtree;
66  char *deblock;
67  float cplxblur;
68  char *partitions;
71  char *stats;
72  int nal_hrd;
73 } X264Context;
74 
75 static void X264_log(void *p, int level, const char *fmt, va_list args)
76 {
77  static const int level_map[] = {
78  [X264_LOG_ERROR] = AV_LOG_ERROR,
79  [X264_LOG_WARNING] = AV_LOG_WARNING,
80  [X264_LOG_INFO] = AV_LOG_INFO,
81  [X264_LOG_DEBUG] = AV_LOG_DEBUG
82  };
83 
84  if (level < 0 || level > X264_LOG_DEBUG)
85  return;
86 
87  av_vlog(p, level_map[level], fmt, args);
88 }
89 
90 
91 static int encode_nals(AVCodecContext *ctx, AVPacket *pkt,
92  x264_nal_t *nals, int nnal)
93 {
94  X264Context *x4 = ctx->priv_data;
95  uint8_t *p;
96  int i, size = x4->sei_size, ret;
97 
98  if (!nnal)
99  return 0;
100 
101  for (i = 0; i < nnal; i++)
102  size += nals[i].i_payload;
103 
104  if ((ret = ff_alloc_packet(pkt, size)) < 0)
105  return ret;
106 
107  p = pkt->data;
108 
109  /* Write the SEI as part of the first frame. */
110  if (x4->sei_size > 0 && nnal > 0) {
111  memcpy(p, x4->sei, x4->sei_size);
112  p += x4->sei_size;
113  x4->sei_size = 0;
114  }
115 
116  for (i = 0; i < nnal; i++){
117  memcpy(p, nals[i].p_payload, nals[i].i_payload);
118  p += nals[i].i_payload;
119  }
120 
121  return 1;
122 }
123 
124 static int X264_frame(AVCodecContext *ctx, AVPacket *pkt, const AVFrame *frame,
125  int *got_packet)
126 {
127  X264Context *x4 = ctx->priv_data;
128  x264_nal_t *nal;
129  int nnal, i, ret;
130  x264_picture_t pic_out;
131 
132  x264_picture_init( &x4->pic );
133  x4->pic.img.i_csp = x4->params.i_csp;
134  if (x264_bit_depth > 8)
135  x4->pic.img.i_csp |= X264_CSP_HIGH_DEPTH;
136  x4->pic.img.i_plane = 3;
137 
138  if (frame) {
139  for (i = 0; i < 3; i++) {
140  x4->pic.img.plane[i] = frame->data[i];
141  x4->pic.img.i_stride[i] = frame->linesize[i];
142  }
143 
144  x4->pic.i_pts = frame->pts;
145  x4->pic.i_type =
146  frame->pict_type == AV_PICTURE_TYPE_I ? X264_TYPE_KEYFRAME :
147  frame->pict_type == AV_PICTURE_TYPE_P ? X264_TYPE_P :
148  frame->pict_type == AV_PICTURE_TYPE_B ? X264_TYPE_B :
149  X264_TYPE_AUTO;
150  if (x4->params.b_tff != frame->top_field_first) {
151  x4->params.b_tff = frame->top_field_first;
152  x264_encoder_reconfig(x4->enc, &x4->params);
153  }
154  if (x4->params.vui.i_sar_height != ctx->sample_aspect_ratio.den ||
155  x4->params.vui.i_sar_width != ctx->sample_aspect_ratio.num) {
156  x4->params.vui.i_sar_height = ctx->sample_aspect_ratio.den;
157  x4->params.vui.i_sar_width = ctx->sample_aspect_ratio.num;
158  x264_encoder_reconfig(x4->enc, &x4->params);
159  }
160  }
161 
162  do {
163  if (x264_encoder_encode(x4->enc, &nal, &nnal, frame? &x4->pic: NULL, &pic_out) < 0)
164  return -1;
165 
166  ret = encode_nals(ctx, pkt, nal, nnal);
167  if (ret < 0)
168  return -1;
169  } while (!ret && !frame && x264_encoder_delayed_frames(x4->enc));
170 
171  pkt->pts = pic_out.i_pts;
172  pkt->dts = pic_out.i_dts;
173 
174  switch (pic_out.i_type) {
175  case X264_TYPE_IDR:
176  case X264_TYPE_I:
178  break;
179  case X264_TYPE_P:
181  break;
182  case X264_TYPE_B:
183  case X264_TYPE_BREF:
185  break;
186  }
187 
188  pkt->flags |= AV_PKT_FLAG_KEY*pic_out.b_keyframe;
189  if (ret)
190  x4->out_pic.quality = (pic_out.i_qpplus1 - 1) * FF_QP2LAMBDA;
191 
192  *got_packet = ret;
193  return 0;
194 }
195 
197 {
198  X264Context *x4 = avctx->priv_data;
199 
200  av_freep(&avctx->extradata);
201  av_free(x4->sei);
202 
203  if (x4->enc)
204  x264_encoder_close(x4->enc);
205 
206  return 0;
207 }
208 
210 {
211  switch (pix_fmt) {
212  case AV_PIX_FMT_YUV420P:
213  case AV_PIX_FMT_YUVJ420P:
214  case AV_PIX_FMT_YUV420P9:
215  case AV_PIX_FMT_YUV420P10: return X264_CSP_I420;
216  case AV_PIX_FMT_YUV422P:
217  case AV_PIX_FMT_YUV422P10: return X264_CSP_I422;
218  case AV_PIX_FMT_YUV444P:
219  case AV_PIX_FMT_YUV444P9:
220  case AV_PIX_FMT_YUV444P10: return X264_CSP_I444;
221  };
222  return 0;
223 }
224 
/*
 * Hand the string option x4->var to x264_param_parse() under the x264 option
 * name `name`; a NULL string is skipped. On a parse error the message is
 * logged and the ENCLOSING function returns AVERROR(EINVAL).
 *
 * Expects `x4` (X264Context *) and `avctx` (AVCodecContext *) in scope.
 * Wrapped in do { } while (0) so that it behaves as one statement.
 */
#define PARSE_X264_OPT(name, var)\
    do {\
        if (x4->var && x264_param_parse(&x4->params, name, x4->var) < 0) {\
            av_log(avctx, AV_LOG_ERROR, "Error parsing option '%s' with value '%s'.\n", name, x4->var);\
            return AVERROR(EINVAL);\
        }\
    } while (0)
230 
231 static av_cold int X264_init(AVCodecContext *avctx)
232 {
233  X264Context *x4 = avctx->priv_data;
234 
235  x264_param_default(&x4->params);
236 
237  x4->params.b_deblocking_filter = avctx->flags & CODEC_FLAG_LOOP_FILTER;
238 
239  if (x4->preset || x4->tune)
240  if (x264_param_default_preset(&x4->params, x4->preset, x4->tune) < 0) {
241  av_log(avctx, AV_LOG_ERROR, "Error setting preset/tune %s/%s.\n", x4->preset, x4->tune);
242  return AVERROR(EINVAL);
243  }
244 
245  if (avctx->level > 0)
246  x4->params.i_level_idc = avctx->level;
247 
248  x4->params.pf_log = X264_log;
249  x4->params.p_log_private = avctx;
250  x4->params.i_log_level = X264_LOG_DEBUG;
251  x4->params.i_csp = convert_pix_fmt(avctx->pix_fmt);
252 
253  if (avctx->bit_rate) {
254  x4->params.rc.i_bitrate = avctx->bit_rate / 1000;
255  x4->params.rc.i_rc_method = X264_RC_ABR;
256  }
257  x4->params.rc.i_vbv_buffer_size = avctx->rc_buffer_size / 1000;
258  x4->params.rc.i_vbv_max_bitrate = avctx->rc_max_rate / 1000;
259  x4->params.rc.b_stat_write = avctx->flags & CODEC_FLAG_PASS1;
260  if (avctx->flags & CODEC_FLAG_PASS2) {
261  x4->params.rc.b_stat_read = 1;
262  } else {
263  if (x4->crf >= 0) {
264  x4->params.rc.i_rc_method = X264_RC_CRF;
265  x4->params.rc.f_rf_constant = x4->crf;
266  } else if (x4->cqp >= 0) {
267  x4->params.rc.i_rc_method = X264_RC_CQP;
268  x4->params.rc.i_qp_constant = x4->cqp;
269  }
270 
271  if (x4->crf_max >= 0)
272  x4->params.rc.f_rf_constant_max = x4->crf_max;
273  }
274 
275  if (avctx->rc_buffer_size && avctx->rc_initial_buffer_occupancy > 0 &&
276  (avctx->rc_initial_buffer_occupancy <= avctx->rc_buffer_size)) {
277  x4->params.rc.f_vbv_buffer_init =
278  (float)avctx->rc_initial_buffer_occupancy / avctx->rc_buffer_size;
279  }
280 
281  x4->params.rc.f_ip_factor = 1 / fabs(avctx->i_quant_factor);
282  x4->params.rc.f_pb_factor = avctx->b_quant_factor;
283  x4->params.analyse.i_chroma_qp_offset = avctx->chromaoffset;
284 
285  if (avctx->me_method == ME_EPZS)
286  x4->params.analyse.i_me_method = X264_ME_DIA;
287  else if (avctx->me_method == ME_HEX)
288  x4->params.analyse.i_me_method = X264_ME_HEX;
289  else if (avctx->me_method == ME_UMH)
290  x4->params.analyse.i_me_method = X264_ME_UMH;
291  else if (avctx->me_method == ME_FULL)
292  x4->params.analyse.i_me_method = X264_ME_ESA;
293  else if (avctx->me_method == ME_TESA)
294  x4->params.analyse.i_me_method = X264_ME_TESA;
295 
296  if (avctx->gop_size >= 0)
297  x4->params.i_keyint_max = avctx->gop_size;
298  if (avctx->max_b_frames >= 0)
299  x4->params.i_bframe = avctx->max_b_frames;
300  if (avctx->scenechange_threshold >= 0)
301  x4->params.i_scenecut_threshold = avctx->scenechange_threshold;
302  if (avctx->qmin >= 0)
303  x4->params.rc.i_qp_min = avctx->qmin;
304  if (avctx->qmax >= 0)
305  x4->params.rc.i_qp_max = avctx->qmax;
306  if (avctx->max_qdiff >= 0)
307  x4->params.rc.i_qp_step = avctx->max_qdiff;
308  if (avctx->qblur >= 0)
309  x4->params.rc.f_qblur = avctx->qblur; /* temporally blur quants */
310  if (avctx->qcompress >= 0)
311  x4->params.rc.f_qcompress = avctx->qcompress; /* 0.0 => cbr, 1.0 => constant qp */
312  if (avctx->refs >= 0)
313  x4->params.i_frame_reference = avctx->refs;
314  if (avctx->trellis >= 0)
315  x4->params.analyse.i_trellis = avctx->trellis;
316  if (avctx->me_range >= 0)
317  x4->params.analyse.i_me_range = avctx->me_range;
318  if (avctx->noise_reduction >= 0)
319  x4->params.analyse.i_noise_reduction = avctx->noise_reduction;
320  if (avctx->me_subpel_quality >= 0)
321  x4->params.analyse.i_subpel_refine = avctx->me_subpel_quality;
322  if (avctx->b_frame_strategy >= 0)
323  x4->params.i_bframe_adaptive = avctx->b_frame_strategy;
324  if (avctx->keyint_min >= 0)
325  x4->params.i_keyint_min = avctx->keyint_min;
326  if (avctx->coder_type >= 0)
327  x4->params.b_cabac = avctx->coder_type == FF_CODER_TYPE_AC;
328  if (avctx->me_cmp >= 0)
329  x4->params.analyse.b_chroma_me = avctx->me_cmp & FF_CMP_CHROMA;
330 
331  if (x4->aq_mode >= 0)
332  x4->params.rc.i_aq_mode = x4->aq_mode;
333  if (x4->aq_strength >= 0)
334  x4->params.rc.f_aq_strength = x4->aq_strength;
335  PARSE_X264_OPT("psy-rd", psy_rd);
336  PARSE_X264_OPT("deblock", deblock);
337  PARSE_X264_OPT("partitions", partitions);
338  PARSE_X264_OPT("stats", stats);
339  if (x4->psy >= 0)
340  x4->params.analyse.b_psy = x4->psy;
341  if (x4->rc_lookahead >= 0)
342  x4->params.rc.i_lookahead = x4->rc_lookahead;
343  if (x4->weightp >= 0)
344  x4->params.analyse.i_weighted_pred = x4->weightp;
345  if (x4->weightb >= 0)
346  x4->params.analyse.b_weighted_bipred = x4->weightb;
347  if (x4->cplxblur >= 0)
348  x4->params.rc.f_complexity_blur = x4->cplxblur;
349 
350  if (x4->ssim >= 0)
351  x4->params.analyse.b_ssim = x4->ssim;
352  if (x4->intra_refresh >= 0)
353  x4->params.b_intra_refresh = x4->intra_refresh;
354  if (x4->b_bias != INT_MIN)
355  x4->params.i_bframe_bias = x4->b_bias;
356  if (x4->b_pyramid >= 0)
357  x4->params.i_bframe_pyramid = x4->b_pyramid;
358  if (x4->mixed_refs >= 0)
359  x4->params.analyse.b_mixed_references = x4->mixed_refs;
360  if (x4->dct8x8 >= 0)
361  x4->params.analyse.b_transform_8x8 = x4->dct8x8;
362  if (x4->fast_pskip >= 0)
363  x4->params.analyse.b_fast_pskip = x4->fast_pskip;
364  if (x4->aud >= 0)
365  x4->params.b_aud = x4->aud;
366  if (x4->mbtree >= 0)
367  x4->params.rc.b_mb_tree = x4->mbtree;
368  if (x4->direct_pred >= 0)
369  x4->params.analyse.i_direct_mv_pred = x4->direct_pred;
370 
371  if (x4->slice_max_size >= 0)
372  x4->params.i_slice_max_size = x4->slice_max_size;
373 
374  if (x4->fastfirstpass)
375  x264_param_apply_fastfirstpass(&x4->params);
376 
377  if (x4->nal_hrd >= 0)
378  x4->params.i_nal_hrd = x4->nal_hrd;
379 
380  if (x4->profile)
381  if (x264_param_apply_profile(&x4->params, x4->profile) < 0) {
382  av_log(avctx, AV_LOG_ERROR, "Error setting profile %s.\n", x4->profile);
383  return AVERROR(EINVAL);
384  }
385 
386  x4->params.i_width = avctx->width;
387  x4->params.i_height = avctx->height;
388  x4->params.vui.i_sar_width = avctx->sample_aspect_ratio.num;
389  x4->params.vui.i_sar_height = avctx->sample_aspect_ratio.den;
390  x4->params.i_fps_num = x4->params.i_timebase_den = avctx->time_base.den;
391  x4->params.i_fps_den = x4->params.i_timebase_num = avctx->time_base.num;
392 
393  x4->params.analyse.b_psnr = avctx->flags & CODEC_FLAG_PSNR;
394 
395  x4->params.i_threads = avctx->thread_count;
396  if (avctx->thread_type)
397  x4->params.b_sliced_threads = avctx->thread_type == FF_THREAD_SLICE;
398 
399  x4->params.b_interlaced = avctx->flags & CODEC_FLAG_INTERLACED_DCT;
400 
401  x4->params.b_open_gop = !(avctx->flags & CODEC_FLAG_CLOSED_GOP);
402 
403  x4->params.i_slice_count = avctx->slices;
404 
405  x4->params.vui.b_fullrange = avctx->pix_fmt == AV_PIX_FMT_YUVJ420P;
406 
407  if (avctx->flags & CODEC_FLAG_GLOBAL_HEADER)
408  x4->params.b_repeat_headers = 0;
409 
410  // update AVCodecContext with x264 parameters
411  avctx->has_b_frames = x4->params.i_bframe ?
412  x4->params.i_bframe_pyramid ? 2 : 1 : 0;
413  if (avctx->max_b_frames < 0)
414  avctx->max_b_frames = 0;
415 
416  avctx->bit_rate = x4->params.rc.i_bitrate*1000;
417 
418  x4->enc = x264_encoder_open(&x4->params);
419  if (!x4->enc)
420  return -1;
421 
422  avctx->coded_frame = &x4->out_pic;
423 
424  if (avctx->flags & CODEC_FLAG_GLOBAL_HEADER) {
425  x264_nal_t *nal;
426  uint8_t *p;
427  int nnal, s, i;
428 
429  s = x264_encoder_headers(x4->enc, &nal, &nnal);
430  avctx->extradata = p = av_malloc(s);
431 
432  for (i = 0; i < nnal; i++) {
433  /* Don't put the SEI in extradata. */
434  if (nal[i].i_type == NAL_SEI) {
435  av_log(avctx, AV_LOG_INFO, "%s\n", nal[i].p_payload+25);
436  x4->sei_size = nal[i].i_payload;
437  x4->sei = av_malloc(x4->sei_size);
438  memcpy(x4->sei, nal[i].p_payload, nal[i].i_payload);
439  continue;
440  }
441  memcpy(p, nal[i].p_payload, nal[i].i_payload);
442  p += nal[i].i_payload;
443  }
444  avctx->extradata_size = p - avctx->extradata;
445  }
446 
447  return 0;
448 }
449 
450 static const enum AVPixelFormat pix_fmts_8bit[] = {
456 };
457 static const enum AVPixelFormat pix_fmts_9bit[] = {
461 };
462 static const enum AVPixelFormat pix_fmts_10bit[] = {
467 };
468 
469 static av_cold void X264_init_static(AVCodec *codec)
470 {
471  if (x264_bit_depth == 8)
472  codec->pix_fmts = pix_fmts_8bit;
473  else if (x264_bit_depth == 9)
474  codec->pix_fmts = pix_fmts_9bit;
475  else if (x264_bit_depth == 10)
476  codec->pix_fmts = pix_fmts_10bit;
477 }
478 
/* Byte offset of a private option inside X264Context. */
#define OFFSET(x) offsetof(X264Context, x)
/* Flags shared by every option below: video, encoding. Parenthesised so the
 * expansion stays a single operand wherever it is used. */
#define VE (AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM)
481 static const AVOption options[] = {
482  { "preset", "Set the encoding preset (cf. x264 --fullhelp)", OFFSET(preset), AV_OPT_TYPE_STRING, { .str = "medium" }, 0, 0, VE},
483  { "tune", "Tune the encoding params (cf. x264 --fullhelp)", OFFSET(tune), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
484  { "profile", "Set profile restrictions (cf. x264 --fullhelp) ", OFFSET(profile), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
485  { "fastfirstpass", "Use fast settings when encoding first pass", OFFSET(fastfirstpass), AV_OPT_TYPE_INT, { .i64 = 1 }, 0, 1, VE},
486  { "crf", "Select the quality for constant quality mode", OFFSET(crf), AV_OPT_TYPE_FLOAT, {.dbl = -1 }, -1, FLT_MAX, VE },
487  { "crf_max", "In CRF mode, prevents VBV from lowering quality beyond this point.",OFFSET(crf_max), AV_OPT_TYPE_FLOAT, {.dbl = -1 }, -1, FLT_MAX, VE },
488  { "qp", "Constant quantization parameter rate control method",OFFSET(cqp), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE },
489  { "aq-mode", "AQ method", OFFSET(aq_mode), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "aq_mode"},
490  { "none", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_AQ_NONE}, INT_MIN, INT_MAX, VE, "aq_mode" },
491  { "variance", "Variance AQ (complexity mask)", 0, AV_OPT_TYPE_CONST, {.i64 = X264_AQ_VARIANCE}, INT_MIN, INT_MAX, VE, "aq_mode" },
492  { "autovariance", "Auto-variance AQ (experimental)", 0, AV_OPT_TYPE_CONST, {.i64 = X264_AQ_AUTOVARIANCE}, INT_MIN, INT_MAX, VE, "aq_mode" },
493  { "aq-strength", "AQ strength. Reduces blocking and blurring in flat and textured areas.", OFFSET(aq_strength), AV_OPT_TYPE_FLOAT, {.dbl = -1}, -1, FLT_MAX, VE},
494  { "psy", "Use psychovisual optimizations.", OFFSET(psy), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
495  { "psy-rd", "Strength of psychovisual optimization, in <psy-rd>:<psy-trellis> format.", OFFSET(psy_rd), AV_OPT_TYPE_STRING, {0 }, 0, 0, VE},
496  { "rc-lookahead", "Number of frames to look ahead for frametype and ratecontrol", OFFSET(rc_lookahead), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE },
497  { "weightb", "Weighted prediction for B-frames.", OFFSET(weightb), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
498  { "weightp", "Weighted prediction analysis method.", OFFSET(weightp), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "weightp" },
499  { "none", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_WEIGHTP_NONE}, INT_MIN, INT_MAX, VE, "weightp" },
500  { "simple", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_WEIGHTP_SIMPLE}, INT_MIN, INT_MAX, VE, "weightp" },
501  { "smart", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_WEIGHTP_SMART}, INT_MIN, INT_MAX, VE, "weightp" },
502  { "ssim", "Calculate and print SSIM stats.", OFFSET(ssim), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
503  { "intra-refresh", "Use Periodic Intra Refresh instead of IDR frames.",OFFSET(intra_refresh),AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
504  { "b-bias", "Influences how often B-frames are used", OFFSET(b_bias), AV_OPT_TYPE_INT, { .i64 = INT_MIN}, INT_MIN, INT_MAX, VE },
505  { "b-pyramid", "Keep some B-frames as references.", OFFSET(b_pyramid), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "b_pyramid" },
506  { "none", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_B_PYRAMID_NONE}, INT_MIN, INT_MAX, VE, "b_pyramid" },
507  { "strict", "Strictly hierarchical pyramid", 0, AV_OPT_TYPE_CONST, {.i64 = X264_B_PYRAMID_STRICT}, INT_MIN, INT_MAX, VE, "b_pyramid" },
508  { "normal", "Non-strict (not Blu-ray compatible)", 0, AV_OPT_TYPE_CONST, {.i64 = X264_B_PYRAMID_NORMAL}, INT_MIN, INT_MAX, VE, "b_pyramid" },
509  { "mixed-refs", "One reference per partition, as opposed to one reference per macroblock", OFFSET(mixed_refs), AV_OPT_TYPE_INT, { .i64 = -1}, -1, 1, VE },
510  { "8x8dct", "High profile 8x8 transform.", OFFSET(dct8x8), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE},
511  { "fast-pskip", NULL, OFFSET(fast_pskip), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE},
512  { "aud", "Use access unit delimiters.", OFFSET(aud), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE},
513  { "mbtree", "Use macroblock tree ratecontrol.", OFFSET(mbtree), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE},
514  { "deblock", "Loop filter parameters, in <alpha:beta> form.", OFFSET(deblock), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
515  { "cplxblur", "Reduce fluctuations in QP (before curve compression)", OFFSET(cplxblur), AV_OPT_TYPE_FLOAT, {.dbl = -1 }, -1, FLT_MAX, VE},
516  { "partitions", "A comma-separated list of partitions to consider. "
517  "Possible values: p8x8, p4x4, b8x8, i8x8, i4x4, none, all", OFFSET(partitions), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
518  { "direct-pred", "Direct MV prediction mode", OFFSET(direct_pred), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "direct-pred" },
519  { "none", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_NONE }, 0, 0, VE, "direct-pred" },
520  { "spatial", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_SPATIAL }, 0, 0, VE, "direct-pred" },
521  { "temporal", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_TEMPORAL }, 0, 0, VE, "direct-pred" },
522  { "auto", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_AUTO }, 0, 0, VE, "direct-pred" },
523  { "slice-max-size","Limit the size of each slice in bytes", OFFSET(slice_max_size),AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE },
524  { "stats", "Filename for 2 pass stats", OFFSET(stats), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE },
525  { "nal-hrd", "Signal HRD information (requires vbv-bufsize; "
526  "cbr not allowed in .mp4)", OFFSET(nal_hrd), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE, "nal-hrd" },
527  { "none", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_NAL_HRD_NONE}, INT_MIN, INT_MAX, VE, "nal-hrd" },
528  { "vbr", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_NAL_HRD_VBR}, INT_MIN, INT_MAX, VE, "nal-hrd" },
529  { "cbr", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_NAL_HRD_CBR}, INT_MIN, INT_MAX, VE, "nal-hrd" },
530  { NULL },
531 };
532 
533 static const AVClass class = {
534  .class_name = "libx264",
535  .item_name = av_default_item_name,
536  .option = options,
538 };
539 
540 static const AVCodecDefault x264_defaults[] = {
541  { "b", "0" },
542  { "bf", "-1" },
543  { "g", "-1" },
544  { "qmin", "-1" },
545  { "qmax", "-1" },
546  { "qdiff", "-1" },
547  { "qblur", "-1" },
548  { "qcomp", "-1" },
549  { "refs", "-1" },
550  { "sc_threshold", "-1" },
551  { "trellis", "-1" },
552  { "nr", "-1" },
553  { "me_range", "-1" },
554  { "me_method", "-1" },
555  { "subq", "-1" },
556  { "b_strategy", "-1" },
557  { "keyint_min", "-1" },
558  { "coder", "-1" },
559  { "cmp", "-1" },
560  { "threads", AV_STRINGIFY(X264_THREADS_AUTO) },
561  { "thread_type", "0" },
562  { "flags", "+cgop" },
563  { "rc_init_occupancy","-1" },
564  { NULL },
565 };
566 
568  .name = "libx264",
569  .type = AVMEDIA_TYPE_VIDEO,
570  .id = AV_CODEC_ID_H264,
571  .priv_data_size = sizeof(X264Context),
572  .init = X264_init,
573  .encode2 = X264_frame,
574  .close = X264_close,
575  .capabilities = CODEC_CAP_DELAY | CODEC_CAP_AUTO_THREADS,
576  .long_name = NULL_IF_CONFIG_SMALL("libx264 H.264 / AVC / MPEG-4 AVC / MPEG-4 part 10"),
577  .priv_class = &class,
578  .defaults = x264_defaults,
579  .init_static_data = X264_init_static,
580 };
static int convert_pix_fmt(enum AVPixelFormat pix_fmt)
Definition: libx264.c:209
void * av_malloc(size_t size)
Allocate a block of size bytes with alignment suitable for all memory accesses (including vectors if ...
Definition: mem.c:61
char * partitions
Definition: libx264.c:68
int size
This structure describes decoded (raw) audio or video data.
Definition: avcodec.h:989
int dct8x8
Definition: libx264.c:62
AVOption.
Definition: opt.h:233
AVCodec ff_libx264_encoder
Definition: libx264.c:567
float qblur
amount of qscale smoothing over time (0.0-1.0)
Definition: avcodec.h:2278
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:70
memory handling functions
AVFrame * coded_frame
the picture in the bitstream
Definition: avcodec.h:2725
int max_b_frames
maximum number of B-frames between non-B-frames Note: The output will be delayed by max_b_frames+1 re...
Definition: avcodec.h:1588
int rc_initial_buffer_occupancy
Number of bits which should be loaded into the rc buffer before decoding starts.
Definition: avcodec.h:2376
int num
numerator
Definition: rational.h:44
enhanced predictive zonal search
Definition: avcodec.h:517
AVRational sample_aspect_ratio
sample aspect ratio (0 if unknown) That is the width of a pixel divided by the height of the pixel...
Definition: avcodec.h:1724
enum AVPixelFormat pix_fmt
Pixel format, see AV_PIX_FMT_xxx.
Definition: avcodec.h:1533
static void X264_log(void *p, int level, const char *fmt, va_list args)
Definition: libx264.c:75
AVCodec.
Definition: avcodec.h:2960
static av_cold int X264_init(AVCodecContext *avctx)
Definition: libx264.c:231
int scenechange_threshold
scene change detection threshold 0 is default, larger means fewer detected scene changes.
Definition: avcodec.h:1907
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented...
Definition: avcodec.h:1465
void av_freep(void *arg)
Free a memory block which has been allocated with av_malloc(z)() or av_realloc() and set the pointer ...
Definition: mem.c:151
x264_param_t params
Definition: libx264.c:37
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
Definition: log.h:38
uint8_t
AVOptions.
int me_range
maximum motion estimation search range in subpel units If 0 then no limit.
Definition: avcodec.h:1833
float b_quant_factor
qscale factor between IP and B-frames If > 0 then the last P-frame quantizer will be used (q= lastp_q...
Definition: avcodec.h:1597
int64_t pts
presentation timestamp in time_base units (time when frame should be shown to user) If AV_NOPTS_VALUE...
Definition: avcodec.h:1088
uint8_t * extradata
some codecs need / can use extradata like Huffman tables.
Definition: avcodec.h:1454
int me_cmp
motion estimation comparison function
Definition: avcodec.h:1731
int coder_type
coder type
Definition: avcodec.h:2388
uint8_t * data
Definition: avcodec.h:915
int b_pyramid
Definition: libx264.c:60
x264_picture_t pic
Definition: libx264.c:39
float cplxblur
Definition: libx264.c:67
char * stats
Definition: libx264.c:71
int intra_refresh
Definition: libx264.c:58
static int init(AVCodecParserContext *s)
Definition: h264_parser.c:335
int rc_lookahead
Definition: libx264.c:54
hexagon based search
Definition: avcodec.h:519
void av_vlog(void *avcl, int level, const char *fmt, va_list vl)
Definition: log.c:158
int chromaoffset
chroma qp offset from luma
Definition: avcodec.h:2029
static enum AVPixelFormat pix_fmts_10bit[]
Definition: libx264.c:462
int has_b_frames
Size of the frame reordering buffer in the decoder.
Definition: avcodec.h:1634
void av_free(void *ptr)
Free a memory block which has been allocated with av_malloc(z)() or av_realloc(). ...
Definition: mem.c:139
int qmax
maximum quantizer
Definition: avcodec.h:2292
char * profile
Definition: libx264.c:45
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
Definition: internal.h:88
int fastfirstpass
Definition: libx264.c:46
int flags
CODEC_FLAG_*.
Definition: avcodec.h:1434
int rc_max_rate
maximum bitrate
Definition: avcodec.h:2339
void av_log(void *avcl, int level, const char *fmt,...)
Definition: log.c:146
int mbtree
Definition: libx264.c:65
const char * name
Name of the codec implementation.
Definition: avcodec.h:2967
float i_quant_factor
qscale factor between P and I-frames If > 0 then the last p frame quantizer will be used (q= lastp_q*...
Definition: avcodec.h:1650
char * deblock
Definition: libx264.c:66
transformed exhaustive search algorithm
Definition: avcodec.h:522
int flags
A combination of AV_PKT_FLAG values.
Definition: avcodec.h:921
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Definition: pixfmt.h:69
int rc_buffer_size
decoder bitstream buffer size
Definition: avcodec.h:2317
common internal API header
char * psy_rd
Definition: libx264.c:52
int refs
number of reference frames
Definition: avcodec.h:2022
static enum AVPixelFormat pix_fmts_9bit[]
Definition: libx264.c:457
#define PARSE_X264_OPT(name, var)
Definition: libx264.c:225
int bit_rate
the average bitrate
Definition: avcodec.h:1404
enum AVPixelFormat * pix_fmts
array of supported pixel formats, or NULL if unknown, array is terminated by -1
Definition: avcodec.h:2981
enum AVPictureType pict_type
Picture type of the frame, see ?_TYPE below.
Definition: avcodec.h:1065
planar YUV 4:2:0, 12bpp, full scale (JPEG), deprecated in favor of PIX_FMT_YUV420P and setting color_...
Definition: pixfmt.h:77
int width
picture width / height.
Definition: avcodec.h:1508
int cqp
Definition: libx264.c:49
x264_t * enc
Definition: libx264.c:38
int b_frame_strategy
Definition: avcodec.h:1603
int level
level
Definition: avcodec.h:2885
int quality
quality (between 1 (good) and FF_LAMBDA_MAX (bad))
Definition: avcodec.h:1122
int ff_alloc_packet(AVPacket *avpkt, int size)
Check AVPacket size and/or allocate data.
Definition: utils.c:878
int slice_max_size
Definition: libx264.c:70
int nal_hrd
Definition: libx264.c:72
int max_qdiff
maximum quantizer difference between frames
Definition: avcodec.h:2299
enum AVPixelFormat pix_fmt
Definition: movenc.c:801
int weightp
Definition: libx264.c:55
LIBAVUTIL_VERSION_INT
Definition: eval.c:52
int thread_count
thread count is used to decide how many independent tasks should be passed to execute() ...
Definition: avcodec.h:2733
static enum AVPixelFormat pix_fmts_8bit[]
Definition: libx264.c:450
static const AVCodecDefault x264_defaults[]
Definition: libx264.c:540
NULL
Definition: eval.c:52
AVFrame out_pic
Definition: libx264.c:42
external API header
static av_cold int X264_close(AVCodecContext *avctx)
Definition: libx264.c:196
int linesize[AV_NUM_DATA_POINTERS]
Size, in bytes, of the data for each picture/channel plane.
Definition: avcodec.h:1008
av_default_item_name
Definition: dnxhdenc.c:43
main external API structure.
Definition: avcodec.h:1339
static void close(AVCodecParserContext *s)
Definition: h264_parser.c:326
static const AVOption options[]
Definition: libx264.c:481
int qmin
minimum quantizer
Definition: avcodec.h:2285
int extradata_size
Definition: avcodec.h:1455
float crf
Definition: libx264.c:47
int aq_mode
Definition: libx264.c:50
int aud
Definition: libx264.c:64
Describe the class of an AVClass context structure.
Definition: log.h:33
uint8_t * sei
Definition: libx264.c:40
int psy
Definition: libx264.c:53
struct X264Context X264Context
float qcompress
amount of qscale change between easy & hard scenes (0.0-1.0)
Definition: avcodec.h:2277
int sei_size
Definition: libx264.c:41
char * preset
Definition: libx264.c:43
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: avcodec.h:997
uint8_t level
Definition: svq3.c:125
int b_bias
Definition: libx264.c:59
int fast_pskip
Definition: libx264.c:63
int noise_reduction
noise reduction strength
Definition: avcodec.h:1914
int gop_size
the number of pictures in a group of pictures, or 0 for intra_only
Definition: avcodec.h:1524
static av_cold void X264_init_static(AVCodec *codec)
Definition: libx264.c:469
int mixed_refs
Definition: libx264.c:61
char * tune
Definition: libx264.c:44
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:65
#define VE
Definition: libx264.c:480
int weightb
Definition: libx264.c:56
float aq_strength
Definition: libx264.c:51
common internal api header.
Bi-dir predicted.
Definition: avutil.h:247
int den
denominator
Definition: rational.h:45
int trellis
trellis RD quantization
Definition: avcodec.h:2444
int slices
Number of slices.
Definition: avcodec.h:2095
void * priv_data
Definition: avcodec.h:1382
Definition: h264.h:107
int top_field_first
If the content is interlaced, is top field displayed first.
Definition: avcodec.h:1239
uneven multi-hexagon search
Definition: avcodec.h:520
int ssim
Definition: libx264.c:57
int64_t dts
Decompression timestamp in AVStream->time_base units; the time at which the packet is decompressed...
Definition: avcodec.h:914
float crf_max
Definition: libx264.c:48
#define OFFSET(x)
Definition: libx264.c:479
int direct_pred
Definition: libx264.c:69
static int X264_frame(AVCodecContext *ctx, AVPacket *pkt, const AVFrame *frame, int *got_packet)
Definition: libx264.c:124
int me_method
Motion estimation algorithm used for video coding.
Definition: avcodec.h:1542
AVPixelFormat
Pixel format.
Definition: pixfmt.h:63
This structure stores compressed data.
Definition: avcodec.h:898
int me_subpel_quality
subpel ME quality
Definition: avcodec.h:1807
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will b...
Definition: avcodec.h:908
Predicted.
Definition: avutil.h:246
int thread_type
Which multithreading methods to use.
Definition: avcodec.h:2743
int keyint_min
minimum GOP size
Definition: avcodec.h:2015
static int encode_nals(AVCodecContext *ctx, AVPacket *pkt, x264_nal_t *nals, int nnal)
Definition: libx264.c:91