26 #define VPX_DISABLE_CTRL_TYPECHECKS 1
27 #define VPX_CODEC_DISABLE_COMPAT 1
28 #include <vpx/vpx_encoder.h>
29 #include <vpx/vp8cx.h>
72 [VP8E_UPD_ENTROPY] =
"VP8E_UPD_ENTROPY",
73 [VP8E_UPD_REFERENCE] =
"VP8E_UPD_REFERENCE",
74 [VP8E_USE_REFERENCE] =
"VP8E_USE_REFERENCE",
75 [VP8E_SET_ROI_MAP] =
"VP8E_SET_ROI_MAP",
76 [VP8E_SET_ACTIVEMAP] =
"VP8E_SET_ACTIVEMAP",
77 [VP8E_SET_SCALEMODE] =
"VP8E_SET_SCALEMODE",
78 [VP8E_SET_CPUUSED] =
"VP8E_SET_CPUUSED",
79 [VP8E_SET_ENABLEAUTOALTREF] =
"VP8E_SET_ENABLEAUTOALTREF",
80 [VP8E_SET_NOISE_SENSITIVITY] =
"VP8E_SET_NOISE_SENSITIVITY",
81 [VP8E_SET_SHARPNESS] =
"VP8E_SET_SHARPNESS",
82 [VP8E_SET_STATIC_THRESHOLD] =
"VP8E_SET_STATIC_THRESHOLD",
83 [VP8E_SET_TOKEN_PARTITIONS] =
"VP8E_SET_TOKEN_PARTITIONS",
84 [VP8E_GET_LAST_QUANTIZER] =
"VP8E_GET_LAST_QUANTIZER",
85 [VP8E_SET_ARNR_MAXFRAMES] =
"VP8E_SET_ARNR_MAXFRAMES",
86 [VP8E_SET_ARNR_STRENGTH] =
"VP8E_SET_ARNR_STRENGTH",
87 [VP8E_SET_ARNR_TYPE] =
"VP8E_SET_ARNR_TYPE",
88 [VP8E_SET_CQ_LEVEL] =
"VP8E_SET_CQ_LEVEL",
94 const char *error = vpx_codec_error(&ctx->encoder);
95 const char *detail = vpx_codec_error_detail(&ctx->encoder);
103 const struct vpx_codec_enc_cfg *cfg)
108 av_log(avctx, level,
"vpx_codec_enc_cfg\n");
109 av_log(avctx, level,
"generic settings\n"
110 " %*s%u\n %*s%u\n %*s%u\n %*s%u\n %*s%u\n"
111 " %*s{%u/%u}\n %*s%u\n %*s%d\n %*s%u\n",
112 width,
"g_usage:", cfg->g_usage,
113 width,
"g_threads:", cfg->g_threads,
114 width,
"g_profile:", cfg->g_profile,
115 width,
"g_w:", cfg->g_w,
116 width,
"g_h:", cfg->g_h,
117 width,
"g_timebase:", cfg->g_timebase.num, cfg->g_timebase.den,
118 width,
"g_error_resilient:", cfg->g_error_resilient,
119 width,
"g_pass:", cfg->g_pass,
120 width,
"g_lag_in_frames:", cfg->g_lag_in_frames);
121 av_log(avctx, level,
"rate control settings\n"
122 " %*s%u\n %*s%u\n %*s%u\n %*s%u\n"
123 " %*s%d\n %*s%p(%zu)\n %*s%u\n",
124 width,
"rc_dropframe_thresh:", cfg->rc_dropframe_thresh,
125 width,
"rc_resize_allowed:", cfg->rc_resize_allowed,
126 width,
"rc_resize_up_thresh:", cfg->rc_resize_up_thresh,
127 width,
"rc_resize_down_thresh:", cfg->rc_resize_down_thresh,
128 width,
"rc_end_usage:", cfg->rc_end_usage,
129 width,
"rc_twopass_stats_in:", cfg->rc_twopass_stats_in.buf, cfg->rc_twopass_stats_in.sz,
130 width,
"rc_target_bitrate:", cfg->rc_target_bitrate);
131 av_log(avctx, level,
"quantizer settings\n"
133 width,
"rc_min_quantizer:", cfg->rc_min_quantizer,
134 width,
"rc_max_quantizer:", cfg->rc_max_quantizer);
135 av_log(avctx, level,
"bitrate tolerance\n"
137 width,
"rc_undershoot_pct:", cfg->rc_undershoot_pct,
138 width,
"rc_overshoot_pct:", cfg->rc_overshoot_pct);
139 av_log(avctx, level,
"decoder buffer model\n"
140 " %*s%u\n %*s%u\n %*s%u\n",
141 width,
"rc_buf_sz:", cfg->rc_buf_sz,
142 width,
"rc_buf_initial_sz:", cfg->rc_buf_initial_sz,
143 width,
"rc_buf_optimal_sz:", cfg->rc_buf_optimal_sz);
144 av_log(avctx, level,
"2 pass rate control settings\n"
145 " %*s%u\n %*s%u\n %*s%u\n",
146 width,
"rc_2pass_vbr_bias_pct:", cfg->rc_2pass_vbr_bias_pct,
147 width,
"rc_2pass_vbr_minsection_pct:", cfg->rc_2pass_vbr_minsection_pct,
148 width,
"rc_2pass_vbr_maxsection_pct:", cfg->rc_2pass_vbr_maxsection_pct);
149 av_log(avctx, level,
"keyframing settings\n"
150 " %*s%d\n %*s%u\n %*s%u\n",
151 width,
"kf_mode:", cfg->kf_mode,
152 width,
"kf_min_dist:", cfg->kf_min_dist,
153 width,
"kf_max_dist:", cfg->kf_max_dist);
154 av_log(avctx, level,
"\n");
185 enum vp8e_enc_control_id
id,
int val)
192 snprintf(buf,
sizeof(buf),
"%s:",
ctlidstr[
id]);
195 res = vpx_codec_control(&ctx->encoder,
id, val);
196 if (res != VPX_CODEC_OK) {
197 snprintf(buf,
sizeof(buf),
"Failed to set %s codec control",
202 return res == VPX_CODEC_OK ? 0 :
AVERROR(EINVAL);
209 vpx_codec_destroy(&ctx->encoder);
220 const struct vpx_codec_iface *iface = &vpx_codec_vp8_cx_algo;
221 struct vpx_codec_enc_cfg enccfg;
227 if ((res = vpx_codec_enc_config_default(iface, &enccfg, 0)) != VPX_CODEC_OK) {
229 vpx_codec_err_to_string(res));
234 enccfg.g_w = avctx->
width;
235 enccfg.g_h = avctx->
height;
240 if (ctx->lag_in_frames >= 0)
241 enccfg.g_lag_in_frames = ctx->lag_in_frames;
244 enccfg.g_pass = VPX_RC_FIRST_PASS;
246 enccfg.g_pass = VPX_RC_LAST_PASS;
248 enccfg.g_pass = VPX_RC_ONE_PASS;
251 avctx->
bit_rate = enccfg.rc_target_bitrate * 1000;
257 enccfg.rc_end_usage = VPX_CQ;
260 enccfg.rc_end_usage = VPX_CBR;
263 enccfg.rc_min_quantizer = avctx->
qmin;
265 enccfg.rc_max_quantizer = avctx->
qmax;
270 enccfg.rc_2pass_vbr_minsection_pct =
273 enccfg.rc_2pass_vbr_maxsection_pct =
280 enccfg.rc_buf_initial_sz =
282 enccfg.rc_buf_optimal_sz = enccfg.rc_buf_sz * 5 / 6;
288 enccfg.kf_max_dist = avctx->
gop_size;
290 if (enccfg.g_pass == VPX_RC_FIRST_PASS)
291 enccfg.g_lag_in_frames = 0;
292 else if (enccfg.g_pass == VPX_RC_LAST_PASS) {
300 ctx->twopass_stats.sz = strlen(avctx->
stats_in) * 3 / 4;
301 ctx->twopass_stats.buf =
av_malloc(ctx->twopass_stats.sz);
302 if (!ctx->twopass_stats.buf) {
304 "Stat buffer alloc (%zu bytes) failed\n",
305 ctx->twopass_stats.sz);
309 ctx->twopass_stats.sz);
310 if (decode_size < 0) {
315 ctx->twopass_stats.sz = decode_size;
316 enccfg.rc_twopass_stats_in = ctx->twopass_stats;
323 enccfg.g_profile = avctx->
profile;
325 enccfg.g_error_resilient = ctx->error_resilient;
329 res = vpx_codec_enc_init(&ctx->encoder, iface, &enccfg, 0);
330 if (res != VPX_CODEC_OK) {
337 if (ctx->cpu_used != INT_MIN)
339 if (ctx->auto_alt_ref >= 0)
340 codecctl_int(avctx, VP8E_SET_ENABLEAUTOALTREF, ctx->auto_alt_ref);
341 if (ctx->arnr_max_frames >= 0)
342 codecctl_int(avctx, VP8E_SET_ARNR_MAXFRAMES, ctx->arnr_max_frames);
343 if (ctx->arnr_strength >= 0)
344 codecctl_int(avctx, VP8E_SET_ARNR_STRENGTH, ctx->arnr_strength);
345 if (ctx->arnr_type >= 0)
346 codecctl_int(avctx, VP8E_SET_ARNR_TYPE, ctx->arnr_type);
353 vpx_img_wrap(&ctx->rawimg, VPX_IMG_FMT_I420, avctx->
width, avctx->
height, 1,
366 const struct vpx_codec_cx_pkt *src)
368 dst->
pts = src->data.frame.pts;
369 dst->
duration = src->data.frame.duration;
370 dst->
flags = src->data.frame.flags;
371 dst->
sz = src->data.frame.sz;
372 dst->
buf = src->data.frame.buf;
389 coded_frame->
pts = cx_frame->
pts;
399 "Error getting output packet of size %zu.\n", cx_frame->
sz);
417 const struct vpx_codec_cx_pkt *pkt;
418 const void *iter =
NULL;
421 if (ctx->coded_frame_list) {
424 size =
storeframe(avctx, cx_frame, pkt_out, coded_frame);
427 ctx->coded_frame_list = cx_frame->
next;
433 while ((pkt = vpx_codec_get_cx_data(&ctx->encoder, &iter))) {
435 case VPX_CODEC_CX_FRAME_PKT:
441 assert(!ctx->coded_frame_list);
443 size =
storeframe(avctx, &cx_frame, pkt_out, coded_frame);
452 "Frame queue element alloc failed\n");
458 if (!cx_frame->
buf) {
460 "Data buffer alloc (%zu bytes) failed\n",
464 memcpy(cx_frame->
buf, pkt->data.frame.buf, pkt->data.frame.sz);
468 case VPX_CODEC_STATS_PKT: {
469 struct vpx_fixed_buf *stats = &ctx->twopass_stats;
471 stats->sz + pkt->data.twopass_stats.sz);
476 memcpy((
uint8_t*)stats->buf + stats->sz,
477 pkt->data.twopass_stats.buf, pkt->data.twopass_stats.sz);
478 stats->sz += pkt->data.twopass_stats.sz;
481 case VPX_CODEC_PSNR_PKT:
482 case VPX_CODEC_CUSTOM_PKT:
492 const AVFrame *frame,
int *got_packet)
495 struct vpx_image *rawimg =
NULL;
496 int64_t timestamp = 0;
498 vpx_enc_frame_flags_t
flags = 0;
501 rawimg = &ctx->rawimg;
502 rawimg->planes[VPX_PLANE_Y] = frame->
data[0];
503 rawimg->planes[VPX_PLANE_U] = frame->
data[1];
504 rawimg->planes[VPX_PLANE_V] = frame->
data[2];
505 rawimg->stride[VPX_PLANE_Y] = frame->
linesize[0];
506 rawimg->stride[VPX_PLANE_U] = frame->
linesize[1];
507 rawimg->stride[VPX_PLANE_V] = frame->
linesize[2];
508 timestamp = frame->
pts;
510 flags |= VPX_EFLAG_FORCE_KF;
513 res = vpx_codec_encode(&ctx->encoder, rawimg, timestamp,
515 if (res != VPX_CODEC_OK) {
531 ctx->twopass_stats.sz);
534 *got_packet = !!coded_size;
538 #define OFFSET(x) offsetof(VP8Context, x)
539 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
541 {
"cpu-used",
"Quality/Speed ratio modifier",
OFFSET(cpu_used),
AV_OPT_TYPE_INT, {.i64 = INT_MIN}, INT_MIN, INT_MAX,
VE},
542 {
"auto-alt-ref",
"Enable use of alternate reference "
544 {
"lag-in-frames",
"Number of frames to look ahead for "
546 {
"arnr-maxframes",
"altref noise reduction max frame count",
OFFSET(arnr_max_frames),
AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX,
VE},
547 {
"arnr-strength",
"altref noise reduction filter strength",
OFFSET(arnr_strength),
AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX,
VE},
548 {
"arnr-type",
"altref noise reduction filter type",
OFFSET(arnr_type),
AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX,
VE,
"arnr_type"},
552 {
"deadline",
"Time to spend encoding, in microseconds.",
OFFSET(deadline),
AV_OPT_TYPE_INT, {.i64 = VPX_DL_GOOD_QUALITY}, INT_MIN, INT_MAX,
VE,
"quality"},
556 {
"error-resilient",
"Error resilience configuration",
OFFSET(error_resilient),
AV_OPT_TYPE_FLAGS, {.i64 = 0}, INT_MIN, INT_MAX,
VE,
"er"},
557 #ifdef VPX_ERROR_RESILIENT_DEFAULT
558 {
"default",
"Improve resiliency against losses of whole frames", 0,
AV_OPT_TYPE_CONST, {.i64 = VPX_ERROR_RESILIENT_DEFAULT}, 0, 0,
VE,
"er"},
559 {
"partitions",
"The frame partitions are independently decodable "
560 "by the bool decoder, meaning that partitions can be decoded even "
561 "though earlier partitions have been lost. Note that intra predicition"
562 " is still done over the partition boundary.", 0,
AV_OPT_TYPE_CONST, {.i64 = VPX_ERROR_RESILIENT_PARTITIONS}, 0, 0,
VE,
"er"},
579 {
"keyint_min",
"-1" },
594 .priv_class = &
class,
void * av_malloc(size_t size)
Allocate a block of size bytes with alignment suitable for all memory accesses (including vectors if ...
This structure describes decoded (raw) audio or video data.
int64_t av_rescale_rnd(int64_t a, int64_t b, int64_t c, enum AVRounding rnd)
Rescale a 64-bit integer with specified rounding.
AVFrame * coded_frame
the picture in the bitstream
int rc_initial_buffer_occupancy
Number of bits which should be loaded into the rc buffer before decoding starts.
struct FrameListData * coded_frame_list
size_t sz
length of compressed data
AVCodec ff_libvpx_encoder
char * stats_in
pass2 encoding statistics input buffer Concatenated stuff from stats_out of pass1 should be placed he...
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented...
void av_freep(void *arg)
Free a memory block which has been allocated with av_malloc(z)() or av_realloc() and set the pointer ...
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
static void cx_pktcpy(struct FrameListData *dst, const struct vpx_codec_cx_pkt *src)
static av_cold int codecctl_int(AVCodecContext *avctx, enum vp8e_enc_control_id id, int val)
int64_t pts
time stamp to show frame (in timebase units)
static void coded_frame_add(void *list, struct FrameListData *cx_frame)
int64_t pts
presentation timestamp in time_base units (time when frame should be shown to user) If AV_NOPTS_VALUE...
int mb_threshold
Macroblock threshold below which the user specified macroblock types will be used.
char * stats_out
pass1 encoding statistics output buffer
static int init(AVCodecParserContext *s)
int frame_skip_threshold
frame skip threshold
int qmax
maximum quantizer
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
Round to nearest and halfway cases away from zero.
static const AVOption options[]
int rc_max_rate
maximum bitrate
void av_log(void *avcl, int level, const char *fmt,...)
const char * name
Name of the codec implementation.
static av_always_inline av_const double round(double x)
char * av_base64_encode(char *out, int out_size, const uint8_t *in, int in_size)
Encode data to base64 and null-terminate.
int flags
A combination of AV_PKT_FLAG values.
int rc_buffer_size
decoder bitstream buffer size
#define CODEC_CAP_AUTO_THREADS
AVFrame * avcodec_alloc_frame(void)
Allocate an AVFrame and set its fields to default values.
static av_cold void dump_enc_cfg(AVCodecContext *avctx, const struct vpx_codec_enc_cfg *cfg)
int bit_rate
the average bitrate
enum AVPictureType pict_type
Picture type of the frame, see ?_TYPE below.
#define AV_BASE64_SIZE(x)
Calculate the output size needed to base64-encode x bytes.
int width
picture width / height.
static av_cold int vp8_free(AVCodecContext *avctx)
int ff_alloc_packet(AVPacket *avpkt, int size)
Check AVPacket size and/or allocate data.
int ticks_per_frame
For some codecs, the time base is closer to the field rate than the frame rate.
static av_cold void log_encoder_error(AVCodecContext *avctx, const char *desc)
struct vpx_fixed_buf twopass_stats
int thread_count
thread count is used to decide how many independent tasks should be passed to execute() ...
struct FrameListData * next
static const AVCodecDefault defaults[]
int linesize[AV_NUM_DATA_POINTERS]
Size, in bytes, of the data for each picture/channel plane.
main external API structure.
static void close(AVCodecParserContext *s)
int qmin
minimum quantizer
static int storeframe(AVCodecContext *avctx, struct FrameListData *cx_frame, AVPacket *pkt, AVFrame *coded_frame)
Store coded frame information in format suitable for return from encode2().
Describe the class of an AVClass context structure.
uint32_t flags
flags for this frame
static av_cold int vp8_init(AVCodecContext *avctx)
static av_cold void free_coded_frame(struct FrameListData *cx_frame)
float qcompress
amount of qscale change between easy & hard scenes (0.0-1.0)
static int vp8_encode(AVCodecContext *avctx, AVPacket *pkt, const AVFrame *frame, int *got_packet)
void * buf
compressed data buffer
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
struct vpx_codec_ctx encoder
int noise_reduction
noise reduction strength
int gop_size
the number of pictures in a group of pictures, or 0 for intra_only
static const char *const ctlidstr[]
String mappings for enum vp8e_enc_control_id.
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
common internal api header.
common internal and external API header
void * av_realloc(void *ptr, size_t size)
Allocate or reallocate a block of memory.
#define AVERROR_INVALIDDATA
static av_cold void free_frame_list(struct FrameListData *list)
int slices
Number of slices.
Portion of struct vpx_codec_cx_pkt from vpx_encoder.h.
struct VP8EncoderContext VP8Context
int key_frame
1 -> keyframe, 0-> not
unsigned long duration
duration to show frame (in timebase units)
int av_base64_decode(uint8_t *out, const char *in, int out_size)
Decode a base64-encoded string.
int64_t dts
Decompression timestamp in AVStream->time_base units; the time at which the packet is decompressed...
static int queue_frames(AVCodecContext *avctx, AVPacket *pkt_out, AVFrame *coded_frame)
Queue multiple output frames from the encoder, returning the front-most.
int rc_min_rate
minimum bitrate
AVPixelFormat
Pixel format.
This structure stores compressed data.
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will b...
#define FF_PROFILE_UNKNOWN
int keyint_min
minimum GOP size