26 #define VPX_DISABLE_CTRL_TYPECHECKS 1
27 #define VPX_CODEC_DISABLE_COMPAT 1
28 #include <vpx/vpx_encoder.h>
29 #include <vpx/vp8cx.h>
63 typedef struct VPxEncoderContext {
65 struct vpx_codec_ctx encoder;
66 struct vpx_image rawimg;
67 struct vpx_codec_ctx encoder_alpha;
68 struct vpx_image rawimg_alpha;
70 struct vpx_fixed_buf twopass_stats;
/* Bit values for the VP8-specific "flags" field of the private context. */
82 #define VP8F_ERROR_RESILIENT 0x00000001 ///< Enable measures appropriate for streaming over lossy links
83 #define VP8F_AUTO_ALT_REF 0x00000002 ///< Enable automatic alternate reference frame generation
116 [VP8E_SET_CPUUSED] =
"VP8E_SET_CPUUSED",
117 [VP8E_SET_ENABLEAUTOALTREF] =
"VP8E_SET_ENABLEAUTOALTREF",
118 [VP8E_SET_NOISE_SENSITIVITY] =
"VP8E_SET_NOISE_SENSITIVITY",
119 [VP8E_SET_STATIC_THRESHOLD] =
"VP8E_SET_STATIC_THRESHOLD",
120 [VP8E_SET_TOKEN_PARTITIONS] =
"VP8E_SET_TOKEN_PARTITIONS",
121 [VP8E_SET_ARNR_MAXFRAMES] =
"VP8E_SET_ARNR_MAXFRAMES",
122 [VP8E_SET_ARNR_STRENGTH] =
"VP8E_SET_ARNR_STRENGTH",
123 [VP8E_SET_ARNR_TYPE] =
"VP8E_SET_ARNR_TYPE",
124 [VP8E_SET_TUNING] =
"VP8E_SET_TUNING",
125 [VP8E_SET_CQ_LEVEL] =
"VP8E_SET_CQ_LEVEL",
126 [VP8E_SET_MAX_INTRA_BITRATE_PCT] =
"VP8E_SET_MAX_INTRA_BITRATE_PCT",
127 #if CONFIG_LIBVPX_VP9_ENCODER
128 [VP9E_SET_LOSSLESS] =
"VP9E_SET_LOSSLESS",
129 [VP9E_SET_TILE_COLUMNS] =
"VP9E_SET_TILE_COLUMNS",
130 [VP9E_SET_TILE_ROWS] =
"VP9E_SET_TILE_ROWS",
131 [VP9E_SET_FRAME_PARALLEL_DECODING] =
"VP9E_SET_FRAME_PARALLEL_DECODING",
132 [VP9E_SET_AQ_MODE] =
"VP9E_SET_AQ_MODE",
133 #if VPX_ENCODER_ABI_VERSION > 8
134 [VP9E_SET_COLOR_SPACE] =
"VP9E_SET_COLOR_SPACE",
136 #if VPX_ENCODER_ABI_VERSION >= 11
137 [VP9E_SET_COLOR_RANGE] =
"VP9E_SET_COLOR_RANGE",
139 #if VPX_ENCODER_ABI_VERSION >= 12
140 [VP9E_SET_TARGET_LEVEL] =
"VP9E_SET_TARGET_LEVEL",
141 [VP9E_GET_LEVEL] =
"VP9E_GET_LEVEL",
143 #ifdef VPX_CTRL_VP9E_SET_ROW_MT
144 [VP9E_SET_ROW_MT] =
"VP9E_SET_ROW_MT",
153 const char *detail = vpx_codec_error_detail(&ctx->
encoder);
161 const struct vpx_codec_enc_cfg *cfg)
166 av_log(avctx, level,
"vpx_codec_enc_cfg\n");
167 av_log(avctx, level,
"generic settings\n"
168 " %*s%u\n %*s%u\n %*s%u\n %*s%u\n %*s%u\n"
169 #
if CONFIG_LIBVPX_VP9_ENCODER && defined(VPX_IMG_FMT_HIGHBITDEPTH)
172 " %*s{%u/%u}\n %*s%u\n %*s%d\n %*s%u\n",
173 width,
"g_usage:", cfg->g_usage,
174 width,
"g_threads:", cfg->g_threads,
175 width,
"g_profile:", cfg->g_profile,
176 width,
"g_w:", cfg->g_w,
177 width,
"g_h:", cfg->g_h,
178 #
if CONFIG_LIBVPX_VP9_ENCODER && defined(VPX_IMG_FMT_HIGHBITDEPTH)
179 width,
"g_bit_depth:", cfg->g_bit_depth,
180 width,
"g_input_bit_depth:", cfg->g_input_bit_depth,
182 width,
"g_timebase:", cfg->g_timebase.num, cfg->g_timebase.den,
183 width,
"g_error_resilient:", cfg->g_error_resilient,
184 width,
"g_pass:", cfg->g_pass,
185 width,
"g_lag_in_frames:", cfg->g_lag_in_frames);
186 av_log(avctx, level,
"rate control settings\n"
187 " %*s%u\n %*s%u\n %*s%u\n %*s%u\n"
189 width,
"rc_dropframe_thresh:", cfg->rc_dropframe_thresh,
190 width,
"rc_resize_allowed:", cfg->rc_resize_allowed,
191 width,
"rc_resize_up_thresh:", cfg->rc_resize_up_thresh,
192 width,
"rc_resize_down_thresh:", cfg->rc_resize_down_thresh,
193 width,
"rc_end_usage:", cfg->rc_end_usage,
194 width,
"rc_twopass_stats_in:", cfg->rc_twopass_stats_in.buf, cfg->rc_twopass_stats_in.sz,
195 width,
"rc_target_bitrate:", cfg->rc_target_bitrate);
196 av_log(avctx, level,
"quantizer settings\n"
198 width,
"rc_min_quantizer:", cfg->rc_min_quantizer,
199 width,
"rc_max_quantizer:", cfg->rc_max_quantizer);
200 av_log(avctx, level,
"bitrate tolerance\n"
202 width,
"rc_undershoot_pct:", cfg->rc_undershoot_pct,
203 width,
"rc_overshoot_pct:", cfg->rc_overshoot_pct);
204 av_log(avctx, level,
"decoder buffer model\n"
205 " %*s%u\n %*s%u\n %*s%u\n",
206 width,
"rc_buf_sz:", cfg->rc_buf_sz,
207 width,
"rc_buf_initial_sz:", cfg->rc_buf_initial_sz,
208 width,
"rc_buf_optimal_sz:", cfg->rc_buf_optimal_sz);
209 av_log(avctx, level,
"2 pass rate control settings\n"
210 " %*s%u\n %*s%u\n %*s%u\n",
211 width,
"rc_2pass_vbr_bias_pct:", cfg->rc_2pass_vbr_bias_pct,
212 width,
"rc_2pass_vbr_minsection_pct:", cfg->rc_2pass_vbr_minsection_pct,
213 width,
"rc_2pass_vbr_maxsection_pct:", cfg->rc_2pass_vbr_maxsection_pct);
214 av_log(avctx, level,
"keyframing settings\n"
215 " %*s%d\n %*s%u\n %*s%u\n",
216 width,
"kf_mode:", cfg->kf_mode,
217 width,
"kf_min_dist:", cfg->kf_min_dist,
218 width,
"kf_max_dist:", cfg->kf_max_dist);
219 av_log(avctx, level,
"\n");
252 enum vp8e_enc_control_id
id,
int val)
262 res = vpx_codec_control(&ctx->
encoder,
id, val);
263 if (res != VPX_CODEC_OK) {
264 snprintf(buf,
sizeof(buf),
"Failed to set %s codec control",
269 return res == VPX_CODEC_OK ? 0 :
AVERROR(EINVAL);
272 #if VPX_ENCODER_ABI_VERSION >= 12
274 enum vp8e_enc_control_id
id,
int *
val)
284 res = vpx_codec_control(&ctx->
encoder,
id, val);
285 if (res != VPX_CODEC_OK) {
286 snprintf(buf,
sizeof(buf),
"Failed to set %s codec control",
291 return res == VPX_CODEC_OK ? 0 :
AVERROR(EINVAL);
299 #if VPX_ENCODER_ABI_VERSION >= 12
303 if (!codecctl_intp(avctx, VP9E_GET_LEVEL, &level_out))
308 vpx_codec_destroy(&ctx->
encoder);
317 #if CONFIG_LIBVPX_VP9_ENCODER
319 struct vpx_codec_enc_cfg *enccfg, vpx_codec_flags_t *
flags,
320 vpx_img_fmt_t *img_fmt)
323 #ifdef VPX_IMG_FMT_HIGHBITDEPTH
324 enccfg->g_bit_depth = enccfg->g_input_bit_depth = 8;
329 enccfg->g_profile = 0;
330 *img_fmt = VPX_IMG_FMT_I420;
333 enccfg->g_profile = 1;
334 *img_fmt = VPX_IMG_FMT_I422;
336 #if VPX_IMAGE_ABI_VERSION >= 3
338 enccfg->g_profile = 1;
339 *img_fmt = VPX_IMG_FMT_I440;
342 ctx->vpx_cs = VPX_CS_SRGB;
345 enccfg->g_profile = 1;
346 *img_fmt = VPX_IMG_FMT_I444;
348 #ifdef VPX_IMG_FMT_HIGHBITDEPTH
351 if (codec_caps & VPX_CODEC_CAP_HIGHBITDEPTH) {
352 enccfg->g_bit_depth = enccfg->g_input_bit_depth =
354 enccfg->g_profile = 2;
355 *img_fmt = VPX_IMG_FMT_I42016;
356 *flags |= VPX_CODEC_USE_HIGHBITDEPTH;
362 if (codec_caps & VPX_CODEC_CAP_HIGHBITDEPTH) {
363 enccfg->g_bit_depth = enccfg->g_input_bit_depth =
365 enccfg->g_profile = 3;
366 *img_fmt = VPX_IMG_FMT_I42216;
367 *flags |= VPX_CODEC_USE_HIGHBITDEPTH;
371 #if VPX_IMAGE_ABI_VERSION >= 3
374 if (codec_caps & VPX_CODEC_CAP_HIGHBITDEPTH) {
375 enccfg->g_bit_depth = enccfg->g_input_bit_depth =
377 enccfg->g_profile = 3;
378 *img_fmt = VPX_IMG_FMT_I44016;
379 *flags |= VPX_CODEC_USE_HIGHBITDEPTH;
385 ctx->vpx_cs = VPX_CS_SRGB;
389 if (codec_caps & VPX_CODEC_CAP_HIGHBITDEPTH) {
390 enccfg->g_bit_depth = enccfg->g_input_bit_depth =
393 enccfg->g_profile = 3;
394 *img_fmt = VPX_IMG_FMT_I44416;
395 *flags |= VPX_CODEC_USE_HIGHBITDEPTH;
407 #if VPX_ENCODER_ABI_VERSION > 8
410 enum vpx_color_space vpx_cs;
435 #if VPX_ENCODER_ABI_VERSION >= 11
438 enum vpx_color_range vpx_cr;
455 const struct vpx_codec_iface *iface)
458 struct vpx_codec_enc_cfg enccfg = { 0 };
459 struct vpx_codec_enc_cfg enccfg_alpha;
463 vpx_img_fmt_t img_fmt = VPX_IMG_FMT_I420;
464 #if CONFIG_LIBVPX_VP9_ENCODER
465 vpx_codec_caps_t codec_caps = vpx_codec_get_caps(iface);
474 if ((res = vpx_codec_enc_config_default(iface, &enccfg, 0)) != VPX_CODEC_OK) {
476 vpx_codec_err_to_string(res));
480 #if CONFIG_LIBVPX_VP9_ENCODER
482 if (
set_pix_fmt(avctx, codec_caps, &enccfg, &flags, &img_fmt))
495 enccfg.g_w = avctx->
width;
496 enccfg.g_h = avctx->
height;
503 enccfg.g_pass = VPX_RC_FIRST_PASS;
505 enccfg.g_pass = VPX_RC_LAST_PASS;
507 enccfg.g_pass = VPX_RC_ONE_PASS;
511 enccfg.rc_end_usage = VPX_CBR;
512 }
else if (ctx->
crf >= 0) {
513 enccfg.rc_end_usage = VPX_CQ;
514 #if CONFIG_LIBVPX_VP9_ENCODER
516 enccfg.rc_end_usage = VPX_Q;
523 #if CONFIG_LIBVPX_VP9_ENCODER
524 }
else if (enccfg.rc_end_usage == VPX_Q) {
527 if (enccfg.rc_end_usage == VPX_CQ) {
528 enccfg.rc_target_bitrate = 1000000;
530 avctx->
bit_rate = enccfg.rc_target_bitrate * 1000;
532 "Neither bitrate nor constrained quality specified, using default bitrate of %dkbit/sec\n",
533 enccfg.rc_target_bitrate);
538 enccfg.rc_min_quantizer =
539 enccfg.rc_max_quantizer = 0;
541 if (avctx->
qmin >= 0)
542 enccfg.rc_min_quantizer = avctx->
qmin;
543 if (avctx->
qmax >= 0)
544 enccfg.rc_max_quantizer = avctx->
qmax;
547 if (enccfg.rc_end_usage == VPX_CQ
548 #
if CONFIG_LIBVPX_VP9_ENCODER
549 || enccfg.rc_end_usage == VPX_Q
552 if (ctx->
crf < enccfg.rc_min_quantizer || ctx->
crf > enccfg.rc_max_quantizer) {
554 "CQ level %d must be between minimum and maximum quantizer value (%d-%d)\n",
555 ctx->
crf, enccfg.rc_min_quantizer, enccfg.rc_max_quantizer);
560 #if FF_API_PRIVATE_OPT
571 enccfg.rc_2pass_vbr_minsection_pct =
574 enccfg.rc_2pass_vbr_maxsection_pct =
581 enccfg.rc_buf_initial_sz =
583 enccfg.rc_buf_optimal_sz = enccfg.rc_buf_sz * 5 / 6;
588 "deprecated, use the undershoot-pct private option instead.\n");
602 enccfg.kf_max_dist = avctx->
gop_size;
604 if (enccfg.g_pass == VPX_RC_FIRST_PASS)
605 enccfg.g_lag_in_frames = 0;
606 else if (enccfg.g_pass == VPX_RC_LAST_PASS) {
607 int decode_size, ret;
625 if (decode_size < 0) {
638 enccfg.g_profile = avctx->
profile;
644 res = vpx_codec_enc_init(&ctx->
encoder, iface, &enccfg, flags);
645 if (res != VPX_CODEC_OK) {
651 enccfg_alpha = enccfg;
652 res = vpx_codec_enc_init(&ctx->
encoder_alpha, iface, &enccfg_alpha, flags);
653 if (res != VPX_CODEC_OK) {
677 av_log(avctx,
AV_LOG_ERROR,
"Transparency encoding with auto_alt_ref does not work\n");
682 #if FF_API_PRIVATE_OPT
695 "use the static-thresh private option instead.\n");
706 #if CONFIG_LIBVPX_VP9_ENCODER
718 #if VPX_ENCODER_ABI_VERSION > 8
719 set_colorspace(avctx);
721 #if VPX_ENCODER_ABI_VERSION >= 11
722 set_color_range(avctx);
724 #if VPX_ENCODER_ABI_VERSION >= 12
727 #ifdef VPX_CTRL_VP9E_SET_ROW_MT
739 #if CONFIG_LIBVPX_VP9_ENCODER && defined(VPX_IMG_FMT_HIGHBITDEPTH)
741 ctx->
rawimg.bit_depth = enccfg.g_bit_depth;
752 if (enccfg.rc_end_usage == VPX_CBR ||
753 enccfg.g_pass != VPX_RC_ONE_PASS) {
764 const struct vpx_codec_cx_pkt *
src,
765 const struct vpx_codec_cx_pkt *src_alpha,
768 dst->
pts = src->data.frame.pts;
769 dst->
duration = src->data.frame.duration;
770 dst->
flags = src->data.frame.flags;
771 dst->
sz = src->data.frame.sz;
772 dst->
buf = src->data.frame.buf;
775 if (!(dst->
flags & VPX_FRAME_IS_INVISIBLE)) {
783 memcpy(dst->
sse, ctx->
sse,
sizeof(dst->
sse));
790 dst->
buf_alpha = src_alpha->data.frame.buf;
791 dst->
sz_alpha = src_alpha->data.frame.sz;
814 #if FF_API_CODED_FRAME
821 if (!!(cx_frame->
flags & VPX_FRAME_IS_KEY)) {
823 #if FF_API_CODED_FRAME
831 #if FF_API_CODED_FRAME
839 cx_frame->
have_sse ? 3 : 0, pict_type);
844 #if FF_API_CODED_FRAME
852 for (i = 0; i < 3; ++i) {
853 avctx->
error[i] += cx_frame->
sse[i + 1];
886 const struct vpx_codec_cx_pkt *
pkt;
887 const struct vpx_codec_cx_pkt *pkt_alpha =
NULL;
888 const void *iter =
NULL;
889 const void *iter_alpha =
NULL;
904 while ((pkt = vpx_codec_get_cx_data(&ctx->
encoder, &iter)) &&
908 case VPX_CODEC_CX_FRAME_PKT:
915 cx_pktcpy(&cx_frame, pkt, pkt_alpha, ctx);
925 "Frame queue element alloc failed\n");
928 cx_pktcpy(cx_frame, pkt, pkt_alpha, ctx);
931 if (!cx_frame->
buf) {
938 memcpy(cx_frame->
buf, pkt->data.frame.buf, pkt->data.frame.sz);
948 memcpy(cx_frame->
buf_alpha, pkt_alpha->data.frame.buf, pkt_alpha->data.frame.sz);
953 case VPX_CODEC_STATS_PKT: {
958 pkt->data.twopass_stats.sz)) < 0) {
963 memcpy((
uint8_t*)stats->buf + stats->sz,
964 pkt->data.twopass_stats.buf, pkt->data.twopass_stats.sz);
965 stats->sz += pkt->data.twopass_stats.sz;
968 case VPX_CODEC_PSNR_PKT:
970 ctx->
sse[0] = pkt->data.psnr.sse[0];
971 ctx->
sse[1] = pkt->data.psnr.sse[1];
972 ctx->
sse[2] = pkt->data.psnr.sse[2];
973 ctx->
sse[3] = pkt->data.psnr.sse[3];
976 case VPX_CODEC_CUSTOM_PKT:
989 struct vpx_image *rawimg =
NULL;
990 struct vpx_image *rawimg_alpha =
NULL;
991 int64_t timestamp = 0;
993 vpx_enc_frame_flags_t flags = 0;
997 rawimg->planes[VPX_PLANE_Y] = frame->
data[0];
998 rawimg->planes[VPX_PLANE_U] = frame->
data[1];
999 rawimg->planes[VPX_PLANE_V] = frame->
data[2];
1000 rawimg->stride[VPX_PLANE_Y] = frame->
linesize[0];
1001 rawimg->stride[VPX_PLANE_U] = frame->
linesize[1];
1002 rawimg->stride[VPX_PLANE_V] = frame->
linesize[2];
1006 rawimg_alpha->planes[VPX_PLANE_Y] = frame->
data[3];
1009 if (!u_plane || !v_plane) {
1015 rawimg_alpha->planes[VPX_PLANE_U] = u_plane;
1017 rawimg_alpha->planes[VPX_PLANE_V] = v_plane;
1018 rawimg_alpha->stride[VPX_PLANE_Y] = frame->
linesize[0];
1019 rawimg_alpha->stride[VPX_PLANE_U] = frame->
linesize[1];
1020 rawimg_alpha->stride[VPX_PLANE_V] = frame->
linesize[2];
1022 timestamp = frame->
pts;
1023 #if VPX_IMAGE_ABI_VERSION >= 4
1026 rawimg->range = VPX_CR_STUDIO_RANGE;
1029 rawimg->range = VPX_CR_FULL_RANGE;
1034 flags |= VPX_EFLAG_FORCE_KF;
1037 res = vpx_codec_encode(&ctx->
encoder, rawimg, timestamp,
1039 if (res != VPX_CODEC_OK) {
1045 res = vpx_codec_encode(&ctx->
encoder_alpha, rawimg_alpha, timestamp,
1047 if (res != VPX_CODEC_OK) {
1069 av_freep(&rawimg_alpha->planes[VPX_PLANE_U]);
1070 av_freep(&rawimg_alpha->planes[VPX_PLANE_V]);
1073 *got_packet = !!coded_size;
/* Byte offset of field x inside the encoder's private context (VPxContext),
 * used as the storage location of each option-table entry. */
1077 #define OFFSET(x) offsetof(VPxContext, x)
/* Flag set applied to every option in this file: video + encoding parameter.
 * Parenthesized so the expansion always behaves as a single operand, whatever
 * expression it is pasted into. */
1078 #define VE (AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM)
1080 #ifndef VPX_ERROR_RESILIENT_DEFAULT
1081 #define VPX_ERROR_RESILIENT_DEFAULT 1
1082 #define VPX_ERROR_RESILIENT_PARTITIONS 2
/*
 * Option-table entries for the libvpx encoder wrapper.
 *
 * Expands to a run of option initializers, each terminated by a comma, so the
 * macro can be dropped directly into an option array. Entries of type
 * AV_OPT_TYPE_CONST are named values for the option that shares their unit
 * string ("arnr_type", "tune", "quality", "er").
 *
 * All storage locations go through OFFSET() so they stay tied to VPxContext in
 * one place. The last entry deliberately has no line continuation: the macro
 * ends there regardless of what the following line contains.
 */
1085 #define COMMON_OPTIONS \
1086 { "auto-alt-ref", "Enable use of alternate reference " \
1087 "frames (2-pass only)", OFFSET(auto_alt_ref), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 2, VE}, \
1088 { "lag-in-frames", "Number of frames to look ahead for " \
1089 "alternate reference frame selection", OFFSET(lag_in_frames), AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX, VE}, \
1090 { "arnr-maxframes", "altref noise reduction max frame count", OFFSET(arnr_max_frames), AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX, VE}, \
1091 { "arnr-strength", "altref noise reduction filter strength", OFFSET(arnr_strength), AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX, VE}, \
1092 { "arnr-type", "altref noise reduction filter type", OFFSET(arnr_type), AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX, VE, "arnr_type"}, \
1093 { "backward", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = 1}, 0, 0, VE, "arnr_type" }, \
1094 { "forward", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = 2}, 0, 0, VE, "arnr_type" }, \
1095 { "centered", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = 3}, 0, 0, VE, "arnr_type" }, \
1096 { "tune", "Tune the encoding to a specific scenario", OFFSET(tune), AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX, VE, "tune"}, \
1097 { "psnr", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = VP8_TUNE_PSNR}, 0, 0, VE, "tune"}, \
1098 { "ssim", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = VP8_TUNE_SSIM}, 0, 0, VE, "tune"}, \
1099 { "deadline", "Time to spend encoding, in microseconds.", OFFSET(deadline), AV_OPT_TYPE_INT, {.i64 = VPX_DL_GOOD_QUALITY}, INT_MIN, INT_MAX, VE, "quality"}, \
1100 { "best", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = VPX_DL_BEST_QUALITY}, 0, 0, VE, "quality"}, \
1101 { "good", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = VPX_DL_GOOD_QUALITY}, 0, 0, VE, "quality"}, \
1102 { "realtime", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = VPX_DL_REALTIME}, 0, 0, VE, "quality"}, \
1103 { "error-resilient", "Error resilience configuration", OFFSET(error_resilient), AV_OPT_TYPE_FLAGS, {.i64 = 0}, INT_MIN, INT_MAX, VE, "er"}, \
1104 { "max-intra-rate", "Maximum I-frame bitrate (pct) 0=unlimited", OFFSET(max_intra_rate), AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX, VE}, \
1105 { "default", "Improve resiliency against losses of whole frames", 0, AV_OPT_TYPE_CONST, {.i64 = VPX_ERROR_RESILIENT_DEFAULT}, 0, 0, VE, "er"}, \
1106 { "partitions", "The frame partitions are independently decodable " \
1107 "by the bool decoder, meaning that partitions can be decoded even " \
1108 "though earlier partitions have been lost. Note that intra prediction" \
1109 " is still done over the partition boundary.", 0, AV_OPT_TYPE_CONST, {.i64 = VPX_ERROR_RESILIENT_PARTITIONS}, 0, 0, VE, "er"}, \
1110 { "crf", "Select the quality for constant quality mode", OFFSET(crf), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 63, VE }, \
1111 { "static-thresh", "A change threshold on blocks below which they will be skipped by the encoder", OFFSET(static_thresh), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, VE }, \
1112 { "drop-threshold", "Frame drop threshold", OFFSET(drop_threshold), AV_OPT_TYPE_INT, {.i64 = 0 }, INT_MIN, INT_MAX, VE }, \
1113 { "noise-sensitivity", "Noise sensitivity", OFFSET(noise_sensitivity), AV_OPT_TYPE_INT, {.i64 = 0 }, 0, 4, VE}, \
1114 { "undershoot-pct", "Datarate undershoot (min) target (%)", OFFSET(rc_undershoot_pct), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 100, VE }, \
1115 { "overshoot-pct", "Datarate overshoot (max) target (%)", OFFSET(rc_overshoot_pct), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1000, VE },
/*
 * Option-table entries kept under their older, underscore-style names
 * ("speed", "quality", "vp8flags", "arnr_*", "rc_lookahead").
 *
 * They write to the same VPxContext fields as the dash-style options
 * (deadline, arnr_max_frames, arnr_strength, arnr_type, lag_in_frames), but
 * with their own defaults and ranges. The "flags" unit exposes the VP8F_* bits.
 *
 * Storage locations use OFFSET() like the rest of the option tables, and the
 * last entry has no line continuation so the macro ends on that line.
 */
1117 #define LEGACY_OPTIONS \
1118 {"speed", "", OFFSET(cpu_used), AV_OPT_TYPE_INT, {.i64 = 1}, -16, 16, VE}, \
1119 {"quality", "", OFFSET(deadline), AV_OPT_TYPE_INT, {.i64 = VPX_DL_GOOD_QUALITY}, INT_MIN, INT_MAX, VE, "quality"}, \
1120 {"vp8flags", "", OFFSET(flags), AV_OPT_TYPE_FLAGS, {.i64 = 0}, 0, UINT_MAX, VE, "flags"}, \
1121 {"error_resilient", "enable error resilience", 0, AV_OPT_TYPE_CONST, {.i64 = VP8F_ERROR_RESILIENT}, INT_MIN, INT_MAX, VE, "flags"}, \
1122 {"altref", "enable use of alternate reference frames (VP8/2-pass only)", 0, AV_OPT_TYPE_CONST, {.i64 = VP8F_AUTO_ALT_REF}, INT_MIN, INT_MAX, VE, "flags"}, \
1123 {"arnr_max_frames", "altref noise reduction max frame count", OFFSET(arnr_max_frames), AV_OPT_TYPE_INT, {.i64 = 0}, 0, 15, VE}, \
1124 {"arnr_strength", "altref noise reduction filter strength", OFFSET(arnr_strength), AV_OPT_TYPE_INT, {.i64 = 3}, 0, 6, VE}, \
1125 {"arnr_type", "altref noise reduction filter type", OFFSET(arnr_type), AV_OPT_TYPE_INT, {.i64 = 3}, 1, 3, VE}, \
1126 {"rc_lookahead", "Number of frames to look ahead for alternate reference frame selection", OFFSET(lag_in_frames), AV_OPT_TYPE_INT, {.i64 = 25}, 0, 25, VE},
1128 #if CONFIG_LIBVPX_VP8_ENCODER
1129 static const AVOption vp8_options[] = {
1137 #if CONFIG_LIBVPX_VP9_ENCODER
1138 static const AVOption vp9_options[] = {
1142 {
"tile-columns",
"Number of tile columns to use, log2",
OFFSET(tile_columns),
AV_OPT_TYPE_INT, {.i64 = -1}, -1, 6,
VE},
1143 {
"tile-rows",
"Number of tile rows to use, log2",
OFFSET(tile_rows),
AV_OPT_TYPE_INT, {.i64 = -1}, -1, 2,
VE},
1144 {
"frame-parallel",
"Enable frame parallel decodability features",
OFFSET(frame_parallel),
AV_OPT_TYPE_BOOL,{.i64 = -1}, -1, 1,
VE},
1145 {
"aq-mode",
"adaptive quantization mode",
OFFSET(aq_mode),
AV_OPT_TYPE_INT, {.i64 = -1}, -1, 3,
VE,
"aq_mode"},
1147 {
"variance",
"Variance based Aq", 0,
AV_OPT_TYPE_CONST, {.i64 = 1}, 0, 0,
VE,
"aq_mode" },
1148 {
"complexity",
"Complexity based Aq", 0,
AV_OPT_TYPE_CONST, {.i64 = 2}, 0, 0,
VE,
"aq_mode" },
1150 #if VPX_ENCODER_ABI_VERSION >= 12
1153 #ifdef VPX_CTRL_VP9E_SET_ROW_MT
1161 #undef COMMON_OPTIONS
1162 #undef LEGACY_OPTIONS
1168 {
"keyint_min",
"-1" },
1172 #if CONFIG_LIBVPX_VP8_ENCODER
1175 return vpx_init(avctx, vpx_codec_vp8_cx());
1178 static const AVClass class_vp8 = {
1181 .option = vp8_options,
1185 AVCodec ff_libvpx_vp8_encoder = {
1196 .priv_class = &class_vp8,
1201 #if CONFIG_LIBVPX_VP9_ENCODER
1204 return vpx_init(avctx, vpx_codec_vp9_cx());
1207 static const AVClass class_vp9 = {
1210 .option = vp9_options,
1214 AVCodec ff_libvpx_vp9_encoder = {
1215 .
name =
"libvpx-vp9",
1225 .priv_class = &class_vp9,
also ITU-R BT1361 / IEC 61966-2-4 xvYCC709 / SMPTE RP177 Annex B
const char const char void * val
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
#define AV_PIX_FMT_YUV440P10
This structure describes decoded (raw) audio or video data.
static av_cold int vpx_free(AVCodecContext *avctx)
int ff_side_data_set_encoder_stats(AVPacket *pkt, int quality, int64_t *error, int error_count, int pict_type)
uint64_t error[AV_NUM_DATA_POINTERS]
error
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
#define AV_LOG_WARNING
Something somehow does not look correct.
int64_t bit_rate
the average bitrate
#define LIBAVUTIL_VERSION_INT
static av_cold int init(AVCodecContext *avctx)
struct FrameListData * coded_frame_list
int max_bitrate
Maximum bitrate of the stream, in bits per second.
also ITU-R BT601-6 625 / ITU-R BT1358 625 / ITU-R BT1700 625 PAL & SECAM / IEC 61966-2-4 xvYCC601 ...
int rc_initial_buffer_occupancy
Number of bits which should be loaded into the rc buffer before decoding starts.
enum AVColorRange color_range
MPEG vs JPEG YUV range.
#define AV_PIX_FMT_GBRP10
also ITU-R BT601-6 525 / ITU-R BT1358 525 / ITU-R BT1700 NTSC
enum AVPixelFormat pix_fmt
Pixel format, see AV_PIX_FMT_xxx.
size_t sz
length of compressed data
static int sse(MpegEncContext *s, uint8_t *src1, uint8_t *src2, int w, int h, int stride)
#define AV_PIX_FMT_YUV420P12
char * stats_in
pass2 encoding statistics input buffer Concatenated stuff from stats_out of pass1 should be placed he...
static void cx_pktcpy(struct FrameListData *dst, const struct vpx_codec_cx_pkt *src, const struct vpx_codec_cx_pkt *src_alpha, VPxContext *ctx)
#define AV_CODEC_CAP_AUTO_THREADS
Codec supports avctx->thread_count == 0 (auto).
struct vpx_fixed_buf twopass_stats
order of coefficients is actually GBR, also IEC 61966-2-1 (sRGB)
int min_bitrate
Minimum bitrate of the stream, in bits per second.
functionally identical to above
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented...
#define VP8F_AUTO_ALT_REF
Enable automatic alternate reference frame generation.
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
#define AV_CODEC_CAP_DELAY
Encoder or decoder requires flushing with NULL input at the end in order to give the complete and cor...
#define av_assert0(cond)
assert() equivalent, that is always enabled.
planar YUV 4:2:0, 20bpp, (1 Cr & Cb sample per 2x2 Y & A samples)
attribute_deprecated float rc_buffer_aggressivity
static av_cold int codecctl_int(AVCodecContext *avctx, enum vp8e_enc_control_id id, int val)
int64_t pts
time stamp to show frame (in timebase units)
static void coded_frame_add(void *list, struct FrameListData *cx_frame)
int64_t pts
Presentation timestamp in time_base units (time when frame should be shown to user).
#define AV_LOG_VERBOSE
Detailed information.
int buffer_size
The size of the buffer to which the ratecontrol is applied, in bits.
#define AV_PIX_FMT_YUV422P12
char * stats_out
pass1 encoding statistics output buffer
attribute_deprecated uint64_t error[AV_NUM_DATA_POINTERS]
attribute_deprecated int frame_skip_threshold
#define AV_PKT_FLAG_KEY
The packet contains a keyframe.
static int vpx_encode(AVCodecContext *avctx, AVPacket *pkt, const AVFrame *frame, int *got_packet)
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
static int storeframe(AVCodecContext *avctx, struct FrameListData *cx_frame, AVPacket *pkt)
Store coded frame information in format suitable for return from encode2().
int qmax
maximum quantizer
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
enum AVColorRange color_range
MPEG vs JPEG YUV range.
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
int flags
AV_CODEC_FLAG_*.
Round to nearest and halfway cases away from zero.
simple assert() macros that are a bit more flexible than ISO C assert().
const char * name
Name of the codec implementation.
#define AV_PIX_FMT_YUV444P10
char * av_base64_encode(char *out, int out_size, const uint8_t *in, int in_size)
Encode data to base64 and null-terminate.
int flags
A combination of AV_PKT_FLAG values.
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
int rc_buffer_size
decoder bitstream buffer size
int64_t rc_min_rate
minimum bitrate
common internal API header
static av_cold void dump_enc_cfg(AVCodecContext *avctx, const struct vpx_codec_enc_cfg *cfg)
enum AVPictureType pict_type
Picture type of the frame.
struct vpx_image rawimg_alpha
#define AV_BASE64_SIZE(x)
Calculate the output size needed to base64-encode x bytes to a null-terminated string.
int width
picture width / height.
#define FF_PROFILE_UNKNOWN
ITU-R BT2020 non-constant luminance system.
attribute_deprecated int noise_reduction
#define AV_CODEC_FLAG_PSNR
error[?] variables will be set during encoding.
#define AV_CODEC_FLAG_PASS1
Use internal 2pass ratecontrol in first pass mode.
int ticks_per_frame
For some codecs, the time base is closer to the field rate than the frame rate.
static av_cold void log_encoder_error(AVCodecContext *avctx, const char *desc)
attribute_deprecated int mb_threshold
int64_t av_rescale_rnd(int64_t a, int64_t b, int64_t c, enum AVRounding rnd)
Rescale a 64-bit integer with specified rounding.
static void error(const char *err)
int thread_count
thread count is used to decide how many independent tasks should be passed to execute() ...
struct FrameListData * next
the normal 2^n-1 "JPEG" YUV ranges
#define VP8F_ERROR_RESILIENT
Enable measures appropriate for streaming over lossy links.
static av_cold int vpx_init(AVCodecContext *avctx, const struct vpx_codec_iface *iface)
This structure describes the bitrate properties of an encoded bitstream.
static const AVCodecDefault defaults[]
#define AV_LOG_INFO
Standard information.
int av_reallocp(void *ptr, size_t size)
Allocate, reallocate, or free a block of memory through a pointer to a pointer.
Libavcodec external API header.
av_cold void ff_vp9_init_static(AVCodec *codec)
int linesize[AV_NUM_DATA_POINTERS]
For video, size in bytes of each picture line.
static av_cold int vp9_init(AVFormatContext *ctx, int st_index, PayloadContext *data)
static int set_pix_fmt(AVCodecContext *avctx, struct vpx_image *img, int has_alpha_channel)
main external API structure.
static int queue_frames(AVCodecContext *avctx, AVPacket *pkt_out)
Queue multiple output frames from the encoder, returning the front-most.
void av_packet_unref(AVPacket *pkt)
Wipe the packet.
int qmin
minimum quantizer
Data found in BlockAdditional element of matroska container.
#define AV_PIX_FMT_YUV420P10
Describe the class of an AVClass context structure.
static const AVProfile profiles[]
enum AVColorSpace colorspace
YUV colorspace type.
uint32_t flags
flags for this frame
#define AV_PIX_FMT_YUV440P12
int ff_alloc_packet2(AVCodecContext *avctx, AVPacket *avpkt, int64_t size, int64_t min_size)
Check AVPacket size and/or allocate data.
static av_cold void free_coded_frame(struct FrameListData *cx_frame)
float qcompress
amount of qscale change between easy & hard scenes (0.0-1.0)
static enum AVPixelFormat pix_fmts[]
void * buf
compressed data buffer
#define AV_PIX_FMT_GBRP12
int have_sse
true if we have pending sse[]
#define AV_PIX_FMT_YUV422P10
#define AV_PIX_FMT_YUV444P12
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
the normal 219*2^(n-8) "MPEG" YUV ranges
int flags
VP8 specific flags, see VP8F_* below.
int gop_size
the number of pictures in a group of pictures, or 0 for intra_only
static const char *const ctlidstr[]
String mappings for enum vp8e_enc_control_id.
struct vpx_codec_ctx encoder_alpha
static av_cold int vp8_init(AVFormatContext *s, int st_index, PayloadContext *vp8)
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
#define FF_DISABLE_DEPRECATION_WARNINGS
common internal api header.
common internal and external API header
struct vpx_codec_ctx encoder
attribute_deprecated AVFrame * coded_frame
the picture in the bitstream
AVCPBProperties * ff_add_cpb_side_data(AVCodecContext *avctx)
Add a CPB properties side data to an encoding context.
static av_cold void free_frame_list(struct FrameListData *list)
#define AV_CODEC_FLAG_PASS2
Use internal 2pass ratecontrol in second pass mode.
int slices
Number of slices.
#define FF_ENABLE_DEPRECATION_WARNINGS
Portion of struct vpx_codec_cx_pkt from vpx_encoder.h.
int avg_bitrate
Average bitrate of the stream, in bits per second.
int key_frame
1 -> keyframe, 0-> not
unsigned long duration
duration to show frame (in timebase units)
int av_base64_decode(uint8_t *out, const char *in_str, int out_size)
Decode a base64-encoded string.
static void stats(const struct CachedBuf *in, int n_in, unsigned *_max, unsigned *_sum)
int64_t dts
Decompression timestamp in AVStream->time_base units; the time at which the packet is decompressed...
int have_sse
true if we have pending sse[]
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
uint8_t * av_packet_new_side_data(AVPacket *pkt, enum AVPacketSideDataType type, int size)
Allocate new information of a packet.
const AVProfile ff_vp9_profiles[]
AVPixelFormat
Pixel format.
This structure stores compressed data.
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will b...
int64_t rc_max_rate
maximum bitrate
int keyint_min
minimum GOP size