FFmpeg
libvpxenc.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2010, Google, Inc.
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 /**
22  * @file
23  * VP8/9 encoder support via libvpx
24  */
25 
26 #include "config_components.h"
27 
28 #define VPX_DISABLE_CTRL_TYPECHECKS 1
29 #define VPX_CODEC_DISABLE_COMPAT 1
30 #include <vpx/vpx_encoder.h>
31 #include <vpx/vp8cx.h>
32 
33 #include "avcodec.h"
34 #include "codec_internal.h"
35 #include "encode.h"
36 #include "libavutil/avassert.h"
37 #include "libavutil/mem.h"
38 #include "libvpx.h"
39 #include "profiles.h"
40 #include "libavutil/avstring.h"
41 #include "libavutil/base64.h"
42 #include "libavutil/common.h"
43 #include "libavutil/cpu.h"
44 #include "libavutil/fifo.h"
45 #include "libavutil/internal.h"
46 #include "libavutil/intreadwrite.h"
47 #include "libavutil/mathematics.h"
48 #include "libavutil/opt.h"
49 #include "libavutil/pixdesc.h"
50 
51 #define IS_VP9(avctx) (CONFIG_LIBVPX_VP9_ENCODER && avctx->codec_id == AV_CODEC_ID_VP9)
52 #define IS_VP8(avctx) (CONFIG_LIBVPX_VP8_ENCODER && avctx->codec_id == AV_CODEC_ID_VP8)
53 
54 /**
55  * Portion of struct vpx_codec_cx_pkt from vpx_encoder.h.
56  * One encoded frame returned from the library.
57  */
58 struct FrameListData {
59  void *buf; /**< compressed data buffer */
60  size_t sz; /**< length of compressed data */
61  int64_t pts; /**< time stamp to show frame
62  (in timebase units) */
63  uint32_t flags; /**< flags for this frame */
64  uint64_t sse[4];
65  int have_sse; /**< true if we have pending sse[] */
66  struct FrameListData *next;
67 };
68 
69 typedef struct FrameData {
70  int64_t pts;
72 
73  void *frame_opaque;
75 
77 } FrameData;
78 
79 typedef struct VPxEncoderContext {
80  AVClass *class;
81  struct vpx_codec_ctx encoder;
82  struct vpx_image rawimg;
83  struct vpx_codec_ctx encoder_alpha;
84  struct vpx_image rawimg_alpha;
85  uint8_t is_alpha;
86  struct vpx_fixed_buf twopass_stats;
88  int deadline; //i.e., RT/GOOD/BEST
89  uint64_t sse[4];
90  int have_sse; /**< true if we have pending sse[] */
93 
94  int cpu_used;
95  int sharpness;
96  /**
97  * VP8 specific flags, see VP8F_* below.
98  */
99  int flags;
100 #define VP8F_ERROR_RESILIENT 0x00000001 ///< Enable measures appropriate for streaming over lossy links
101 #define VP8F_AUTO_ALT_REF 0x00000002 ///< Enable automatic alternate reference frame generation
102 
104 
108 
109  int tune;
110 
113  int crf;
118 
122 
123  // VP8-only
125 
126  // VP9-only
127  int lossless;
131  int aq_mode;
134  int vpx_cs;
135  float level;
136  int row_mt;
141 
142  // This FIFO is used to propagate various properties from frames to packets.
144  /**
145  * If the driver does not support ROI then warn the first time we
146  * encounter a frame with ROI side data.
147  */
149 #if CONFIG_LIBVPX_VP9_ENCODER && defined(VPX_CTRL_VP9E_SET_MAX_INTER_BITRATE_PCT)
150  vpx_svc_ref_frame_config_t ref_frame_config;
151 #endif
152 } VPxContext;
153 
154 /** String mappings for enum vp8e_enc_control_id */
155 static const char *const ctlidstr[] = {
156  [VP8E_SET_CPUUSED] = "VP8E_SET_CPUUSED",
157  [VP8E_SET_ENABLEAUTOALTREF] = "VP8E_SET_ENABLEAUTOALTREF",
158  [VP8E_SET_NOISE_SENSITIVITY] = "VP8E_SET_NOISE_SENSITIVITY",
159  [VP8E_SET_STATIC_THRESHOLD] = "VP8E_SET_STATIC_THRESHOLD",
160  [VP8E_SET_TOKEN_PARTITIONS] = "VP8E_SET_TOKEN_PARTITIONS",
161  [VP8E_SET_ARNR_MAXFRAMES] = "VP8E_SET_ARNR_MAXFRAMES",
162  [VP8E_SET_ARNR_STRENGTH] = "VP8E_SET_ARNR_STRENGTH",
163  [VP8E_SET_ARNR_TYPE] = "VP8E_SET_ARNR_TYPE",
164  [VP8E_SET_TUNING] = "VP8E_SET_TUNING",
165  [VP8E_SET_CQ_LEVEL] = "VP8E_SET_CQ_LEVEL",
166  [VP8E_SET_MAX_INTRA_BITRATE_PCT] = "VP8E_SET_MAX_INTRA_BITRATE_PCT",
167  [VP8E_SET_SHARPNESS] = "VP8E_SET_SHARPNESS",
168  [VP8E_SET_TEMPORAL_LAYER_ID] = "VP8E_SET_TEMPORAL_LAYER_ID",
169  [VP8E_SET_SCREEN_CONTENT_MODE] = "VP8E_SET_SCREEN_CONTENT_MODE",
170 #if CONFIG_LIBVPX_VP9_ENCODER
171  [VP9E_SET_LOSSLESS] = "VP9E_SET_LOSSLESS",
172  [VP9E_SET_TILE_COLUMNS] = "VP9E_SET_TILE_COLUMNS",
173  [VP9E_SET_TILE_ROWS] = "VP9E_SET_TILE_ROWS",
174  [VP9E_SET_FRAME_PARALLEL_DECODING] = "VP9E_SET_FRAME_PARALLEL_DECODING",
175  [VP9E_SET_AQ_MODE] = "VP9E_SET_AQ_MODE",
176  [VP9E_SET_COLOR_SPACE] = "VP9E_SET_COLOR_SPACE",
177  [VP9E_SET_SVC_LAYER_ID] = "VP9E_SET_SVC_LAYER_ID",
178 #if VPX_ENCODER_ABI_VERSION >= 12
179  [VP9E_SET_SVC_PARAMETERS] = "VP9E_SET_SVC_PARAMETERS",
180  [VP9E_SET_SVC_REF_FRAME_CONFIG] = "VP9E_SET_SVC_REF_FRAME_CONFIG",
181 #endif
182  [VP9E_SET_SVC] = "VP9E_SET_SVC",
183 #if VPX_ENCODER_ABI_VERSION >= 11
184  [VP9E_SET_COLOR_RANGE] = "VP9E_SET_COLOR_RANGE",
185 #endif
186 #if VPX_ENCODER_ABI_VERSION >= 12
187  [VP9E_SET_TARGET_LEVEL] = "VP9E_SET_TARGET_LEVEL",
188  [VP9E_GET_LEVEL] = "VP9E_GET_LEVEL",
189 #endif
190 #ifdef VPX_CTRL_VP9E_SET_ROW_MT
191  [VP9E_SET_ROW_MT] = "VP9E_SET_ROW_MT",
192 #endif
193 #ifdef VPX_CTRL_VP9E_SET_TUNE_CONTENT
194  [VP9E_SET_TUNE_CONTENT] = "VP9E_SET_TUNE_CONTENT",
195 #endif
196 #ifdef VPX_CTRL_VP9E_SET_TPL
197  [VP9E_SET_TPL] = "VP9E_SET_TPL",
198 #endif
199 #ifdef VPX_CTRL_VP9E_SET_MIN_GF_INTERVAL
200  [VP9E_SET_MIN_GF_INTERVAL] = "VP9E_SET_MIN_GF_INTERVAL",
201 #endif
202 #endif
203 };
204 
205 static av_cold void log_encoder_error(AVCodecContext *avctx, const char *desc)
206 {
207  VPxContext *ctx = avctx->priv_data;
208  const char *error = vpx_codec_error(&ctx->encoder);
209  const char *detail = vpx_codec_error_detail(&ctx->encoder);
210 
211  av_log(avctx, AV_LOG_ERROR, "%s: %s\n", desc, error);
212  if (detail)
213  av_log(avctx, AV_LOG_ERROR, " Additional information: %s\n", detail);
214 }
215 
217  const struct vpx_codec_enc_cfg *cfg,
218  int level)
219 {
220  int width = -30;
221  int i;
222 
223  av_log(avctx, level, "vpx_codec_enc_cfg\n");
224  av_log(avctx, level, "generic settings\n"
225  " %*s%u\n %*s%u\n %*s%u\n %*s%u\n %*s%u\n"
226 #if CONFIG_LIBVPX_VP9_ENCODER
227  " %*s%u\n %*s%u\n"
228 #endif
229  " %*s{%u/%u}\n %*s%u\n %*s%d\n %*s%u\n",
230  width, "g_usage:", cfg->g_usage,
231  width, "g_threads:", cfg->g_threads,
232  width, "g_profile:", cfg->g_profile,
233  width, "g_w:", cfg->g_w,
234  width, "g_h:", cfg->g_h,
235 #if CONFIG_LIBVPX_VP9_ENCODER
236  width, "g_bit_depth:", cfg->g_bit_depth,
237  width, "g_input_bit_depth:", cfg->g_input_bit_depth,
238 #endif
239  width, "g_timebase:", cfg->g_timebase.num, cfg->g_timebase.den,
240  width, "g_error_resilient:", cfg->g_error_resilient,
241  width, "g_pass:", cfg->g_pass,
242  width, "g_lag_in_frames:", cfg->g_lag_in_frames);
243  av_log(avctx, level, "rate control settings\n"
244  " %*s%u\n %*s%u\n %*s%u\n %*s%u\n"
245  " %*s%d\n %*s%p(%"SIZE_SPECIFIER")\n %*s%u\n",
246  width, "rc_dropframe_thresh:", cfg->rc_dropframe_thresh,
247  width, "rc_resize_allowed:", cfg->rc_resize_allowed,
248  width, "rc_resize_up_thresh:", cfg->rc_resize_up_thresh,
249  width, "rc_resize_down_thresh:", cfg->rc_resize_down_thresh,
250  width, "rc_end_usage:", cfg->rc_end_usage,
251  width, "rc_twopass_stats_in:", cfg->rc_twopass_stats_in.buf, cfg->rc_twopass_stats_in.sz,
252  width, "rc_target_bitrate:", cfg->rc_target_bitrate);
253  av_log(avctx, level, "quantizer settings\n"
254  " %*s%u\n %*s%u\n",
255  width, "rc_min_quantizer:", cfg->rc_min_quantizer,
256  width, "rc_max_quantizer:", cfg->rc_max_quantizer);
257  av_log(avctx, level, "bitrate tolerance\n"
258  " %*s%u\n %*s%u\n",
259  width, "rc_undershoot_pct:", cfg->rc_undershoot_pct,
260  width, "rc_overshoot_pct:", cfg->rc_overshoot_pct);
261  av_log(avctx, level, "temporal layering settings\n"
262  " %*s%u\n", width, "ts_number_layers:", cfg->ts_number_layers);
263  if (avctx->codec_id == AV_CODEC_ID_VP8) {
264  av_log(avctx, level,
265  "\n %*s", width, "ts_target_bitrate:");
266  for (i = 0; i < VPX_TS_MAX_LAYERS; i++)
267  av_log(avctx, level,
268  "%u ", cfg->ts_target_bitrate[i]);
269  }
270 #if (VPX_ENCODER_ABI_VERSION >= 12) && CONFIG_LIBVPX_VP9_ENCODER
271  if (avctx->codec_id == AV_CODEC_ID_VP9) {
272  av_log(avctx, level,
273  "\n %*s", width, "layer_target_bitrate:");
274  for (i = 0; i < VPX_TS_MAX_LAYERS; i++)
275  av_log(avctx, level,
276  "%u ", cfg->layer_target_bitrate[i]);
277  }
278 #endif
279  av_log(avctx, level, "\n");
280  av_log(avctx, level,
281  "\n %*s", width, "ts_rate_decimator:");
282  for (i = 0; i < VPX_TS_MAX_LAYERS; i++)
283  av_log(avctx, level, "%u ", cfg->ts_rate_decimator[i]);
284  av_log(avctx, level, "\n");
285  av_log(avctx, level,
286  "\n %*s%u\n", width, "ts_periodicity:", cfg->ts_periodicity);
287  av_log(avctx, level,
288  "\n %*s", width, "ts_layer_id:");
289  for (i = 0; i < VPX_TS_MAX_PERIODICITY; i++)
290  av_log(avctx, level, "%u ", cfg->ts_layer_id[i]);
291  av_log(avctx, level, "\n");
292  av_log(avctx, level, "decoder buffer model\n"
293  " %*s%u\n %*s%u\n %*s%u\n",
294  width, "rc_buf_sz:", cfg->rc_buf_sz,
295  width, "rc_buf_initial_sz:", cfg->rc_buf_initial_sz,
296  width, "rc_buf_optimal_sz:", cfg->rc_buf_optimal_sz);
297  av_log(avctx, level, "2 pass rate control settings\n"
298  " %*s%u\n %*s%u\n %*s%u\n",
299  width, "rc_2pass_vbr_bias_pct:", cfg->rc_2pass_vbr_bias_pct,
300  width, "rc_2pass_vbr_minsection_pct:", cfg->rc_2pass_vbr_minsection_pct,
301  width, "rc_2pass_vbr_maxsection_pct:", cfg->rc_2pass_vbr_maxsection_pct);
302 #if VPX_ENCODER_ABI_VERSION >= 14
303  av_log(avctx, level, " %*s%u\n",
304  width, "rc_2pass_vbr_corpus_complexity:", cfg->rc_2pass_vbr_corpus_complexity);
305 #endif
306  av_log(avctx, level, "keyframing settings\n"
307  " %*s%d\n %*s%u\n %*s%u\n",
308  width, "kf_mode:", cfg->kf_mode,
309  width, "kf_min_dist:", cfg->kf_min_dist,
310  width, "kf_max_dist:", cfg->kf_max_dist);
311  av_log(avctx, level, "\n");
312 }
313 
314 static void coded_frame_add(void *list, struct FrameListData *cx_frame)
315 {
316  struct FrameListData **p = list;
317 
318  while (*p)
319  p = &(*p)->next;
320  *p = cx_frame;
321  cx_frame->next = NULL;
322 }
323 
324 static av_cold void free_coded_frame(struct FrameListData *cx_frame)
325 {
326  av_freep(&cx_frame->buf);
327  av_freep(&cx_frame);
328 }
329 
331 {
332  struct FrameListData *p = list;
333 
334  while (p) {
335  list = list->next;
337  p = list;
338  }
339 }
340 
341 static void frame_data_uninit(FrameData *fd)
342 {
345 }
346 
347 static av_cold void fifo_free(AVFifo **fifo)
348 {
349  FrameData fd;
350  while (av_fifo_read(*fifo, &fd, 1) >= 0)
351  frame_data_uninit(&fd);
352  av_fifo_freep2(fifo);
353 }
354 
355 static int frame_data_submit(AVCodecContext *avctx, AVFifo *fifo,
356  const AVFrame *frame)
357 {
358  VPxContext *ctx = avctx->priv_data;
359  const struct vpx_codec_enc_cfg *enccfg = ctx->encoder.config.enc;
360 
361  FrameData fd = { .pts = frame->pts };
362  int ret;
363 
364  if (IS_VP9(avctx) &&
365  // Keep HDR10+ if it has bit depth higher than 8 and
366  // it has PQ trc (SMPTE2084).
367  enccfg->g_bit_depth > 8 && avctx->color_trc == AVCOL_TRC_SMPTE2084) {
369 
370  if (sd) {
371  fd.hdr10_plus = av_buffer_ref(sd->buf);
372  if (!fd.hdr10_plus)
373  return AVERROR(ENOMEM);
374  }
375  }
376 
377  fd.duration = frame->duration;
378  fd.frame_opaque = frame->opaque;
379  if (avctx->flags & AV_CODEC_FLAG_COPY_OPAQUE && frame->opaque_ref) {
380  ret = av_buffer_replace(&fd.frame_opaque_ref, frame->opaque_ref);
381  if (ret < 0)
382  goto fail;
383  }
384 
385  ret = av_fifo_write(fifo, &fd, 1);
386  if (ret < 0)
387  goto fail;
388 
389  return 0;
390 fail:
391  frame_data_uninit(&fd);
392  return ret;
393 }
394 
395 static int frame_data_apply(AVCodecContext *avctx, AVFifo *fifo, AVPacket *pkt)
396 {
397  FrameData fd;
398  uint8_t *data;
399  int ret = 0;
400 
401  if (av_fifo_peek(fifo, &fd, 1, 0) < 0)
402  return 0;
403  if (fd.pts != pkt->pts) {
404  av_log(avctx, AV_LOG_WARNING,
405  "Mismatching timestamps: libvpx %"PRId64" queued %"PRId64"; "
406  "this is a bug, please report it\n", pkt->pts, fd.pts);
407  goto skip;
408  }
409 
410  pkt->duration = fd.duration;
411  if (avctx->flags & AV_CODEC_FLAG_COPY_OPAQUE) {
412  pkt->opaque = fd.frame_opaque;
414  fd.frame_opaque_ref = NULL;
415  }
416 
417  if (fd.hdr10_plus) {
419  if (!data) {
420  ret = AVERROR(ENOMEM);
421  goto skip;
422  }
423 
424  memcpy(data, fd.hdr10_plus->data, fd.hdr10_plus->size);
425  }
426 
427 skip:
428  av_fifo_drain2(fifo, 1);
429  frame_data_uninit(&fd);
430 
431  return ret;
432 }
433 
435  enum vp8e_enc_control_id id, int val)
436 {
437  VPxContext *ctx = avctx->priv_data;
438  char buf[80];
439  int width = -30;
440  int res;
441 
442  snprintf(buf, sizeof(buf), "%s:", ctlidstr[id]);
443  av_log(avctx, AV_LOG_DEBUG, " %*s%d\n", width, buf, val);
444 
445  res = vpx_codec_control(&ctx->encoder, id, val);
446  if (res != VPX_CODEC_OK) {
447  snprintf(buf, sizeof(buf), "Failed to set %s codec control",
448  ctlidstr[id]);
449  log_encoder_error(avctx, buf);
450  return AVERROR(EINVAL);
451  }
452 
453  if (ctx->is_alpha) {
454  int res_alpha = vpx_codec_control(&ctx->encoder_alpha, id, val);
455  if (res_alpha != VPX_CODEC_OK) {
456  snprintf(buf, sizeof(buf), "Failed to set %s alpha codec control",
457  ctlidstr[id]);
458  log_encoder_error(avctx, buf);
459  return AVERROR(EINVAL);
460  }
461  }
462 
463  return 0;
464 }
465 
466 #if VPX_ENCODER_ABI_VERSION >= 12
467 static av_cold int codecctl_intp(AVCodecContext *avctx,
468  enum vp8e_enc_control_id id, int *val)
469 {
470  VPxContext *ctx = avctx->priv_data;
471  char buf[80];
472  int width = -30;
473  int res;
474 
475  snprintf(buf, sizeof(buf), "%s:", ctlidstr[id]);
476  av_log(avctx, AV_LOG_DEBUG, " %*s%d\n", width, buf, *val);
477 
478  res = vpx_codec_control(&ctx->encoder, id, val);
479  if (res != VPX_CODEC_OK) {
480  snprintf(buf, sizeof(buf), "Failed to set %s codec control",
481  ctlidstr[id]);
482  log_encoder_error(avctx, buf);
483  return AVERROR(EINVAL);
484  }
485 
486  if (ctx->is_alpha) {
487  int res_alpha = vpx_codec_control(&ctx->encoder_alpha, id, val);
488  if (res_alpha != VPX_CODEC_OK) {
489  snprintf(buf, sizeof(buf), "Failed to set %s alpha codec control",
490  ctlidstr[id]);
491  log_encoder_error(avctx, buf);
492  return AVERROR(EINVAL);
493  }
494  }
495 
496  return 0;
497 }
498 #endif
499 
500 static av_cold int vpx_free(AVCodecContext *avctx)
501 {
502  VPxContext *ctx = avctx->priv_data;
503 
504 #if VPX_ENCODER_ABI_VERSION >= 12
505  if (avctx->codec_id == AV_CODEC_ID_VP9 && ctx->level >= 0 &&
506  !(avctx->flags & AV_CODEC_FLAG_PASS1)) {
507  int level_out = 0;
508  if (!codecctl_intp(avctx, VP9E_GET_LEVEL, &level_out))
509  av_log(avctx, AV_LOG_INFO, "Encoded level %.1f\n", level_out * 0.1);
510  }
511 #endif
512 
513  av_freep(&ctx->ts_layer_flags);
514 
515  vpx_codec_destroy(&ctx->encoder);
516  if (ctx->is_alpha) {
517  vpx_codec_destroy(&ctx->encoder_alpha);
518  av_freep(&ctx->rawimg_alpha.planes[VPX_PLANE_U]);
519  av_freep(&ctx->rawimg_alpha.planes[VPX_PLANE_V]);
520  }
521  av_freep(&ctx->twopass_stats.buf);
522  av_freep(&avctx->stats_out);
523  free_frame_list(ctx->coded_frame_list);
524  free_frame_list(ctx->alpha_coded_frame_list);
525  if (ctx->fifo)
526  fifo_free(&ctx->fifo);
527  return 0;
528 }
529 
530 static void vp8_ts_parse_int_array(int *dest, char *value, size_t value_len, int max_entries)
531 {
532  int dest_idx = 0;
533  char *saveptr = NULL;
534  char *token = av_strtok(value, ",", &saveptr);
535 
536  while (token && dest_idx < max_entries) {
537  dest[dest_idx++] = strtoul(token, NULL, 10);
538  token = av_strtok(NULL, ",", &saveptr);
539  }
540 }
541 
542 #if CONFIG_LIBVPX_VP9_ENCODER && defined(VPX_CTRL_VP9E_SET_MAX_INTER_BITRATE_PCT)
543 static void vp8_ts_parse_int64_array(int64_t *dest, char *value, size_t value_len, int max_entries)
544 {
545  int dest_idx = 0;
546  char *saveptr = NULL;
547  char *token = av_strtok(value, ",", &saveptr);
548 
549  while (token && dest_idx < max_entries) {
550  dest[dest_idx++] = strtoull(token, NULL, 10);
551  token = av_strtok(NULL, ",", &saveptr);
552  }
553 }
554 #endif
555 
556 static void set_temporal_layer_pattern(int layering_mode, vpx_codec_enc_cfg_t *cfg,
557  int *layer_flags, int *flag_periodicity)
558 {
559  switch (layering_mode) {
560  case 2: {
561  /**
562  * 2-layers, 2-frame period.
563  */
564  static const int ids[2] = { 0, 1 };
565  cfg->ts_periodicity = 2;
566  *flag_periodicity = 2;
567  cfg->ts_number_layers = 2;
568  cfg->ts_rate_decimator[0] = 2;
569  cfg->ts_rate_decimator[1] = 1;
570  memcpy(cfg->ts_layer_id, ids, sizeof(ids));
571 
572  layer_flags[0] =
573  VP8_EFLAG_NO_REF_GF | VP8_EFLAG_NO_REF_ARF |
574  VP8_EFLAG_NO_UPD_GF | VP8_EFLAG_NO_UPD_ARF;
575  layer_flags[1] =
576  VP8_EFLAG_NO_UPD_ARF | VP8_EFLAG_NO_UPD_GF |
577  VP8_EFLAG_NO_UPD_LAST |
578  VP8_EFLAG_NO_REF_ARF | VP8_EFLAG_NO_REF_GF;
579  break;
580  }
581  case 3: {
582  /**
583  * 3-layers structure with one reference frame.
584  * This works same as temporal_layering_mode 3.
585  *
586  * 3-layers, 4-frame period.
587  */
588  static const int ids[4] = { 0, 2, 1, 2 };
589  cfg->ts_periodicity = 4;
590  *flag_periodicity = 4;
591  cfg->ts_number_layers = 3;
592  cfg->ts_rate_decimator[0] = 4;
593  cfg->ts_rate_decimator[1] = 2;
594  cfg->ts_rate_decimator[2] = 1;
595  memcpy(cfg->ts_layer_id, ids, sizeof(ids));
596 
597  /**
598  * 0=L, 1=GF, 2=ARF,
599  * Intra-layer prediction disabled.
600  */
601  layer_flags[0] =
602  VP8_EFLAG_NO_REF_GF | VP8_EFLAG_NO_REF_ARF |
603  VP8_EFLAG_NO_UPD_GF | VP8_EFLAG_NO_UPD_ARF;
604  layer_flags[1] =
605  VP8_EFLAG_NO_REF_GF | VP8_EFLAG_NO_REF_ARF |
606  VP8_EFLAG_NO_UPD_LAST | VP8_EFLAG_NO_UPD_GF |
607  VP8_EFLAG_NO_UPD_ARF;
608  layer_flags[2] =
609  VP8_EFLAG_NO_REF_GF | VP8_EFLAG_NO_REF_ARF |
610  VP8_EFLAG_NO_UPD_ARF | VP8_EFLAG_NO_UPD_LAST;
611  layer_flags[3] =
612  VP8_EFLAG_NO_REF_LAST | VP8_EFLAG_NO_REF_ARF |
613  VP8_EFLAG_NO_UPD_LAST | VP8_EFLAG_NO_UPD_GF |
614  VP8_EFLAG_NO_UPD_ARF;
615  break;
616  }
617  case 4: {
618  /**
619  * 3-layers structure.
620  * added dependency between the two TL2 frames (on top of case 3).
621  * 3-layers, 4-frame period.
622  */
623  static const int ids[4] = { 0, 2, 1, 2 };
624  cfg->ts_periodicity = 4;
625  *flag_periodicity = 4;
626  cfg->ts_number_layers = 3;
627  cfg->ts_rate_decimator[0] = 4;
628  cfg->ts_rate_decimator[1] = 2;
629  cfg->ts_rate_decimator[2] = 1;
630  memcpy(cfg->ts_layer_id, ids, sizeof(ids));
631 
632  /**
633  * 0=L, 1=GF, 2=ARF, Intra-layer prediction disabled.
634  */
635  layer_flags[0] =
636  VP8_EFLAG_NO_REF_GF | VP8_EFLAG_NO_REF_ARF |
637  VP8_EFLAG_NO_UPD_GF | VP8_EFLAG_NO_UPD_ARF;
638  layer_flags[1] =
639  VP8_EFLAG_NO_REF_GF | VP8_EFLAG_NO_REF_ARF |
640  VP8_EFLAG_NO_UPD_LAST | VP8_EFLAG_NO_UPD_GF;
641  layer_flags[2] =
642  VP8_EFLAG_NO_REF_GF | VP8_EFLAG_NO_REF_ARF |
643  VP8_EFLAG_NO_UPD_ARF | VP8_EFLAG_NO_UPD_LAST;
644  layer_flags[3] =
645  VP8_EFLAG_NO_REF_LAST |
646  VP8_EFLAG_NO_UPD_LAST | VP8_EFLAG_NO_UPD_GF |
647  VP8_EFLAG_NO_UPD_ARF;
648  break;
649  }
650  default:
651  /**
652  * do not change the layer_flags or the flag_periodicity in this case;
653  * it might be that the code is using external flags to be used.
654  */
655  break;
656 
657  }
658 }
659 
660 static int vpx_ts_param_parse(VPxContext *ctx, struct vpx_codec_enc_cfg *enccfg,
661  char *key, char *value, enum AVCodecID codec_id)
662 {
663  size_t value_len = strlen(value);
664  int ts_layering_mode = 0;
665 
666  if (!value_len)
667  return -1;
668 
669  if (!strcmp(key, "ts_number_layers"))
670  enccfg->ts_number_layers = strtoul(value, &value, 10);
671  else if (!strcmp(key, "ts_target_bitrate")) {
672  if (codec_id == AV_CODEC_ID_VP8)
673  vp8_ts_parse_int_array(enccfg->ts_target_bitrate, value, value_len, VPX_TS_MAX_LAYERS);
674 #if (VPX_ENCODER_ABI_VERSION >= 12) && CONFIG_LIBVPX_VP9_ENCODER
675  if (codec_id == AV_CODEC_ID_VP9)
676  vp8_ts_parse_int_array(enccfg->layer_target_bitrate, value, value_len, VPX_TS_MAX_LAYERS);
677 #endif
678  } else if (!strcmp(key, "ts_rate_decimator")) {
679  vp8_ts_parse_int_array(enccfg->ts_rate_decimator, value, value_len, VPX_TS_MAX_LAYERS);
680  } else if (!strcmp(key, "ts_periodicity")) {
681  enccfg->ts_periodicity = strtoul(value, &value, 10);
682  } else if (!strcmp(key, "ts_layer_id")) {
683  vp8_ts_parse_int_array(enccfg->ts_layer_id, value, value_len, VPX_TS_MAX_PERIODICITY);
684  } else if (!strcmp(key, "ts_layering_mode")) {
685  /* option for pre-defined temporal structures in function set_temporal_layer_pattern. */
686  ts_layering_mode = strtoul(value, &value, 10);
687  }
688 
689 #if (VPX_ENCODER_ABI_VERSION >= 12) && CONFIG_LIBVPX_VP9_ENCODER
690  enccfg->temporal_layering_mode = VP9E_TEMPORAL_LAYERING_MODE_BYPASS; // only bypass mode is supported for now.
691  enccfg->ss_number_layers = 1; // TODO: add spatial scalability support.
692 #endif
693  if (ts_layering_mode) {
694  // make sure the ts_layering_mode comes at the end of the ts_parameter string to ensure that
695  // correct configuration is done.
696  ctx->ts_layer_flags = av_malloc_array(VPX_TS_MAX_PERIODICITY, sizeof(*ctx->ts_layer_flags));
697  set_temporal_layer_pattern(ts_layering_mode, enccfg, ctx->ts_layer_flags, &enccfg->ts_periodicity);
698  }
699 
700  return 0;
701 }
702 
703 #if CONFIG_LIBVPX_VP9_ENCODER && defined(VPX_CTRL_VP9E_SET_MAX_INTER_BITRATE_PCT)
704 static int vpx_ref_frame_config_set_value(vpx_svc_ref_frame_config_t *ref_frame_config,
705  int ss_number_layers, char *key, char *value)
706 {
707  size_t value_len = strlen(value);
708 
709  if (!value_len)
710  return AVERROR(EINVAL);
711 
712  if (!strcmp(key, "rfc_update_buffer_slot")) {
713  vp8_ts_parse_int_array(ref_frame_config->update_buffer_slot, value, value_len, ss_number_layers);
714  } else if (!strcmp(key, "rfc_update_last")) {
715  vp8_ts_parse_int_array(ref_frame_config->update_last, value, value_len, ss_number_layers);
716  } else if (!strcmp(key, "rfc_update_golden")) {
717  vp8_ts_parse_int_array(ref_frame_config->update_golden, value, value_len, ss_number_layers);
718  } else if (!strcmp(key, "rfc_update_alt_ref")) {
719  vp8_ts_parse_int_array(ref_frame_config->update_alt_ref, value, value_len, ss_number_layers);
720  } else if (!strcmp(key, "rfc_lst_fb_idx")) {
721  vp8_ts_parse_int_array(ref_frame_config->lst_fb_idx, value, value_len, ss_number_layers);
722  } else if (!strcmp(key, "rfc_gld_fb_idx")) {
723  vp8_ts_parse_int_array(ref_frame_config->gld_fb_idx, value, value_len, ss_number_layers);
724  } else if (!strcmp(key, "rfc_alt_fb_idx")) {
725  vp8_ts_parse_int_array(ref_frame_config->alt_fb_idx, value, value_len, ss_number_layers);
726  } else if (!strcmp(key, "rfc_reference_last")) {
727  vp8_ts_parse_int_array(ref_frame_config->reference_last, value, value_len, ss_number_layers);
728  } else if (!strcmp(key, "rfc_reference_golden")) {
729  vp8_ts_parse_int_array(ref_frame_config->reference_golden, value, value_len, ss_number_layers);
730  } else if (!strcmp(key, "rfc_reference_alt_ref")) {
731  vp8_ts_parse_int_array(ref_frame_config->reference_alt_ref, value, value_len, ss_number_layers);
732  } else if (!strcmp(key, "rfc_reference_duration")) {
733  vp8_ts_parse_int64_array(ref_frame_config->duration, value, value_len, ss_number_layers);
734  }
735 
736  return 0;
737 }
738 
739 static int vpx_parse_ref_frame_config_element(vpx_svc_ref_frame_config_t *ref_frame_config,
740  int ss_number_layers, const char **buf)
741 {
742  const char key_val_sep[] = "=";
743  const char pairs_sep[] = ":";
744  char *key = av_get_token(buf, key_val_sep);
745  char *val = NULL;
746  int ret;
747 
748  if (key && *key && strspn(*buf, key_val_sep)) {
749  (*buf)++;
750  val = av_get_token(buf, pairs_sep);
751  }
752 
753  if (key && *key && val && *val)
754  ret = vpx_ref_frame_config_set_value(ref_frame_config, ss_number_layers, key, val);
755  else
756  ret = AVERROR(EINVAL);
757 
758  av_freep(&key);
759  av_freep(&val);
760 
761  return ret;
762 }
763 
764 static int vpx_parse_ref_frame_config(vpx_svc_ref_frame_config_t *ref_frame_config,
765  int ss_number_layers, const char *str)
766 {
767  int ret = 0;
768 
769  while (*str) {
770  ret =
771  vpx_parse_ref_frame_config_element(ref_frame_config, ss_number_layers, &str);
772  if (ret < 0)
773  return ret;
774 
775  if (*str)
776  str++;
777  }
778 
779  return ret;
780 }
781 #endif
782 
783 #if CONFIG_LIBVPX_VP9_ENCODER
784 static int set_pix_fmt(AVCodecContext *avctx, vpx_codec_caps_t codec_caps,
785  struct vpx_codec_enc_cfg *enccfg, vpx_codec_flags_t *flags,
786  vpx_img_fmt_t *img_fmt)
787 {
788  VPxContext *ctx = avctx->priv_data;
790  enccfg->g_bit_depth = enccfg->g_input_bit_depth = desc->comp[0].depth;
791  switch (avctx->pix_fmt) {
792  case AV_PIX_FMT_YUV420P:
793  case AV_PIX_FMT_YUVA420P:
794  enccfg->g_profile = 0;
795  *img_fmt = VPX_IMG_FMT_I420;
796  return 0;
797  case AV_PIX_FMT_YUV422P:
798  enccfg->g_profile = 1;
799  *img_fmt = VPX_IMG_FMT_I422;
800  return 0;
801  case AV_PIX_FMT_YUV440P:
802  enccfg->g_profile = 1;
803  *img_fmt = VPX_IMG_FMT_I440;
804  return 0;
805  case AV_PIX_FMT_GBRP:
806  ctx->vpx_cs = VPX_CS_SRGB;
807  case AV_PIX_FMT_YUV444P:
808  enccfg->g_profile = 1;
809  *img_fmt = VPX_IMG_FMT_I444;
810  return 0;
813  if (codec_caps & VPX_CODEC_CAP_HIGHBITDEPTH) {
814  enccfg->g_profile = 2;
815  *img_fmt = VPX_IMG_FMT_I42016;
816  *flags |= VPX_CODEC_USE_HIGHBITDEPTH;
817  return 0;
818  }
819  break;
822  if (codec_caps & VPX_CODEC_CAP_HIGHBITDEPTH) {
823  enccfg->g_profile = 3;
824  *img_fmt = VPX_IMG_FMT_I42216;
825  *flags |= VPX_CODEC_USE_HIGHBITDEPTH;
826  return 0;
827  }
828  break;
831  if (codec_caps & VPX_CODEC_CAP_HIGHBITDEPTH) {
832  enccfg->g_profile = 3;
833  *img_fmt = VPX_IMG_FMT_I44016;
834  *flags |= VPX_CODEC_USE_HIGHBITDEPTH;
835  return 0;
836  }
837  break;
838  case AV_PIX_FMT_GBRP10:
839  case AV_PIX_FMT_GBRP12:
840  ctx->vpx_cs = VPX_CS_SRGB;
843  if (codec_caps & VPX_CODEC_CAP_HIGHBITDEPTH) {
844  enccfg->g_profile = 3;
845  *img_fmt = VPX_IMG_FMT_I44416;
846  *flags |= VPX_CODEC_USE_HIGHBITDEPTH;
847  return 0;
848  }
849  break;
850  default:
851  break;
852  }
853  av_log(avctx, AV_LOG_ERROR, "Unsupported pixel format.\n");
854  return AVERROR_INVALIDDATA;
855 }
856 
857 static void set_colorspace(AVCodecContext *avctx)
858 {
859  enum vpx_color_space vpx_cs;
860  VPxContext *ctx = avctx->priv_data;
861 
862  if (ctx->vpx_cs) {
863  vpx_cs = ctx->vpx_cs;
864  } else {
865  switch (avctx->colorspace) {
866  case AVCOL_SPC_RGB: vpx_cs = VPX_CS_SRGB; break;
867  case AVCOL_SPC_BT709: vpx_cs = VPX_CS_BT_709; break;
868  case AVCOL_SPC_UNSPECIFIED: vpx_cs = VPX_CS_UNKNOWN; break;
869  case AVCOL_SPC_RESERVED: vpx_cs = VPX_CS_RESERVED; break;
870  case AVCOL_SPC_BT470BG: vpx_cs = VPX_CS_BT_601; break;
871  case AVCOL_SPC_SMPTE170M: vpx_cs = VPX_CS_SMPTE_170; break;
872  case AVCOL_SPC_SMPTE240M: vpx_cs = VPX_CS_SMPTE_240; break;
873  case AVCOL_SPC_BT2020_NCL: vpx_cs = VPX_CS_BT_2020; break;
874  default:
875  av_log(avctx, AV_LOG_WARNING, "Unsupported colorspace (%d)\n",
876  avctx->colorspace);
877  return;
878  }
879  }
880  codecctl_int(avctx, VP9E_SET_COLOR_SPACE, vpx_cs);
881 }
882 
883 #if VPX_ENCODER_ABI_VERSION >= 11
884 static void set_color_range(AVCodecContext *avctx)
885 {
886  enum vpx_color_range vpx_cr;
887  switch (avctx->color_range) {
889  case AVCOL_RANGE_MPEG: vpx_cr = VPX_CR_STUDIO_RANGE; break;
890  case AVCOL_RANGE_JPEG: vpx_cr = VPX_CR_FULL_RANGE; break;
891  default:
892  av_log(avctx, AV_LOG_WARNING, "Unsupported color range (%d)\n",
893  avctx->color_range);
894  return;
895  }
896 
897  codecctl_int(avctx, VP9E_SET_COLOR_RANGE, vpx_cr);
898 }
899 #endif
900 #endif
901 
902 /**
903  * Set the target bitrate to VPX library default. Also set CRF to 32 if needed.
904  */
905 static void set_vp8_defaults(AVCodecContext *avctx,
906  struct vpx_codec_enc_cfg *enccfg)
907 {
908  VPxContext *ctx = avctx->priv_data;
909  av_assert0(!avctx->bit_rate);
910  avctx->bit_rate = enccfg->rc_target_bitrate * 1000;
911  if (enccfg->rc_end_usage == VPX_CQ) {
912  av_log(avctx, AV_LOG_WARNING,
913  "Bitrate not specified for constrained quality mode, using default of %dkbit/sec\n",
914  enccfg->rc_target_bitrate);
915  } else {
916  enccfg->rc_end_usage = VPX_CQ;
917  ctx->crf = 32;
918  av_log(avctx, AV_LOG_WARNING,
919  "Neither bitrate nor constrained quality specified, using default CRF of %d and bitrate of %dkbit/sec\n",
920  ctx->crf, enccfg->rc_target_bitrate);
921  }
922 }
923 
924 
925 #if CONFIG_LIBVPX_VP9_ENCODER
926 /**
927  * Keep the target bitrate at 0 to engage constant quality mode. If CRF is not
928  * set, use 32.
929  */
930 static void set_vp9_defaults(AVCodecContext *avctx,
931  struct vpx_codec_enc_cfg *enccfg)
932 {
933  VPxContext *ctx = avctx->priv_data;
934  av_assert0(!avctx->bit_rate);
935  if (enccfg->rc_end_usage != VPX_Q && ctx->lossless < 0) {
936  enccfg->rc_end_usage = VPX_Q;
937  ctx->crf = 32;
938  av_log(avctx, AV_LOG_WARNING,
939  "Neither bitrate nor constrained quality specified, using default CRF of %d\n",
940  ctx->crf);
941  }
942 }
943 #endif
944 
945 /**
946  * Called when the bitrate is not set. It sets appropriate default values for
947  * bitrate and CRF.
948  */
949 static void set_vpx_defaults(AVCodecContext *avctx,
950  struct vpx_codec_enc_cfg *enccfg)
951 {
952  av_assert0(!avctx->bit_rate);
953 #if CONFIG_LIBVPX_VP9_ENCODER
954  if (avctx->codec_id == AV_CODEC_ID_VP9) {
955  set_vp9_defaults(avctx, enccfg);
956  return;
957  }
958 #endif
959  set_vp8_defaults(avctx, enccfg);
960 }
961 
962 static av_cold int vpx_init(AVCodecContext *avctx,
963  const struct vpx_codec_iface *iface)
964 {
965  VPxContext *ctx = avctx->priv_data;
966  struct vpx_codec_enc_cfg enccfg = { 0 };
967  struct vpx_codec_enc_cfg enccfg_alpha;
968  vpx_codec_flags_t flags = (avctx->flags & AV_CODEC_FLAG_PSNR) ? VPX_CODEC_USE_PSNR : 0;
969  AVCPBProperties *cpb_props;
970  int res;
971  vpx_img_fmt_t img_fmt = VPX_IMG_FMT_I420;
972 #if CONFIG_LIBVPX_VP9_ENCODER
973  vpx_codec_caps_t codec_caps = vpx_codec_get_caps(iface);
974  vpx_svc_extra_cfg_t svc_params;
975 #endif
976  const AVDictionaryEntry* en = NULL;
977 
978  av_log(avctx, AV_LOG_INFO, "%s\n", vpx_codec_version_str());
979  av_log(avctx, AV_LOG_VERBOSE, "%s\n", vpx_codec_build_config());
980 
981  if (avctx->pix_fmt == AV_PIX_FMT_YUVA420P)
982  ctx->is_alpha = 1;
983 
984  if ((res = vpx_codec_enc_config_default(iface, &enccfg, 0)) != VPX_CODEC_OK) {
985  av_log(avctx, AV_LOG_ERROR, "Failed to get config: %s\n",
986  vpx_codec_err_to_string(res));
987  return AVERROR(EINVAL);
988  }
989 
990  ctx->fifo = av_fifo_alloc2(1, sizeof(FrameData), AV_FIFO_FLAG_AUTO_GROW);
991  if (!ctx->fifo)
992  return AVERROR(ENOMEM);
993 
994 #if CONFIG_LIBVPX_VP9_ENCODER
995  if (avctx->codec_id == AV_CODEC_ID_VP9) {
996  if (set_pix_fmt(avctx, codec_caps, &enccfg, &flags, &img_fmt))
997  return AVERROR(EINVAL);
998  }
999 #endif
1000 
1001  if(!avctx->bit_rate)
1002  if(avctx->rc_max_rate || avctx->rc_buffer_size || avctx->rc_initial_buffer_occupancy) {
1003  av_log( avctx, AV_LOG_ERROR, "Rate control parameters set without a bitrate\n");
1004  return AVERROR(EINVAL);
1005  }
1006 
1007  dump_enc_cfg(avctx, &enccfg, AV_LOG_DEBUG);
1008 
1009  enccfg.g_w = avctx->width;
1010  enccfg.g_h = avctx->height;
1011  enccfg.g_timebase.num = avctx->time_base.num;
1012  enccfg.g_timebase.den = avctx->time_base.den;
1013  enccfg.g_threads =
1015  enccfg.g_lag_in_frames= ctx->lag_in_frames;
1016 
1017  if (avctx->flags & AV_CODEC_FLAG_PASS1)
1018  enccfg.g_pass = VPX_RC_FIRST_PASS;
1019  else if (avctx->flags & AV_CODEC_FLAG_PASS2)
1020  enccfg.g_pass = VPX_RC_LAST_PASS;
1021  else
1022  enccfg.g_pass = VPX_RC_ONE_PASS;
1023 
1024  if (avctx->rc_min_rate == avctx->rc_max_rate &&
1025  avctx->rc_min_rate == avctx->bit_rate && avctx->bit_rate) {
1026  enccfg.rc_end_usage = VPX_CBR;
1027  } else if (ctx->crf >= 0) {
1028  enccfg.rc_end_usage = VPX_CQ;
1029 #if CONFIG_LIBVPX_VP9_ENCODER
1030  if (!avctx->bit_rate && avctx->codec_id == AV_CODEC_ID_VP9)
1031  enccfg.rc_end_usage = VPX_Q;
1032 #endif
1033  }
1034 
1035  if (avctx->bit_rate) {
1036  enccfg.rc_target_bitrate = av_rescale_rnd(avctx->bit_rate, 1, 1000,
1038 #if CONFIG_LIBVPX_VP9_ENCODER
1039  enccfg.ss_target_bitrate[0] = enccfg.rc_target_bitrate;
1040 #endif
1041  } else {
1042  // Set bitrate to default value. Also sets CRF to default if needed.
1043  set_vpx_defaults(avctx, &enccfg);
1044  }
1045 
1046  if (avctx->codec_id == AV_CODEC_ID_VP9 && ctx->lossless == 1) {
1047  enccfg.rc_min_quantizer =
1048  enccfg.rc_max_quantizer = 0;
1049  } else {
1050  if (avctx->qmin >= 0)
1051  enccfg.rc_min_quantizer = avctx->qmin;
1052  if (avctx->qmax >= 0)
1053  enccfg.rc_max_quantizer = avctx->qmax;
1054  }
1055 
1056  if (enccfg.rc_end_usage == VPX_CQ
1057 #if CONFIG_LIBVPX_VP9_ENCODER
1058  || enccfg.rc_end_usage == VPX_Q
1059 #endif
1060  ) {
1061  if (ctx->crf < enccfg.rc_min_quantizer || ctx->crf > enccfg.rc_max_quantizer) {
1062  av_log(avctx, AV_LOG_ERROR,
1063  "CQ level %d must be between minimum and maximum quantizer value (%d-%d)\n",
1064  ctx->crf, enccfg.rc_min_quantizer, enccfg.rc_max_quantizer);
1065  return AVERROR(EINVAL);
1066  }
1067  }
1068 
1069  enccfg.rc_dropframe_thresh = ctx->drop_threshold;
1070 
1071  //0-100 (0 => CBR, 100 => VBR)
1072  enccfg.rc_2pass_vbr_bias_pct = lrint(avctx->qcompress * 100);
1073  if (avctx->bit_rate)
1074  enccfg.rc_2pass_vbr_minsection_pct =
1075  avctx->rc_min_rate * 100LL / avctx->bit_rate;
1076  if (avctx->rc_max_rate)
1077  enccfg.rc_2pass_vbr_maxsection_pct =
1078  avctx->rc_max_rate * 100LL / avctx->bit_rate;
1079 #if CONFIG_LIBVPX_VP9_ENCODER
1080  if (avctx->codec_id == AV_CODEC_ID_VP9) {
1081 #if VPX_ENCODER_ABI_VERSION >= 14
1082  if (ctx->corpus_complexity >= 0)
1083  enccfg.rc_2pass_vbr_corpus_complexity = ctx->corpus_complexity;
1084 #endif
1085  }
1086 #endif
1087 
1088  if (avctx->rc_buffer_size)
1089  enccfg.rc_buf_sz =
1090  avctx->rc_buffer_size * 1000LL / avctx->bit_rate;
1091  if (avctx->rc_initial_buffer_occupancy)
1092  enccfg.rc_buf_initial_sz =
1093  avctx->rc_initial_buffer_occupancy * 1000LL / avctx->bit_rate;
1094  enccfg.rc_buf_optimal_sz = enccfg.rc_buf_sz * 5 / 6;
1095  if (ctx->rc_undershoot_pct >= 0)
1096  enccfg.rc_undershoot_pct = ctx->rc_undershoot_pct;
1097  if (ctx->rc_overshoot_pct >= 0)
1098  enccfg.rc_overshoot_pct = ctx->rc_overshoot_pct;
1099 
1100  //_enc_init() will balk if kf_min_dist differs from max w/VPX_KF_AUTO
1101  if (avctx->keyint_min >= 0 && avctx->keyint_min == avctx->gop_size)
1102  enccfg.kf_min_dist = avctx->keyint_min;
1103  if (avctx->gop_size >= 0)
1104  enccfg.kf_max_dist = avctx->gop_size;
1105 
1106  if (enccfg.g_pass == VPX_RC_FIRST_PASS)
1107  enccfg.g_lag_in_frames = 0;
1108  else if (enccfg.g_pass == VPX_RC_LAST_PASS) {
1109  int decode_size, ret;
1110 
1111  if (!avctx->stats_in) {
1112  av_log(avctx, AV_LOG_ERROR, "No stats file for second pass\n");
1113  return AVERROR_INVALIDDATA;
1114  }
1115 
1116  ctx->twopass_stats.sz = strlen(avctx->stats_in) * 3 / 4;
1117  ret = av_reallocp(&ctx->twopass_stats.buf, ctx->twopass_stats.sz);
1118  if (ret < 0) {
1119  av_log(avctx, AV_LOG_ERROR,
1120  "Stat buffer alloc (%"SIZE_SPECIFIER" bytes) failed\n",
1121  ctx->twopass_stats.sz);
1122  ctx->twopass_stats.sz = 0;
1123  return ret;
1124  }
1125  decode_size = av_base64_decode(ctx->twopass_stats.buf, avctx->stats_in,
1126  ctx->twopass_stats.sz);
1127  if (decode_size < 0) {
1128  av_log(avctx, AV_LOG_ERROR, "Stat buffer decode failed\n");
1129  return AVERROR_INVALIDDATA;
1130  }
1131 
1132  ctx->twopass_stats.sz = decode_size;
1133  enccfg.rc_twopass_stats_in = ctx->twopass_stats;
1134  }
1135 
1136  /* 0-3: For non-zero values the encoder increasingly optimizes for reduced
1137  complexity playback on low powered devices at the expense of encode
1138  quality. */
1139  if (avctx->profile != AV_PROFILE_UNKNOWN)
1140  enccfg.g_profile = avctx->profile;
1141 
1142  enccfg.g_error_resilient = ctx->error_resilient || ctx->flags & VP8F_ERROR_RESILIENT;
1143 
1144  while ((en = av_dict_iterate(ctx->vpx_ts_parameters, en))) {
1145  if (vpx_ts_param_parse(ctx, &enccfg, en->key, en->value, avctx->codec_id) < 0)
1146  av_log(avctx, AV_LOG_WARNING,
1147  "Error parsing option '%s = %s'.\n",
1148  en->key, en->value);
1149  }
1150 
1151  /* Construct Encoder Context */
1152  res = vpx_codec_enc_init(&ctx->encoder, iface, &enccfg, flags);
1153  if (res != VPX_CODEC_OK) {
1154  dump_enc_cfg(avctx, &enccfg, AV_LOG_WARNING);
1155  log_encoder_error(avctx, "Failed to initialize encoder");
1156  return AVERROR(EINVAL);
1157  }
1158  dump_enc_cfg(avctx, &enccfg, AV_LOG_DEBUG);
1159 
1160 #if CONFIG_LIBVPX_VP9_ENCODER
1161  if (avctx->codec_id == AV_CODEC_ID_VP9 && enccfg.ts_number_layers > 1) {
1162  memset(&svc_params, 0, sizeof(svc_params));
1163  for (int i = 0; i < enccfg.ts_number_layers; ++i) {
1164  svc_params.max_quantizers[i] = enccfg.rc_max_quantizer;
1165  svc_params.min_quantizers[i] = enccfg.rc_min_quantizer;
1166  }
1167  svc_params.scaling_factor_num[0] = enccfg.g_h;
1168  svc_params.scaling_factor_den[0] = enccfg.g_h;
1169 #if VPX_ENCODER_ABI_VERSION >= 12
1170  codecctl_int(avctx, VP9E_SET_SVC, 1);
1171  codecctl_intp(avctx, VP9E_SET_SVC_PARAMETERS, (int *)&svc_params);
1172 #endif
1173  }
1174 #endif
1175  if (ctx->is_alpha) {
1176  enccfg_alpha = enccfg;
1177  res = vpx_codec_enc_init(&ctx->encoder_alpha, iface, &enccfg_alpha, flags);
1178  if (res != VPX_CODEC_OK) {
1179  log_encoder_error(avctx, "Failed to initialize alpha encoder");
1180  return AVERROR(EINVAL);
1181  }
1182  }
1183 
1184  //codec control failures are currently treated only as warnings
1185  av_log(avctx, AV_LOG_DEBUG, "vpx_codec_control\n");
1186  codecctl_int(avctx, VP8E_SET_CPUUSED, ctx->cpu_used);
1187  if (ctx->flags & VP8F_AUTO_ALT_REF)
1188  ctx->auto_alt_ref = 1;
1189  if (ctx->auto_alt_ref >= 0)
1190  codecctl_int(avctx, VP8E_SET_ENABLEAUTOALTREF,
1191  avctx->codec_id == AV_CODEC_ID_VP8 ? !!ctx->auto_alt_ref : ctx->auto_alt_ref);
1192  if (ctx->arnr_max_frames >= 0)
1193  codecctl_int(avctx, VP8E_SET_ARNR_MAXFRAMES, ctx->arnr_max_frames);
1194  if (ctx->arnr_strength >= 0)
1195  codecctl_int(avctx, VP8E_SET_ARNR_STRENGTH, ctx->arnr_strength);
1196  if (ctx->arnr_type >= 0)
1197  codecctl_int(avctx, VP8E_SET_ARNR_TYPE, ctx->arnr_type);
1198  if (ctx->tune >= 0)
1199  codecctl_int(avctx, VP8E_SET_TUNING, ctx->tune);
1200 
1201  if (ctx->auto_alt_ref && ctx->is_alpha && avctx->codec_id == AV_CODEC_ID_VP8) {
1202  av_log(avctx, AV_LOG_ERROR, "Transparency encoding with auto_alt_ref does not work\n");
1203  return AVERROR(EINVAL);
1204  }
1205 
1206  if (ctx->sharpness >= 0)
1207  codecctl_int(avctx, VP8E_SET_SHARPNESS, ctx->sharpness);
1208 
1209  if (CONFIG_LIBVPX_VP8_ENCODER && avctx->codec_id == AV_CODEC_ID_VP8) {
1210  codecctl_int(avctx, VP8E_SET_NOISE_SENSITIVITY, ctx->noise_sensitivity);
1211  codecctl_int(avctx, VP8E_SET_TOKEN_PARTITIONS, av_log2(avctx->slices));
1212  }
1213  codecctl_int(avctx, VP8E_SET_STATIC_THRESHOLD, ctx->static_thresh);
1214  if (ctx->crf >= 0)
1215  codecctl_int(avctx, VP8E_SET_CQ_LEVEL, ctx->crf);
1216  if (ctx->max_intra_rate >= 0)
1217  codecctl_int(avctx, VP8E_SET_MAX_INTRA_BITRATE_PCT, ctx->max_intra_rate);
1218 
1219 #if CONFIG_LIBVPX_VP9_ENCODER
1220  if (avctx->codec_id == AV_CODEC_ID_VP9) {
1221  if (ctx->lossless >= 0)
1222  codecctl_int(avctx, VP9E_SET_LOSSLESS, ctx->lossless);
1223  if (ctx->tile_columns >= 0)
1224  codecctl_int(avctx, VP9E_SET_TILE_COLUMNS, ctx->tile_columns);
1225  if (ctx->tile_rows >= 0)
1226  codecctl_int(avctx, VP9E_SET_TILE_ROWS, ctx->tile_rows);
1227  if (ctx->frame_parallel >= 0)
1228  codecctl_int(avctx, VP9E_SET_FRAME_PARALLEL_DECODING, ctx->frame_parallel);
1229  if (ctx->aq_mode >= 0)
1230  codecctl_int(avctx, VP9E_SET_AQ_MODE, ctx->aq_mode);
1231  set_colorspace(avctx);
1232 #if VPX_ENCODER_ABI_VERSION >= 11
1233  set_color_range(avctx);
1234 #endif
1235 #if VPX_ENCODER_ABI_VERSION >= 12
1236  codecctl_int(avctx, VP9E_SET_TARGET_LEVEL, ctx->level < 0 ? 255 : lrint(ctx->level * 10));
1237 #endif
1238 #ifdef VPX_CTRL_VP9E_SET_ROW_MT
1239  if (ctx->row_mt >= 0)
1240  codecctl_int(avctx, VP9E_SET_ROW_MT, ctx->row_mt);
1241 #endif
1242 #ifdef VPX_CTRL_VP9E_SET_TUNE_CONTENT
1243  if (ctx->tune_content >= 0)
1244  codecctl_int(avctx, VP9E_SET_TUNE_CONTENT, ctx->tune_content);
1245 #endif
1246 #ifdef VPX_CTRL_VP9E_SET_TPL
1247  if (ctx->tpl_model >= 0)
1248  codecctl_int(avctx, VP9E_SET_TPL, ctx->tpl_model);
1249 #endif
1250 #ifdef VPX_CTRL_VP9E_SET_MIN_GF_INTERVAL
1251  if (ctx->min_gf_interval >= 0)
1252  codecctl_int(avctx, VP9E_SET_MIN_GF_INTERVAL, ctx->min_gf_interval);
1253 #endif
1254  }
1255 #endif
1256  if (avctx->codec_id == AV_CODEC_ID_VP8 && ctx->screen_content_mode >= 0) {
1257  if (ctx->screen_content_mode == 2 && ctx->is_alpha) {
1258  av_log(avctx, AV_LOG_ERROR,
1259  "Transparency encoding with screen mode with aggressive rate control not supported\n");
1260  return AVERROR(EINVAL);
1261  }
1262  codecctl_int(avctx, VP8E_SET_SCREEN_CONTENT_MODE, ctx->screen_content_mode);
1263  }
1264 
1265  av_log(avctx, AV_LOG_DEBUG, "Using deadline: %d\n", ctx->deadline);
1266 
1267  //provide dummy value to initialize wrapper, values will be updated each _encode()
1268  vpx_img_wrap(&ctx->rawimg, img_fmt, avctx->width, avctx->height, 1,
1269  (unsigned char*)1);
1270 #if CONFIG_LIBVPX_VP9_ENCODER
1271  if (avctx->codec_id == AV_CODEC_ID_VP9 && (codec_caps & VPX_CODEC_CAP_HIGHBITDEPTH))
1272  ctx->rawimg.bit_depth = enccfg.g_bit_depth;
1273 #endif
1274 
1275  cpb_props = ff_encode_add_cpb_side_data(avctx);
1276  if (!cpb_props)
1277  return AVERROR(ENOMEM);
1278 
1279  if (enccfg.rc_end_usage == VPX_CBR ||
1280  enccfg.g_pass != VPX_RC_ONE_PASS) {
1281  cpb_props->max_bitrate = avctx->rc_max_rate;
1282  cpb_props->min_bitrate = avctx->rc_min_rate;
1283  cpb_props->avg_bitrate = avctx->bit_rate;
1284  }
1285  cpb_props->buffer_size = avctx->rc_buffer_size;
1286 
1287  return 0;
1288 }
1289 
1290 static inline void cx_pktcpy(struct FrameListData *dst,
1291  const struct vpx_codec_cx_pkt *src,
1292  VPxContext *ctx)
1293 {
1294  dst->pts = src->data.frame.pts;
1295  dst->flags = src->data.frame.flags;
1296  dst->sz = src->data.frame.sz;
1297  dst->buf = src->data.frame.buf;
1298  dst->have_sse = 0;
1299  /* For alt-ref frame, don't store PSNR */
1300  if (!(dst->flags & VPX_FRAME_IS_INVISIBLE)) {
1301  dst->have_sse = ctx->have_sse;
1302  if (ctx->have_sse) {
1303  /* associate last-seen SSE to the frame. */
1304  /* Transfers ownership from ctx to dst. */
1305  /* WARNING! This makes the assumption that PSNR_PKT comes
1306  just before the frame it refers to! */
1307  memcpy(dst->sse, ctx->sse, sizeof(dst->sse));
1308  ctx->have_sse = 0;
1309  }
1310  }
1311 }
1312 
1313 /**
1314  * Store coded frame information in format suitable for return from encode2().
1315  *
1316  * Write information from @a cx_frame to @a pkt
1317  * @return packet data size on success
1318  * @return a negative AVERROR on error
1319  */
1320 static int storeframe(AVCodecContext *avctx, struct FrameListData *cx_frame,
1321  struct FrameListData *alpha_cx_frame, AVPacket *pkt)
1322 {
1323  VPxContext *ctx = avctx->priv_data;
1324  int ret = ff_get_encode_buffer(avctx, pkt, cx_frame->sz, 0);
1325  uint8_t *side_data;
1326  enum AVPictureType pict_type;
1327  int quality;
1328 
1329  if (ret < 0)
1330  return ret;
1331 
1332  memcpy(pkt->data, cx_frame->buf, pkt->size);
1333  pkt->pts = pkt->dts = cx_frame->pts;
1334 
1335  if (!!(cx_frame->flags & VPX_FRAME_IS_KEY)) {
1336  pict_type = AV_PICTURE_TYPE_I;
1338  } else {
1339  pict_type = AV_PICTURE_TYPE_P;
1340  }
1341 
1342  ret = vpx_codec_control(&ctx->encoder, VP8E_GET_LAST_QUANTIZER_64, &quality);
1343  if (ret != VPX_CODEC_OK)
1344  quality = 0;
1346  cx_frame->have_sse ? 3 : 0, pict_type);
1347 
1348  if (cx_frame->have_sse) {
1349  /* Beware of the Y/U/V/all order! */
1350  for (int i = 0; i < 3; ++i)
1351  avctx->error[i] += cx_frame->sse[i + 1];
1352  cx_frame->have_sse = 0;
1353  }
1354  if (alpha_cx_frame) {
1355  side_data = av_packet_new_side_data(pkt,
1357  alpha_cx_frame->sz + 8);
1358  if (!side_data) {
1360  return AVERROR(ENOMEM);
1361  }
1362  AV_WB64(side_data, 1);
1363  memcpy(side_data + 8, alpha_cx_frame->buf, alpha_cx_frame->sz);
1364  }
1365  ret = frame_data_apply(avctx, ctx->fifo, pkt);
1366  if (ret < 0)
1367  return ret;
1368 
1369  return pkt->size;
1370 }
1371 
1372 /**
1373  * Queue multiple output frames from the encoder, returning the front-most.
1374  * In cases where vpx_codec_get_cx_data() returns more than 1 frame append
1375  * the frame queue. Return the head frame if available.
1376  * @return Stored frame size
1377  * @return AVERROR(EINVAL) on output size error
1378  * @return AVERROR(ENOMEM) on coded frame queue data allocation error
1379  */
1380 static int queue_frames(AVCodecContext *avctx, struct vpx_codec_ctx *encoder,
1381  struct FrameListData **frame_list, AVPacket *pkt_out)
1382 {
1383  VPxContext *ctx = avctx->priv_data;
1384  const struct vpx_codec_cx_pkt *pkt;
1385  const void *iter = NULL;
1386  int size = 0;
1387 
1388  if (!ctx->is_alpha && *frame_list) {
1389  struct FrameListData *cx_frame = *frame_list;
1390  /* return the leading frame if we've already begun queueing */
1391  size = storeframe(avctx, cx_frame, NULL, pkt_out);
1392  if (size < 0)
1393  return size;
1394  *frame_list = cx_frame->next;
1395  free_coded_frame(cx_frame);
1396  }
1397 
1398  /* consume all available output from the encoder before returning. buffers
1399  are only good through the next vpx_codec call */
1400  while (pkt = vpx_codec_get_cx_data(encoder, &iter)) {
1401  switch (pkt->kind) {
1402  case VPX_CODEC_CX_FRAME_PKT:
1403  if (!ctx->is_alpha && !size) {
1404  struct FrameListData cx_frame;
1405 
1406  /* avoid storing the frame when the list is empty and we haven't yet
1407  provided a frame for output */
1408  av_assert0(!ctx->coded_frame_list);
1409  cx_pktcpy(&cx_frame, pkt, ctx);
1410  size = storeframe(avctx, &cx_frame, NULL, pkt_out);
1411  if (size < 0)
1412  return size;
1413  } else {
1414  struct FrameListData *cx_frame = av_malloc(sizeof(*cx_frame));
1415 
1416  if (!cx_frame) {
1417  av_log(avctx, AV_LOG_ERROR,
1418  "Frame queue element alloc failed\n");
1419  return AVERROR(ENOMEM);
1420  }
1421  cx_pktcpy(cx_frame, pkt, ctx);
1422  cx_frame->buf = av_malloc(cx_frame->sz);
1423 
1424  if (!cx_frame->buf) {
1425  av_log(avctx, AV_LOG_ERROR,
1426  "Data buffer alloc (%"SIZE_SPECIFIER" bytes) failed\n",
1427  cx_frame->sz);
1428  av_freep(&cx_frame);
1429  return AVERROR(ENOMEM);
1430  }
1431  memcpy(cx_frame->buf, pkt->data.frame.buf, pkt->data.frame.sz);
1432  coded_frame_add(frame_list, cx_frame);
1433  }
1434  break;
1435  case VPX_CODEC_STATS_PKT: {
1436  struct vpx_fixed_buf *stats = &ctx->twopass_stats;
1437  uint8_t *tmp;
1438  if (!pkt_out)
1439  break;
1440  tmp = av_fast_realloc(stats->buf,
1441  &ctx->twopass_stats_size,
1442  stats->sz +
1443  pkt->data.twopass_stats.sz);
1444  if (!tmp) {
1445  av_freep(&stats->buf);
1446  stats->sz = 0;
1447  av_log(avctx, AV_LOG_ERROR, "Stat buffer realloc failed\n");
1448  return AVERROR(ENOMEM);
1449  }
1450  stats->buf = tmp;
1451  memcpy((uint8_t*)stats->buf + stats->sz,
1452  pkt->data.twopass_stats.buf, pkt->data.twopass_stats.sz);
1453  stats->sz += pkt->data.twopass_stats.sz;
1454  break;
1455  }
1456  case VPX_CODEC_PSNR_PKT:
1457  if (!pkt_out)
1458  break;
1459  av_assert0(!ctx->have_sse);
1460  ctx->sse[0] = pkt->data.psnr.sse[0];
1461  ctx->sse[1] = pkt->data.psnr.sse[1];
1462  ctx->sse[2] = pkt->data.psnr.sse[2];
1463  ctx->sse[3] = pkt->data.psnr.sse[3];
1464  ctx->have_sse = 1;
1465  break;
1466  case VPX_CODEC_CUSTOM_PKT:
1467  //ignore unsupported/unrecognized packet types
1468  break;
1469  }
1470  }
1471 
1472  return size;
1473 }
1474 
1475 static int set_roi_map(AVCodecContext *avctx, const AVFrameSideData *sd, int frame_width, int frame_height,
1476  vpx_roi_map_t *roi_map, int block_size, int segment_cnt)
1477 {
1478  /**
1479  * range of vpx_roi_map_t.delta_q[i] is [-63, 63]
1480  */
1481 #define MAX_DELTA_Q 63
1482 
1483  const AVRegionOfInterest *roi = NULL;
1484  int nb_rois;
1485  uint32_t self_size;
1486  int segment_id;
1487 
1488  /* record the mapping from delta_q to "segment id + 1" in segment_mapping[].
1489  * the range of delta_q is [-MAX_DELTA_Q, MAX_DELTA_Q],
1490  * and its corresponding array index is [0, 2 * MAX_DELTA_Q],
1491  * and so the length of the mapping array is 2 * MAX_DELTA_Q + 1.
1492  * "segment id + 1", so we can say there's no mapping if the value of array element is zero.
1493  */
1494  int segment_mapping[2 * MAX_DELTA_Q + 1] = { 0 };
1495 
1496  memset(roi_map, 0, sizeof(*roi_map));
1497 
1498  /* segment id 0 in roi_map is reserved for the areas not covered by AVRegionOfInterest.
1499  * segment id 0 in roi_map is also for the areas with AVRegionOfInterest.qoffset near 0.
1500  * (delta_q of segment id 0 is 0).
1501  */
1502  segment_mapping[MAX_DELTA_Q] = 1;
1503  segment_id = 1;
1504 
1505  roi = (const AVRegionOfInterest*)sd->data;
1506  self_size = roi->self_size;
1507  if (!self_size || sd->size % self_size) {
1508  av_log(avctx, AV_LOG_ERROR, "Invalid AVRegionOfInterest.self_size.\n");
1509  return AVERROR(EINVAL);
1510  }
1511  nb_rois = sd->size / self_size;
1512 
1513  /* This list must be iterated from zero because regions are
1514  * defined in order of decreasing importance. So discard less
1515  * important areas if they exceed the segment count.
1516  */
1517  for (int i = 0; i < nb_rois; i++) {
1518  int delta_q;
1519  int mapping_index;
1520 
1521  roi = (const AVRegionOfInterest*)(sd->data + self_size * i);
1522  if (!roi->qoffset.den) {
1523  av_log(avctx, AV_LOG_ERROR, "AVRegionOfInterest.qoffset.den must not be zero.\n");
1524  return AVERROR(EINVAL);
1525  }
1526 
1527  delta_q = (int)(roi->qoffset.num * 1.0f / roi->qoffset.den * MAX_DELTA_Q);
1529 
1530  mapping_index = delta_q + MAX_DELTA_Q;
1531  if (!segment_mapping[mapping_index]) {
1532  if (segment_id == segment_cnt) {
1533  av_log(avctx, AV_LOG_WARNING,
1534  "ROI only supports %d segments (and segment 0 is reserved for non-ROIs), skipping the left ones.\n",
1535  segment_cnt);
1536  break;
1537  }
1538 
1539  segment_mapping[mapping_index] = segment_id + 1;
1540  roi_map->delta_q[segment_id] = delta_q;
1541  segment_id++;
1542  }
1543  }
1544 
1545  roi_map->rows = (frame_height + block_size - 1) / block_size;
1546  roi_map->cols = (frame_width + block_size - 1) / block_size;
1547  roi_map->roi_map = av_calloc(roi_map->rows * roi_map->cols, sizeof(*roi_map->roi_map));
1548  if (!roi_map->roi_map) {
1549  av_log(avctx, AV_LOG_ERROR, "roi_map alloc failed.\n");
1550  return AVERROR(ENOMEM);
1551  }
1552 
1553  /* This list must be iterated in reverse, so for the case that
1554  * two regions are overlapping, the more important area takes effect.
1555  */
1556  for (int i = nb_rois - 1; i >= 0; i--) {
1557  int delta_q;
1558  int mapping_value;
1559  int starty, endy, startx, endx;
1560 
1561  roi = (const AVRegionOfInterest*)(sd->data + self_size * i);
1562 
1563  starty = av_clip(roi->top / block_size, 0, roi_map->rows);
1564  endy = av_clip((roi->bottom + block_size - 1) / block_size, 0, roi_map->rows);
1565  startx = av_clip(roi->left / block_size, 0, roi_map->cols);
1566  endx = av_clip((roi->right + block_size - 1) / block_size, 0, roi_map->cols);
1567 
1568  delta_q = (int)(roi->qoffset.num * 1.0f / roi->qoffset.den * MAX_DELTA_Q);
1570 
1571  mapping_value = segment_mapping[delta_q + MAX_DELTA_Q];
1572  if (mapping_value) {
1573  for (int y = starty; y < endy; y++)
1574  for (int x = startx; x < endx; x++)
1575  roi_map->roi_map[x + y * roi_map->cols] = mapping_value - 1;
1576  }
1577  }
1578 
1579  return 0;
1580 }
1581 
1582 static int vp9_encode_set_roi(AVCodecContext *avctx, int frame_width, int frame_height, const AVFrameSideData *sd)
1583 {
1584  VPxContext *ctx = avctx->priv_data;
1585 
1586 #ifdef VPX_CTRL_VP9E_SET_ROI_MAP
1587  int version = vpx_codec_version();
1588  int major = VPX_VERSION_MAJOR(version);
1589  int minor = VPX_VERSION_MINOR(version);
1590  int patch = VPX_VERSION_PATCH(version);
1591 
1592  if (major > 1 || (major == 1 && minor > 8) || (major == 1 && minor == 8 && patch >= 1)) {
1593  vpx_roi_map_t roi_map;
1594  const int segment_cnt = 8;
1595  const int block_size = 8;
1596  int ret;
1597 
1598  if (ctx->aq_mode > 0 || ctx->cpu_used < 5 || ctx->deadline != VPX_DL_REALTIME) {
1599  if (!ctx->roi_warned) {
1600  ctx->roi_warned = 1;
1601  av_log(avctx, AV_LOG_WARNING, "ROI is only enabled when aq_mode is 0, cpu_used >= 5 "
1602  "and deadline is REALTIME, so skipping ROI.\n");
1603  return AVERROR(EINVAL);
1604  }
1605  }
1606 
1607  ret = set_roi_map(avctx, sd, frame_width, frame_height, &roi_map, block_size, segment_cnt);
1608  if (ret) {
1609  log_encoder_error(avctx, "Failed to set_roi_map.\n");
1610  return ret;
1611  }
1612 
1613  memset(roi_map.ref_frame, -1, sizeof(roi_map.ref_frame));
1614 
1615  if (vpx_codec_control(&ctx->encoder, VP9E_SET_ROI_MAP, &roi_map)) {
1616  log_encoder_error(avctx, "Failed to set VP9E_SET_ROI_MAP codec control.\n");
1618  }
1619  av_freep(&roi_map.roi_map);
1620  return ret;
1621  }
1622 #endif
1623 
1624  if (!ctx->roi_warned) {
1625  ctx->roi_warned = 1;
1626  av_log(avctx, AV_LOG_WARNING, "ROI is not supported, please upgrade libvpx to version >= 1.8.1. "
1627  "You may need to rebuild ffmpeg.\n");
1628  }
1629  return 0;
1630 }
1631 
1632 static int vp8_encode_set_roi(AVCodecContext *avctx, int frame_width, int frame_height, const AVFrameSideData *sd)
1633 {
1634  vpx_roi_map_t roi_map;
1635  const int segment_cnt = 4;
1636  const int block_size = 16;
1637  VPxContext *ctx = avctx->priv_data;
1638 
1639  int ret = set_roi_map(avctx, sd, frame_width, frame_height, &roi_map, block_size, segment_cnt);
1640  if (ret) {
1641  log_encoder_error(avctx, "Failed to set_roi_map.\n");
1642  return ret;
1643  }
1644 
1645  if (vpx_codec_control(&ctx->encoder, VP8E_SET_ROI_MAP, &roi_map)) {
1646  log_encoder_error(avctx, "Failed to set VP8E_SET_ROI_MAP codec control.\n");
1648  }
1649 
1650  av_freep(&roi_map.roi_map);
1651  return ret;
1652 }
1653 
1654 static int realloc_alpha_uv(AVCodecContext *avctx, int width, int height)
1655 {
1656  VPxContext *ctx = avctx->priv_data;
1657  struct vpx_image *rawimg_alpha = &ctx->rawimg_alpha;
1658  unsigned char **planes = rawimg_alpha->planes;
1659  int *stride = rawimg_alpha->stride;
1660 
1661  if (!planes[VPX_PLANE_U] ||
1662  !planes[VPX_PLANE_V] ||
1663  width != (int)rawimg_alpha->d_w ||
1664  height != (int)rawimg_alpha->d_h) {
1665  av_freep(&planes[VPX_PLANE_U]);
1666  av_freep(&planes[VPX_PLANE_V]);
1667 
1668  vpx_img_wrap(rawimg_alpha, VPX_IMG_FMT_I420, width, height, 1,
1669  (unsigned char*)1);
1670  planes[VPX_PLANE_U] = av_malloc_array(stride[VPX_PLANE_U], height);
1671  planes[VPX_PLANE_V] = av_malloc_array(stride[VPX_PLANE_V], height);
1672  if (!planes[VPX_PLANE_U] || !planes[VPX_PLANE_V])
1673  return AVERROR(ENOMEM);
1674 
1675  memset(planes[VPX_PLANE_U], 0x80, stride[VPX_PLANE_U] * height);
1676  memset(planes[VPX_PLANE_V], 0x80, stride[VPX_PLANE_V] * height);
1677  }
1678 
1679  return 0;
1680 }
1681 
1683  const AVFrame *frame, int *got_packet)
1684 {
1685  VPxContext *ctx = avctx->priv_data;
1686  struct vpx_image *rawimg = NULL;
1687  struct vpx_image *rawimg_alpha = NULL;
1688  int64_t timestamp = 0;
1689  int res, coded_size;
1690  vpx_enc_frame_flags_t flags = 0;
1691  const struct vpx_codec_enc_cfg *enccfg = ctx->encoder.config.enc;
1692  vpx_svc_layer_id_t layer_id;
1693  int layer_id_valid = 0;
1694  unsigned long duration = 0;
1695 
1696  if (avctx->qmax >= 0 && enccfg->rc_max_quantizer != avctx->qmax) {
1697  struct vpx_codec_enc_cfg cfg = *enccfg;
1698  cfg.rc_max_quantizer = avctx->qmax;
1699  res = vpx_codec_enc_config_set(&ctx->encoder, &cfg);
1700  if (res != VPX_CODEC_OK) {
1701  log_encoder_error(avctx, "Error reconfiguring encoder");
1702  return AVERROR_INVALIDDATA;
1703  }
1704  }
1705 
1706  if (frame) {
1708  rawimg = &ctx->rawimg;
1709  rawimg->planes[VPX_PLANE_Y] = frame->data[0];
1710  rawimg->planes[VPX_PLANE_U] = frame->data[1];
1711  rawimg->planes[VPX_PLANE_V] = frame->data[2];
1712  rawimg->stride[VPX_PLANE_Y] = frame->linesize[0];
1713  rawimg->stride[VPX_PLANE_U] = frame->linesize[1];
1714  rawimg->stride[VPX_PLANE_V] = frame->linesize[2];
1715  if (ctx->is_alpha) {
1716  rawimg_alpha = &ctx->rawimg_alpha;
1717  res = realloc_alpha_uv(avctx, frame->width, frame->height);
1718  if (res < 0)
1719  return res;
1720  rawimg_alpha->planes[VPX_PLANE_Y] = frame->data[3];
1721  rawimg_alpha->stride[VPX_PLANE_Y] = frame->linesize[3];
1722  }
1723  timestamp = frame->pts;
1724 #if VPX_IMAGE_ABI_VERSION >= 4
1725  switch (frame->color_range) {
1726  case AVCOL_RANGE_MPEG:
1727  rawimg->range = VPX_CR_STUDIO_RANGE;
1728  break;
1729  case AVCOL_RANGE_JPEG:
1730  rawimg->range = VPX_CR_FULL_RANGE;
1731  break;
1732  }
1733 #endif
1734  if (frame->pict_type == AV_PICTURE_TYPE_I)
1735  flags |= VPX_EFLAG_FORCE_KF;
1736  if (frame->metadata) {
1737  AVDictionaryEntry* en = av_dict_get(frame->metadata, "vp8-flags", NULL, 0);
1738  if (en) {
1739  flags |= strtoul(en->value, NULL, 10);
1740  }
1741 
1742  memset(&layer_id, 0, sizeof(layer_id));
1743 
1744  en = av_dict_get(frame->metadata, "temporal_id", NULL, 0);
1745  if (en) {
1746  layer_id.temporal_layer_id = strtoul(en->value, NULL, 10);
1747 #ifdef VPX_CTRL_VP9E_SET_MAX_INTER_BITRATE_PCT
1748  layer_id.temporal_layer_id_per_spatial[0] = layer_id.temporal_layer_id;
1749 #endif
1750  layer_id_valid = 1;
1751  }
1752 #if CONFIG_LIBVPX_VP9_ENCODER && defined(VPX_CTRL_VP9E_SET_MAX_INTER_BITRATE_PCT)
1753  en = av_dict_get(frame->metadata, "ref-frame-config", NULL, 0);
1754 
1755  if (en) {
1756  if (avctx->codec_id == AV_CODEC_ID_VP9) {
1757  int ret = vpx_parse_ref_frame_config(&ctx->ref_frame_config,
1758  enccfg->ss_number_layers, en->value);
1759  if (ret < 0) {
1760  av_log(avctx, AV_LOG_WARNING,
1761  "Error parsing ref_frame_config option %s.\n", en->value);
1762  return ret;
1763  }
1764 
1765  codecctl_intp(avctx, VP9E_SET_SVC_REF_FRAME_CONFIG, (int *)&ctx->ref_frame_config);
1766  } else {
1767  av_log(avctx, AV_LOG_WARNING,
1768  "Ignoring ref-frame-config for a non-VP9 codec\n");
1769  }
1770  }
1771 #endif
1772  }
1773 
1774  if (sd) {
1775  if (avctx->codec_id == AV_CODEC_ID_VP8) {
1776  vp8_encode_set_roi(avctx, frame->width, frame->height, sd);
1777  } else {
1778  vp9_encode_set_roi(avctx, frame->width, frame->height, sd);
1779  }
1780  }
1781 
1782  if (!(avctx->flags & AV_CODEC_FLAG_PASS1)) {
1783  res = frame_data_submit(avctx, ctx->fifo, frame);
1784  if (res < 0)
1785  return res;
1786  }
1787  }
1788 
1789  // this is for encoding with preset temporal layering patterns defined in
1790  // set_temporal_layer_pattern function.
1791  if (enccfg->ts_number_layers > 1 && ctx->ts_layer_flags) {
1792  if (flags & VPX_EFLAG_FORCE_KF) {
1793  // keyframe, reset temporal layering.
1794  ctx->current_temporal_idx = 0;
1795  flags = VPX_EFLAG_FORCE_KF;
1796  } else {
1797  flags = 0;
1798  }
1799 
1800  /* get the flags from the temporal layer configuration. */
1801  flags |= ctx->ts_layer_flags[ctx->current_temporal_idx];
1802 
1803  memset(&layer_id, 0, sizeof(layer_id));
1804 #if VPX_ENCODER_ABI_VERSION >= 12
1805  layer_id.spatial_layer_id = 0;
1806 #endif
1807  layer_id.temporal_layer_id = enccfg->ts_layer_id[ctx->current_temporal_idx];
1808 #ifdef VPX_CTRL_VP9E_SET_MAX_INTER_BITRATE_PCT
1809  layer_id.temporal_layer_id_per_spatial[0] = layer_id.temporal_layer_id;
1810 #endif
1811  layer_id_valid = 1;
1812  }
1813 
1814  if (layer_id_valid) {
1815  if (avctx->codec_id == AV_CODEC_ID_VP8) {
1816  codecctl_int(avctx, VP8E_SET_TEMPORAL_LAYER_ID, layer_id.temporal_layer_id);
1817  }
1818 #if CONFIG_LIBVPX_VP9_ENCODER && VPX_ENCODER_ABI_VERSION >= 12
1819  else if (avctx->codec_id == AV_CODEC_ID_VP9) {
1820  codecctl_intp(avctx, VP9E_SET_SVC_LAYER_ID, (int *)&layer_id);
1821  }
1822 #endif
1823  }
1824 
1825  if (frame && frame->duration > ULONG_MAX) {
1826  av_log(avctx, AV_LOG_WARNING,
1827  "Frame duration too large: %"PRId64"\n", frame->duration);
1828  } else if (frame && frame->duration)
1829  duration = frame->duration;
1830  else if (avctx->framerate.num > 0 && avctx->framerate.den > 0)
1831  duration = av_rescale_q(1, av_inv_q(avctx->framerate), avctx->time_base);
1832  else {
1833  duration = 1;
1834  }
1835 
1836  res = vpx_codec_encode(&ctx->encoder, rawimg, timestamp,
1837  duration, flags, ctx->deadline);
1838  if (res != VPX_CODEC_OK) {
1839  log_encoder_error(avctx, "Error encoding frame");
1840  return AVERROR_INVALIDDATA;
1841  }
1842 
1843  if (ctx->is_alpha) {
1844  res = vpx_codec_encode(&ctx->encoder_alpha, rawimg_alpha, timestamp,
1845  duration, flags, ctx->deadline);
1846  if (res != VPX_CODEC_OK) {
1847  log_encoder_error(avctx, "Error encoding alpha frame");
1848  return AVERROR_INVALIDDATA;
1849  }
1850  }
1851 
1852  coded_size = queue_frames(avctx, &ctx->encoder, &ctx->coded_frame_list, pkt);
1853  if (ctx->is_alpha) {
1854  queue_frames(avctx, &ctx->encoder_alpha, &ctx->alpha_coded_frame_list, NULL);
1855 
1856  if (ctx->coded_frame_list && ctx->alpha_coded_frame_list) {
1857  struct FrameListData *cx_frame = ctx->coded_frame_list;
1858  struct FrameListData *alpha_cx_frame = ctx->alpha_coded_frame_list;
1859  av_assert0(!coded_size);
1860  /* return the leading frame if we've already begun queueing */
1861  coded_size = storeframe(avctx, cx_frame, alpha_cx_frame, pkt);
1862  if (coded_size < 0)
1863  return coded_size;
1864  ctx->coded_frame_list = cx_frame->next;
1865  ctx->alpha_coded_frame_list = alpha_cx_frame->next;
1866  free_coded_frame(cx_frame);
1867  free_coded_frame(alpha_cx_frame);
1868  }
1869  }
1870 
1871  if (!frame && avctx->flags & AV_CODEC_FLAG_PASS1) {
1872  unsigned int b64_size = AV_BASE64_SIZE(ctx->twopass_stats.sz);
1873 
1874  avctx->stats_out = av_malloc(b64_size);
1875  if (!avctx->stats_out) {
1876  av_log(avctx, AV_LOG_ERROR, "Stat buffer alloc (%d bytes) failed\n",
1877  b64_size);
1878  return AVERROR(ENOMEM);
1879  }
1880  av_base64_encode(avctx->stats_out, b64_size, ctx->twopass_stats.buf,
1881  ctx->twopass_stats.sz);
1882  } else if (enccfg->ts_number_layers > 1 && ctx->ts_layer_flags) {
1883  ctx->current_temporal_idx = (ctx->current_temporal_idx + 1) % enccfg->ts_periodicity;
1884  }
1885 
1886  *got_packet = !!coded_size;
1887  return 0;
1888 }
1889 
1890 #define OFFSET(x) offsetof(VPxContext, x)
1891 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
1892 
1893 #define COMMON_OPTIONS \
1894  { "lag-in-frames", "Number of frames to look ahead for " \
1895  "alternate reference frame selection", OFFSET(lag_in_frames), AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX, VE}, \
1896  { "arnr-maxframes", "altref noise reduction max frame count", OFFSET(arnr_max_frames), AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX, VE}, \
1897  { "arnr-strength", "altref noise reduction filter strength", OFFSET(arnr_strength), AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX, VE}, \
1898  { "arnr-type", "altref noise reduction filter type", OFFSET(arnr_type), AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX, VE, .unit = "arnr_type"}, \
1899  { "backward", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = 1}, 0, 0, VE, .unit = "arnr_type" }, \
1900  { "forward", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = 2}, 0, 0, VE, .unit = "arnr_type" }, \
1901  { "centered", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = 3}, 0, 0, VE, .unit = "arnr_type" }, \
1902  { "tune", "Tune the encoding to a specific scenario", OFFSET(tune), AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX, VE, .unit = "tune"}, \
1903  { "psnr", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = VP8_TUNE_PSNR}, 0, 0, VE, .unit = "tune"}, \
1904  { "ssim", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = VP8_TUNE_SSIM}, 0, 0, VE, .unit = "tune"}, \
1905  { "deadline", "Time to spend encoding, in microseconds.", OFFSET(deadline), AV_OPT_TYPE_INT, {.i64 = VPX_DL_GOOD_QUALITY}, INT_MIN, INT_MAX, VE, .unit = "quality"}, \
1906  { "best", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = VPX_DL_BEST_QUALITY}, 0, 0, VE, .unit = "quality"}, \
1907  { "good", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = VPX_DL_GOOD_QUALITY}, 0, 0, VE, .unit = "quality"}, \
1908  { "realtime", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = VPX_DL_REALTIME}, 0, 0, VE, .unit = "quality"}, \
1909  { "error-resilient", "Error resilience configuration", OFFSET(error_resilient), AV_OPT_TYPE_FLAGS, {.i64 = 0}, INT_MIN, INT_MAX, VE, .unit = "er"}, \
1910  { "max-intra-rate", "Maximum I-frame bitrate (pct) 0=unlimited", OFFSET(max_intra_rate), AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX, VE}, \
1911  { "default", "Improve resiliency against losses of whole frames", 0, AV_OPT_TYPE_CONST, {.i64 = VPX_ERROR_RESILIENT_DEFAULT}, 0, 0, VE, .unit = "er"}, \
1912  { "partitions", "The frame partitions are independently decodable " \
1913  "by the bool decoder, meaning that partitions can be decoded even " \
1914  "though earlier partitions have been lost. Note that intra prediction" \
1915  " is still done over the partition boundary.", 0, AV_OPT_TYPE_CONST, {.i64 = VPX_ERROR_RESILIENT_PARTITIONS}, 0, 0, VE, .unit = "er"}, \
1916  { "crf", "Select the quality for constant quality mode", offsetof(VPxContext, crf), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 63, VE }, \
1917  { "static-thresh", "A change threshold on blocks below which they will be skipped by the encoder", OFFSET(static_thresh), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, VE }, \
1918  { "drop-threshold", "Frame drop threshold", offsetof(VPxContext, drop_threshold), AV_OPT_TYPE_INT, {.i64 = 0 }, INT_MIN, INT_MAX, VE }, \
1919  { "noise-sensitivity", "Noise sensitivity", OFFSET(noise_sensitivity), AV_OPT_TYPE_INT, {.i64 = 0 }, 0, 4, VE}, \
1920  { "undershoot-pct", "Datarate undershoot (min) target (%)", OFFSET(rc_undershoot_pct), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 100, VE }, \
1921  { "overshoot-pct", "Datarate overshoot (max) target (%)", OFFSET(rc_overshoot_pct), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1000, VE }, \
1922  { "ts-parameters", "Temporal scaling configuration using a :-separated list of key=value parameters", OFFSET(vpx_ts_parameters), AV_OPT_TYPE_DICT, {.str=NULL}, 0, 0, VE}, \
1923 
1924 #define LEGACY_OPTIONS \
1925  {"speed", "", offsetof(VPxContext, cpu_used), AV_OPT_TYPE_INT, {.i64 = 1}, -16, 16, VE}, \
1926  {"quality", "", offsetof(VPxContext, deadline), AV_OPT_TYPE_INT, {.i64 = VPX_DL_GOOD_QUALITY}, INT_MIN, INT_MAX, VE, .unit = "quality"}, \
1927  {"vp8flags", "", offsetof(VPxContext, flags), AV_OPT_TYPE_FLAGS, {.i64 = 0}, 0, UINT_MAX, VE, .unit = "flags"}, \
1928  {"error_resilient", "enable error resilience", 0, AV_OPT_TYPE_CONST, {.i64 = VP8F_ERROR_RESILIENT}, INT_MIN, INT_MAX, VE, .unit = "flags"}, \
1929  {"altref", "enable use of alternate reference frames (VP8/2-pass only)", 0, AV_OPT_TYPE_CONST, {.i64 = VP8F_AUTO_ALT_REF}, INT_MIN, INT_MAX, VE, .unit = "flags"}, \
1930  {"arnr_max_frames", "altref noise reduction max frame count", offsetof(VPxContext, arnr_max_frames), AV_OPT_TYPE_INT, {.i64 = 0}, 0, 15, VE}, \
1931  {"arnr_strength", "altref noise reduction filter strength", offsetof(VPxContext, arnr_strength), AV_OPT_TYPE_INT, {.i64 = 3}, 0, 6, VE}, \
1932  {"arnr_type", "altref noise reduction filter type", offsetof(VPxContext, arnr_type), AV_OPT_TYPE_INT, {.i64 = 3}, 1, 3, VE}, \
1933  {"rc_lookahead", "Number of frames to look ahead for alternate reference frame selection", offsetof(VPxContext, lag_in_frames), AV_OPT_TYPE_INT, {.i64 = 25}, 0, 25, VE}, \
1934  {"sharpness", "Increase sharpness at the expense of lower PSNR", offsetof(VPxContext, sharpness), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 7, VE},
1935 
1936 #if CONFIG_LIBVPX_VP8_ENCODER
1937 static const AVOption vp8_options[] = {
1939  { "auto-alt-ref", "Enable use of alternate reference "
1940  "frames (2-pass only)", OFFSET(auto_alt_ref), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 2, VE},
1941  { "cpu-used", "Quality/Speed ratio modifier", OFFSET(cpu_used), AV_OPT_TYPE_INT, {.i64 = 1}, -16, 16, VE},
1942  { "screen-content-mode", "Encoder screen content mode", OFFSET(screen_content_mode), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 2, VE},
1944  { NULL }
1945 };
1946 #endif
1947 
1948 #if CONFIG_LIBVPX_VP9_ENCODER
1949 static const AVOption vp9_options[] = {
1951  { "auto-alt-ref", "Enable use of alternate reference "
1952  "frames (2-pass only)", OFFSET(auto_alt_ref), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 6, VE},
1953  { "cpu-used", "Quality/Speed ratio modifier", OFFSET(cpu_used), AV_OPT_TYPE_INT, {.i64 = 1}, -8, 8, VE},
1954  { "lossless", "Lossless mode", OFFSET(lossless), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 1, VE},
1955  { "tile-columns", "Number of tile columns to use, log2", OFFSET(tile_columns), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 6, VE},
1956  { "tile-rows", "Number of tile rows to use, log2", OFFSET(tile_rows), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 2, VE},
1957  { "frame-parallel", "Enable frame parallel decodability features", OFFSET(frame_parallel), AV_OPT_TYPE_BOOL,{.i64 = -1}, -1, 1, VE},
1958 #if VPX_ENCODER_ABI_VERSION >= 12
1959  { "aq-mode", "adaptive quantization mode", OFFSET(aq_mode), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 4, VE, .unit = "aq_mode"},
1960 #else
1961  { "aq-mode", "adaptive quantization mode", OFFSET(aq_mode), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 3, VE, .unit = "aq_mode"},
1962 #endif
1963  { "none", "Aq not used", 0, AV_OPT_TYPE_CONST, {.i64 = 0}, 0, 0, VE, .unit = "aq_mode" },
1964  { "variance", "Variance based Aq", 0, AV_OPT_TYPE_CONST, {.i64 = 1}, 0, 0, VE, .unit = "aq_mode" },
1965  { "complexity", "Complexity based Aq", 0, AV_OPT_TYPE_CONST, {.i64 = 2}, 0, 0, VE, .unit = "aq_mode" },
1966  { "cyclic", "Cyclic Refresh Aq", 0, AV_OPT_TYPE_CONST, {.i64 = 3}, 0, 0, VE, .unit = "aq_mode" },
1967 #if VPX_ENCODER_ABI_VERSION >= 12
1968  { "equator360", "360 video Aq", 0, AV_OPT_TYPE_CONST, {.i64 = 4}, 0, 0, VE, .unit = "aq_mode" },
1969  {"level", "Specify level", OFFSET(level), AV_OPT_TYPE_FLOAT, {.dbl=-1}, -1, 6.2, VE},
1970 #endif
1971 #ifdef VPX_CTRL_VP9E_SET_ROW_MT
1972  {"row-mt", "Row based multi-threading", OFFSET(row_mt), AV_OPT_TYPE_BOOL, {.i64 = -1}, -1, 1, VE},
1973 #endif
1974 #ifdef VPX_CTRL_VP9E_SET_TUNE_CONTENT
1975 #if VPX_ENCODER_ABI_VERSION >= 14
1976  { "tune-content", "Tune content type", OFFSET(tune_content), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 2, VE, .unit = "tune_content" },
1977 #else
1978  { "tune-content", "Tune content type", OFFSET(tune_content), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 1, VE, .unit = "tune_content" },
1979 #endif
1980  { "default", "Regular video content", 0, AV_OPT_TYPE_CONST, {.i64 = 0}, 0, 0, VE, .unit = "tune_content" },
1981  { "screen", "Screen capture content", 0, AV_OPT_TYPE_CONST, {.i64 = 1}, 0, 0, VE, .unit = "tune_content" },
1982 #if VPX_ENCODER_ABI_VERSION >= 14
1983  { "film", "Film content; improves grain retention", 0, AV_OPT_TYPE_CONST, {.i64 = 2}, 0, 0, VE, .unit = "tune_content" },
1984 #endif
1985 #endif
1986 #if VPX_ENCODER_ABI_VERSION >= 14
1987  { "corpus-complexity", "corpus vbr complexity midpoint", OFFSET(corpus_complexity), AV_OPT_TYPE_INT, {.i64 = -1}, -1, 10000, VE },
1988 #endif
1989 #ifdef VPX_CTRL_VP9E_SET_TPL
1990  { "enable-tpl", "Enable temporal dependency model", OFFSET(tpl_model), AV_OPT_TYPE_BOOL, {.i64 = -1}, -1, 1, VE },
1991 #endif
1992 #ifdef VPX_CTRL_VP9E_SET_MIN_GF_INTERVAL
1993  { "min-gf-interval", "Minimum golden/alternate reference frame interval", OFFSET(min_gf_interval), AV_OPT_TYPE_INT, {.i64 = -1}, -1, INT_MAX, VE },
1994 #endif
1996  { NULL }
1997 };
1998 #endif
1999 
2000 #undef COMMON_OPTIONS
2001 #undef LEGACY_OPTIONS
2002 
2003 static const FFCodecDefault defaults[] = {
2004  { "b", "0" },
2005  { "qmin", "-1" },
2006  { "qmax", "-1" },
2007  { "g", "-1" },
2008  { "keyint_min", "-1" },
2009  { NULL },
2010 };
2011 
2012 #if CONFIG_LIBVPX_VP8_ENCODER
2013 static av_cold int vp8_init(AVCodecContext *avctx)
2014 {
2015  return vpx_init(avctx, vpx_codec_vp8_cx());
2016 }
2017 
2018 static const AVClass class_vp8 = {
2019  .class_name = "libvpx-vp8 encoder",
2020  .item_name = av_default_item_name,
2021  .option = vp8_options,
2022  .version = LIBAVUTIL_VERSION_INT,
2023 };
2024 
2026  .p.name = "libvpx",
2027  CODEC_LONG_NAME("libvpx VP8"),
2028  .p.type = AVMEDIA_TYPE_VIDEO,
2029  .p.id = AV_CODEC_ID_VP8,
2030  .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_DELAY |
2033  .priv_data_size = sizeof(VPxContext),
2034  .init = vp8_init,
2036  .close = vpx_free,
2037  .caps_internal = FF_CODEC_CAP_NOT_INIT_THREADSAFE |
2041  .color_ranges = AVCOL_RANGE_MPEG | AVCOL_RANGE_JPEG,
2042  .p.priv_class = &class_vp8,
2043  .defaults = defaults,
2044  .p.wrapper_name = "libvpx",
2045 };
2046 #endif /* CONFIG_LIBVPX_VP8_ENCODER */
2047 
2048 #if CONFIG_LIBVPX_VP9_ENCODER
2049 static av_cold int vp9_init(AVCodecContext *avctx)
2050 {
2051  return vpx_init(avctx, vpx_codec_vp9_cx());
2052 }
2053 
2054 static const enum AVPixelFormat vp9_pix_fmts_highcol[] = {
2062 };
2063 
2064 static const enum AVPixelFormat vp9_pix_fmts_highbd[] = {
2082 };
2083 
2084 static int vp9_get_supported_config(const AVCodecContext *avctx,
2085  const AVCodec *codec,
2086  enum AVCodecConfig config,
2087  unsigned flags, const void **out,
2088  int *out_num)
2089 {
2091  vpx_codec_caps_t codec_caps = vpx_codec_get_caps(vpx_codec_vp9_cx());
2092  if (codec_caps & VPX_CODEC_CAP_HIGHBITDEPTH) {
2093  *out = vp9_pix_fmts_highbd;
2094  *out_num = FF_ARRAY_ELEMS(vp9_pix_fmts_highbd) - 1;
2095  } else {
2096  *out = vp9_pix_fmts_highcol;
2097  *out_num = FF_ARRAY_ELEMS(vp9_pix_fmts_highcol) - 1;
2098  }
2099  return 0;
2100  }
2101 
2102  return ff_default_get_supported_config(avctx, codec, config, flags, out, out_num);
2103 }
2104 
2105 static const AVClass class_vp9 = {
2106  .class_name = "libvpx-vp9 encoder",
2107  .item_name = av_default_item_name,
2108  .option = vp9_options,
2109  .version = LIBAVUTIL_VERSION_INT,
2110 };
2111 
2113  .p.name = "libvpx-vp9",
2114  CODEC_LONG_NAME("libvpx VP9"),
2115  .p.type = AVMEDIA_TYPE_VIDEO,
2116  .p.id = AV_CODEC_ID_VP9,
2117  .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_DELAY |
2120  .p.profiles = NULL_IF_CONFIG_SMALL(ff_vp9_profiles),
2121  .p.priv_class = &class_vp9,
2122  .p.wrapper_name = "libvpx",
2123  .priv_data_size = sizeof(VPxContext),
2124  .init = vp9_init,
2125  .color_ranges = AVCOL_RANGE_MPEG | AVCOL_RANGE_JPEG,
2127  .close = vpx_free,
2128  .caps_internal = FF_CODEC_CAP_NOT_INIT_THREADSAFE |
2131  .defaults = defaults,
2132  .get_supported_config = vp9_get_supported_config,
2133 };
2134 #endif /* CONFIG_LIBVPX_VP9_ENCODER */
error
static void error(const char *err)
Definition: target_bsf_fuzzer.c:32
flags
const SwsFlags flags[]
Definition: swscale.c:61
av_packet_unref
void av_packet_unref(AVPacket *pkt)
Wipe the packet.
Definition: packet.c:432
av_fifo_drain2
void av_fifo_drain2(AVFifo *f, size_t size)
Discard the specified amount of data from an AVFifo.
Definition: fifo.c:266
CODEC_PIXFMTS
#define CODEC_PIXFMTS(...)
Definition: codec_internal.h:392
AVCodec
AVCodec.
Definition: codec.h:172
AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:216
AVPixelFormat
AVPixelFormat
Pixel format.
Definition: pixfmt.h:71
level
uint8_t level
Definition: svq3.c:208
FrameListData::pts
int64_t pts
time stamp to show frame (in timebase units)
Definition: libaomenc.c:61
av_clip
#define av_clip
Definition: common.h:100
FF_CODEC_CAP_INIT_CLEANUP
#define FF_CODEC_CAP_INIT_CLEANUP
The codec allows calling the close function for deallocation even if the init function returned a fai...
Definition: codec_internal.h:42
AVCodecContext::keyint_min
int keyint_min
minimum GOP size
Definition: avcodec.h:998
vp9_init
static av_cold int vp9_init(AVFormatContext *ctx, int st_index, PayloadContext *data)
Definition: rtpdec_vp9.c:34
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
set_color_range
static void set_color_range(AVCodecContext *avctx)
Definition: libaomenc.c:546
VPxEncoderContext::screen_content_mode
int screen_content_mode
Definition: libvpxenc.c:124
AVCodecContext::colorspace
enum AVColorSpace colorspace
YUV colorspace type.
Definition: avcodec.h:659
FrameData
Definition: ffmpeg.h:713
out
FILE * out
Definition: movenc.c:55
av_frame_get_side_data
AVFrameSideData * av_frame_get_side_data(const AVFrame *frame, enum AVFrameSideDataType type)
Definition: frame.c:659
AVCodecContext::rc_min_rate
int64_t rc_min_rate
minimum bitrate
Definition: avcodec.h:1277
vp8_ts_parse_int_array
static void vp8_ts_parse_int_array(int *dest, char *value, size_t value_len, int max_entries)
Definition: libvpxenc.c:530
frame_data_uninit
static void frame_data_uninit(FrameData *fd)
Definition: libvpxenc.c:341
av_pix_fmt_desc_get
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:3456
AVBufferRef::data
uint8_t * data
The data buffer.
Definition: buffer.h:90
VPxEncoderContext::rawimg_alpha
struct vpx_image rawimg_alpha
Definition: libvpxenc.c:84
AVPictureType
AVPictureType
Definition: avutil.h:276
int64_t
long long int64_t
Definition: coverity.c:34
ff_libvpx_vp9_encoder
FFCodec ff_libvpx_vp9_encoder
VPxEncoderContext
Definition: libvpxenc.c:79
VPxEncoderContext::is_alpha
uint8_t is_alpha
Definition: libvpxenc.c:85
av_fifo_peek
int av_fifo_peek(const AVFifo *f, void *buf, size_t nb_elems, size_t offset)
Read data from a FIFO without modifying FIFO state.
Definition: fifo.c:255
VPxEncoderContext::rawimg
struct vpx_image rawimg
Definition: libvpxenc.c:82
AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:427
pixdesc.h
AVFrameSideData::buf
AVBufferRef * buf
Definition: frame.h:287
AVCodecContext::color_trc
enum AVColorTransferCharacteristic color_trc
Color Transfer Characteristic.
Definition: avcodec.h:652
AVCOL_RANGE_JPEG
@ AVCOL_RANGE_JPEG
Full range content.
Definition: pixfmt.h:777
AVPacket::data
uint8_t * data
Definition: packet.h:588
VP8F_ERROR_RESILIENT
#define VP8F_ERROR_RESILIENT
Enable measures appropriate for streaming over lossy links.
Definition: libvpxenc.c:100
AVOption
AVOption.
Definition: opt.h:429
encode.h
set_pix_fmt
static int set_pix_fmt(AVCodecContext *avctx, struct aom_image *img)
Definition: libaomdec.c:68
data
const char data[16]
Definition: mxf.c:149
AV_PIX_FMT_YUV420P10
#define AV_PIX_FMT_YUV420P10
Definition: pixfmt.h:539
FF_CODEC_CAP_NOT_INIT_THREADSAFE
#define FF_CODEC_CAP_NOT_INIT_THREADSAFE
The codec is not known to be init-threadsafe (i.e.
Definition: codec_internal.h:34
FFCodec
Definition: codec_internal.h:127
AV_LOG_VERBOSE
#define AV_LOG_VERBOSE
Detailed information.
Definition: log.h:226
AVCOL_SPC_RGB
@ AVCOL_SPC_RGB
order of coefficients is actually GBR, also IEC 61966-2-1 (sRGB), YZX and ST 428-1
Definition: pixfmt.h:701
VP8F_AUTO_ALT_REF
#define VP8F_AUTO_ALT_REF
Enable automatic alternate reference frame generation.
Definition: libvpxenc.c:101
AVPacket::duration
int64_t duration
Duration of this packet in AVStream->time_base units, 0 if unknown.
Definition: packet.h:606
VPxEncoderContext::have_sse
int have_sse
true if we have pending sse[]
Definition: libvpxenc.c:90
AV_PIX_FMT_YUV440P
@ AV_PIX_FMT_YUV440P
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
Definition: pixfmt.h:106
mathematics.h
AVDictionary
Definition: dict.c:32
AV_CODEC_FLAG_PSNR
#define AV_CODEC_FLAG_PSNR
error[?] variables will be set during encoding.
Definition: avcodec.h:306
av_buffer_ref
AVBufferRef * av_buffer_ref(const AVBufferRef *buf)
Create a new reference to an AVBuffer.
Definition: buffer.c:103
AV_CODEC_CONFIG_PIX_FORMAT
@ AV_CODEC_CONFIG_PIX_FORMAT
AVPixelFormat, terminated by AV_PIX_FMT_NONE.
Definition: avcodec.h:2531
VPxEncoderContext::fifo
AVFifo * fifo
Definition: libvpxenc.c:143
VPxEncoderContext::level
float level
Definition: libvpxenc.c:135
AVCodecContext::qmax
int qmax
maximum quantizer
Definition: avcodec.h:1241
VPxEncoderContext::aq_mode
int aq_mode
Definition: libvpxenc.c:131
tf_sess_config.config
config
Definition: tf_sess_config.py:33
AV_PKT_FLAG_KEY
#define AV_PKT_FLAG_KEY
The packet contains a keyframe.
Definition: packet.h:643
quality
trying all byte sequences megabyte in length and selecting the best looking sequence will yield cases to try But a word about quality
Definition: rate_distortion.txt:12
AV_WB64
#define AV_WB64(p, v)
Definition: intreadwrite.h:429
av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:31
VPxEncoderContext::encoder_alpha
struct vpx_codec_ctx encoder_alpha
Definition: libvpxenc.c:83
AVCodecContext::framerate
AVRational framerate
Definition: avcodec.h:551
AVCOL_SPC_BT470BG
@ AVCOL_SPC_BT470BG
also ITU-R BT601-6 625 / ITU-R BT1358 625 / ITU-R BT1700 625 PAL & SECAM / IEC 61966-2-4 xvYCC601
Definition: pixfmt.h:706
VPxEncoderContext::auto_alt_ref
int auto_alt_ref
Definition: libvpxenc.c:103
AVCOL_SPC_RESERVED
@ AVCOL_SPC_RESERVED
reserved for future use by ITU-T and ISO/IEC just like 15-255 are
Definition: pixfmt.h:704
FrameListData::flags
uint32_t flags
flags for this frame
Definition: libaomenc.c:65
VPxEncoderContext::coded_frame_list
struct FrameListData * coded_frame_list
Definition: libvpxenc.c:91
AV_CODEC_FLAG_COPY_OPAQUE
#define AV_CODEC_FLAG_COPY_OPAQUE
Definition: avcodec.h:279
fifo.h
FFCodecDefault
Definition: codec_internal.h:96
FFCodec::p
AVCodec p
The public AVCodec.
Definition: codec_internal.h:131
VPxEncoderContext::deadline
int deadline
Definition: libvpxenc.c:88
AVPacket::opaque_ref
AVBufferRef * opaque_ref
AVBufferRef for free use by the API user.
Definition: packet.h:624
fail
#define fail()
Definition: checkasm.h:207
av_fifo_write
int av_fifo_write(AVFifo *f, const void *buf, size_t nb_elems)
Write data into a FIFO.
Definition: fifo.c:188
AVCodecContext::thread_count
int thread_count
thread count is used to decide how many independent tasks should be passed to execute()
Definition: avcodec.h:1561
AV_PIX_FMT_GBRP10
#define AV_PIX_FMT_GBRP10
Definition: pixfmt.h:558
VPxEncoderContext::drop_threshold
int drop_threshold
Definition: libvpxenc.c:132
set_vp8_defaults
static void set_vp8_defaults(AVCodecContext *avctx, struct vpx_codec_enc_cfg *enccfg)
Set the target bitrate to VPX library default.
Definition: libvpxenc.c:905
VPxEncoderContext::roi_warned
int roi_warned
If the driver does not support ROI then warn the first time we encounter a frame with ROI side data.
Definition: libvpxenc.c:148
AVCodecContext::flags
int flags
AV_CODEC_FLAG_*.
Definition: avcodec.h:488
codecctl_int
static av_cold int codecctl_int(AVCodecContext *avctx, enum vp8e_enc_control_id id, int val)
Definition: libvpxenc.c:434
realloc_alpha_uv
static int realloc_alpha_uv(AVCodecContext *avctx, int width, int height)
Definition: libvpxenc.c:1654
val
static double val(void *priv, double ch)
Definition: aeval.c:77
vpx_ts_param_parse
static int vpx_ts_param_parse(VPxContext *ctx, struct vpx_codec_enc_cfg *enccfg, char *key, char *value, enum AVCodecID codec_id)
Definition: libvpxenc.c:660
VPxEncoderContext::max_intra_rate
int max_intra_rate
Definition: libvpxenc.c:115
ff_encode_add_stats_side_data
int ff_encode_add_stats_side_data(AVPacket *pkt, int quality, const int64_t error[], int error_count, enum AVPictureType pict_type)
Definition: encode.c:918
FF_CODEC_ENCODE_CB
#define FF_CODEC_ENCODE_CB(func)
Definition: codec_internal.h:359
AVRational::num
int num
Numerator.
Definition: rational.h:59
LEGACY_OPTIONS
#define LEGACY_OPTIONS
Definition: libvpxenc.c:1924
AV_PIX_FMT_YUV444P10
#define AV_PIX_FMT_YUV444P10
Definition: pixfmt.h:542
vpx_encode
static int vpx_encode(AVCodecContext *avctx, AVPacket *pkt, const AVFrame *frame, int *got_packet)
Definition: libvpxenc.c:1682
avassert.h
lrint
#define lrint
Definition: tablegen.h:53
pkt
AVPacket * pkt
Definition: movenc.c:60
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:210
AVFrameSideData::size
size_t size
Definition: frame.h:285
FF_ARRAY_ELEMS
#define FF_ARRAY_ELEMS(a)
Definition: sinewin_tablegen.c:29
av_cold
#define av_cold
Definition: attributes.h:106
AVRegionOfInterest
Structure describing a single Region Of Interest.
Definition: frame.h:353
AV_PROFILE_UNKNOWN
#define AV_PROFILE_UNKNOWN
Definition: defs.h:65
av_fifo_read
int av_fifo_read(AVFifo *f, void *buf, size_t nb_elems)
Read data from a FIFO.
Definition: fifo.c:240
AVCodecContext::rc_initial_buffer_occupancy
int rc_initial_buffer_occupancy
Number of bits which should be loaded into the rc buffer before decoding starts.
Definition: avcodec.h:1298
duration
int64_t duration
Definition: movenc.c:65
av_dict_get
AVDictionaryEntry * av_dict_get(const AVDictionary *m, const char *key, const AVDictionaryEntry *prev, int flags)
Get a dictionary entry with matching key.
Definition: dict.c:60
av_fast_realloc
void * av_fast_realloc(void *ptr, unsigned int *size, size_t min_size)
Reallocate the given buffer if it is not large enough, otherwise do nothing.
Definition: mem.c:497
intreadwrite.h
AVCodecContext::stats_in
char * stats_in
pass2 encoding statistics input buffer Concatenated stuff from stats_out of pass1 should be placed he...
Definition: avcodec.h:1320
AV_PIX_FMT_YUVA420P
@ AV_PIX_FMT_YUVA420P
planar YUV 4:2:0, 20bpp, (1 Cr & Cb sample per 2x2 Y & A samples)
Definition: pixfmt.h:108
COMMON_OPTIONS
#define COMMON_OPTIONS
Definition: libvpxenc.c:1893
AVRegionOfInterest::bottom
int bottom
Definition: frame.h:369
AVFormatContext::flags
int flags
Flags modifying the (de)muxer behaviour.
Definition: avformat.h:1415
vpx_init
static av_cold int vpx_init(AVCodecContext *avctx, const struct vpx_codec_iface *iface)
Definition: libvpxenc.c:962
AVCOL_SPC_SMPTE170M
@ AVCOL_SPC_SMPTE170M
also ITU-R BT601-6 525 / ITU-R BT1358 525 / ITU-R BT1700 NTSC / functionally identical to above
Definition: pixfmt.h:707
log_encoder_error
static av_cold void log_encoder_error(AVCodecContext *avctx, const char *desc)
Definition: libvpxenc.c:205
AVDictionaryEntry::key
char * key
Definition: dict.h:91
AV_CODEC_ID_VP9
@ AV_CODEC_ID_VP9
Definition: codec_id.h:222
AV_CODEC_CAP_OTHER_THREADS
#define AV_CODEC_CAP_OTHER_THREADS
Codec supports multithreading through a method other than slice- or frame-level multithreading.
Definition: codec.h:109
av_strtok
char * av_strtok(char *s, const char *delim, char **saveptr)
Split the string into several tokens which can be accessed by successive calls to av_strtok().
Definition: avstring.c:179
VPxEncoderContext::row_mt
int row_mt
Definition: libvpxenc.c:136
FrameListData::sse
uint64_t sse[4]
Definition: libaomenc.c:66
AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE
#define AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE
This encoder can reorder user opaque values from input AVFrames and return them with corresponding ou...
Definition: codec.h:144
VPxEncoderContext::lag_in_frames
int lag_in_frames
Definition: libvpxenc.c:111
tile_rows
int tile_rows
Definition: h265_levels.c:217
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:41
AV_LOG_DEBUG
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
Definition: log.h:231
VPxEncoderContext::arnr_type
int arnr_type
Definition: libvpxenc.c:107
ctx
AVFormatContext * ctx
Definition: movenc.c:49
MAX_DELTA_Q
#define MAX_DELTA_Q
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:142
VPxEncoderContext::static_thresh
int static_thresh
Definition: libvpxenc.c:114
codec_id
enum AVCodecID codec_id
Definition: vaapi_decode.c:410
AV_PIX_FMT_YUV420P
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:73
VPxEncoderContext::rc_undershoot_pct
int rc_undershoot_pct
Definition: libvpxenc.c:116
AVCodecContext::rc_max_rate
int64_t rc_max_rate
maximum bitrate
Definition: avcodec.h:1270
AVCodecContext::error
uint64_t error[AV_NUM_DATA_POINTERS]
error
Definition: avcodec.h:1505
key
const char * key
Definition: hwcontext_opencl.c:189
MAX_VPX_THREADS
#define MAX_VPX_THREADS
Definition: libvpx.h:24
cx_pktcpy
static void cx_pktcpy(struct FrameListData *dst, const struct vpx_codec_cx_pkt *src, VPxContext *ctx)
Definition: libvpxenc.c:1290
VPxEncoderContext::current_temporal_idx
int current_temporal_idx
Definition: libvpxenc.c:121
AV_ROUND_NEAR_INF
@ AV_ROUND_NEAR_INF
Round to nearest and halfway cases away from zero.
Definition: mathematics.h:135
AVPacket::opaque
void * opaque
for some private data of the user
Definition: packet.h:613
AVCPBProperties
This structure describes the bitrate properties of an encoded bitstream.
Definition: defs.h:282
CODEC_LONG_NAME
#define CODEC_LONG_NAME(str)
Definition: codec_internal.h:332
tmp
static uint8_t tmp[40]
Definition: aes_ctr.c:52
AVCodecContext::codec_id
enum AVCodecID codec_id
Definition: avcodec.h:441
if
if(ret)
Definition: filter_design.txt:179
set_vpx_defaults
static void set_vpx_defaults(AVCodecContext *avctx, struct vpx_codec_enc_cfg *enccfg)
Called when the bitrate is not set.
Definition: libvpxenc.c:949
AVCodecContext::rc_buffer_size
int rc_buffer_size
decoder bitstream buffer size
Definition: avcodec.h:1255
VPxEncoderContext::ts_layer_flags
int * ts_layer_flags
Definition: libvpxenc.c:120
LIBAVUTIL_VERSION_INT
#define LIBAVUTIL_VERSION_INT
Definition: version.h:85
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:76
NULL
#define NULL
Definition: coverity.c:32
AVCodecContext::color_range
enum AVColorRange color_range
MPEG vs JPEG YUV range.
Definition: avcodec.h:669
av_buffer_unref
void av_buffer_unref(AVBufferRef **buf)
Free a given reference and automatically free the buffer if there are no more references to it.
Definition: buffer.c:139
IS_VP9
#define IS_VP9(avctx)
Definition: libvpxenc.c:51
frame_data_apply
static int frame_data_apply(AVCodecContext *avctx, AVFifo *fifo, AVPacket *pkt)
Definition: libvpxenc.c:395
VPxEncoderContext::twopass_stats
struct vpx_fixed_buf twopass_stats
Definition: libvpxenc.c:86
vpx_free
static av_cold int vpx_free(AVCodecContext *avctx)
Definition: libvpxenc.c:500
AVCodecContext::bit_rate
int64_t bit_rate
the average bitrate
Definition: avcodec.h:481
FrameData::duration
int64_t duration
Definition: librav1e.c:60
AVRegionOfInterest::self_size
uint32_t self_size
Must be set to the size of this data structure (that is, sizeof(AVRegionOfInterest)).
Definition: frame.h:358
av_default_item_name
const char * av_default_item_name(void *ptr)
Return the context name.
Definition: log.c:241
AV_PICTURE_TYPE_I
@ AV_PICTURE_TYPE_I
Intra.
Definition: avutil.h:278
profiles.h
AV_PIX_FMT_YUV440P10
#define AV_PIX_FMT_YUV440P10
Definition: pixfmt.h:541
list
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining list
Definition: filter_design.txt:25
VPxEncoderContext::noise_sensitivity
int noise_sensitivity
Definition: libvpxenc.c:133
FrameData::frame_opaque
void * frame_opaque
Definition: librav1e.c:62
FrameListData::buf
void * buf
compressed data buffer
Definition: libaomenc.c:59
VPxEncoderContext::crf
int crf
Definition: libvpxenc.c:113
VPxEncoderContext::tpl_model
int tpl_model
Definition: libvpxenc.c:139
AV_PIX_FMT_YUV422P10
#define AV_PIX_FMT_YUV422P10
Definition: pixfmt.h:540
av_base64_decode
int av_base64_decode(uint8_t *out, const char *in_str, int out_size)
Decode a base64-encoded string.
Definition: base64.c:81
VPxEncoderContext::encoder
struct vpx_codec_ctx encoder
Definition: libvpxenc.c:81
VPxEncoderContext::flags
int flags
VP8 specific flags, see VP8F_* below.
Definition: libvpxenc.c:99
base64.h
stats
static void stats(AVPacket *const *in, int n_in, unsigned *_max, unsigned *_sum)
Definition: vp9_superframe.c:34
AVCOL_RANGE_UNSPECIFIED
@ AVCOL_RANGE_UNSPECIFIED
Definition: pixfmt.h:743
free_frame_list
static av_cold void free_frame_list(struct FrameListData *list)
Definition: libvpxenc.c:330
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:49
vp8_encode_set_roi
static int vp8_encode_set_roi(AVCodecContext *avctx, int frame_width, int frame_height, const AVFrameSideData *sd)
Definition: libvpxenc.c:1632
av_cpu_count
int av_cpu_count(void)
Definition: cpu.c:221
AVCodecContext::qcompress
float qcompress
amount of qscale change between easy & hard scenes (0.0-1.0)
Definition: avcodec.h:1226
AVCodecContext::time_base
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented.
Definition: avcodec.h:535
AVCOL_TRC_SMPTE2084
@ AVCOL_TRC_SMPTE2084
SMPTE ST 2084 for 10-, 12-, 14- and 16-bit systems.
Definition: pixfmt.h:683
av_rescale_rnd
int64_t av_rescale_rnd(int64_t a, int64_t b, int64_t c, enum AVRounding rnd)
Rescale a 64-bit integer with specified rounding.
Definition: mathematics.c:58
FrameListData::next
struct FrameListData * next
Definition: libaomenc.c:69
AVCodecContext::stats_out
char * stats_out
pass1 encoding statistics output buffer
Definition: avcodec.h:1312
VPxEncoderContext::rc_overshoot_pct
int rc_overshoot_pct
Definition: libvpxenc.c:117
init
int(* init)(AVBSFContext *ctx)
Definition: dts2pts.c:550
AV_CODEC_CAP_DR1
#define AV_CODEC_CAP_DR1
Codec uses get_buffer() or get_encode_buffer() for allocating buffers and supports custom allocators.
Definition: codec.h:52
AVPacket::size
int size
Definition: packet.h:589
AVFifo
Definition: fifo.c:35
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:94
AVCodecContext::gop_size
int gop_size
the number of pictures in a group of pictures, or 0 for intra_only
Definition: avcodec.h:1005
height
#define height
Definition: dsp.h:89
codec_internal.h
dst
uint8_t ptrdiff_t const uint8_t ptrdiff_t int intptr_t intptr_t int int16_t * dst
Definition: dsp.h:87
AV_PKT_DATA_DYNAMIC_HDR10_PLUS
@ AV_PKT_DATA_DYNAMIC_HDR10_PLUS
HDR10+ dynamic metadata associated with a video frame.
Definition: packet.h:296
cpu.h
FrameData::hdr10_plus
AVBufferRef * hdr10_plus
Definition: libvpxenc.c:76
fifo_free
static av_cold void fifo_free(AVFifo **fifo)
Definition: libvpxenc.c:347
AV_PIX_FMT_YUV422P12
#define AV_PIX_FMT_YUV422P12
Definition: pixfmt.h:544
size
int size
Definition: twinvq_data.h:10344
VPxEncoderContext::lossless
int lossless
Definition: libvpxenc.c:127
av_reallocp
int av_reallocp(void *ptr, size_t size)
Allocate, reallocate, or free a block of memory through a pointer to a pointer.
Definition: mem.c:188
AV_PIX_FMT_YUV444P12
#define AV_PIX_FMT_YUV444P12
Definition: pixfmt.h:546
AVFrameSideData::data
uint8_t * data
Definition: frame.h:284
VPxEncoderContext::tune_content
int tune_content
Definition: libvpxenc.c:137
VPxEncoderContext::corpus_complexity
int corpus_complexity
Definition: libvpxenc.c:138
VPxEncoderContext::tile_rows
int tile_rows
Definition: libvpxenc.c:129
AVCPBProperties::min_bitrate
int64_t min_bitrate
Minimum bitrate of the stream, in bits per second.
Definition: defs.h:292
FrameListData
Portion of struct vpx_codec_cx_pkt from vpx_encoder.h.
Definition: libaomenc.c:58
VPxEncoderContext::sharpness
int sharpness
Definition: libvpxenc.c:95
vp9_encode_set_roi
static int vp9_encode_set_roi(AVCodecContext *avctx, int frame_width, int frame_height, const AVFrameSideData *sd)
Definition: libvpxenc.c:1582
AVPacket::dts
int64_t dts
Decompression timestamp in AVStream->time_base units; the time at which the packet is decompressed.
Definition: packet.h:587
AV_CODEC_FLAG_PASS2
#define AV_CODEC_FLAG_PASS2
Use internal 2pass ratecontrol in second pass mode.
Definition: avcodec.h:294
FrameData::pts
int64_t pts
Definition: ffmpeg.h:722
AVPacket::flags
int flags
A combination of AV_PKT_FLAG values.
Definition: packet.h:594
FrameData::frame_opaque_ref
AVBufferRef * frame_opaque_ref
Definition: librav1e.c:63
AVCPBProperties::avg_bitrate
int64_t avg_bitrate
Average bitrate of the stream, in bits per second.
Definition: defs.h:297
version
version
Definition: libkvazaar.c:313
AVRegionOfInterest::right
int right
Definition: frame.h:371
VPxEncoderContext::tune
int tune
Definition: libvpxenc.c:109
AVBufferRef::size
size_t size
Size of data in bytes.
Definition: buffer.h:94
AV_LOG_INFO
#define AV_LOG_INFO
Standard information.
Definition: log.h:221
AV_OPT_TYPE_FLOAT
@ AV_OPT_TYPE_FLOAT
Underlying C type is float.
Definition: opt.h:271
AVCOL_SPC_SMPTE240M
@ AVCOL_SPC_SMPTE240M
derived from 170M primaries and D65 white point, 170M is derived from BT470 System M's primaries
Definition: pixfmt.h:708
frame_data_submit
static int frame_data_submit(AVCodecContext *avctx, AVFifo *fifo, const AVFrame *frame)
Definition: libvpxenc.c:355
VPxEncoderContext::twopass_stats_size
unsigned twopass_stats_size
Definition: libvpxenc.c:87
AVRegionOfInterest::left
int left
Definition: frame.h:370
AV_BASE64_SIZE
#define AV_BASE64_SIZE(x)
Calculate the output size needed to base64-encode x bytes to a null-terminated string.
Definition: base64.h:66
VPxEncoderContext::vpx_ts_parameters
AVDictionary * vpx_ts_parameters
Definition: libvpxenc.c:119
VPxEncoderContext::tile_columns
int tile_columns
Definition: libvpxenc.c:128
ff_default_get_supported_config
int ff_default_get_supported_config(const AVCodecContext *avctx, const AVCodec *codec, enum AVCodecConfig config, unsigned flags, const void **out_configs, int *out_num_configs)
Definition: avcodec.c:759
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:256
AVPacket::pts
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will b...
Definition: packet.h:581
AVCOL_SPC_BT2020_NCL
@ AVCOL_SPC_BT2020_NCL
ITU-R BT2020 non-constant luminance system.
Definition: pixfmt.h:711
AVRegionOfInterest::top
int top
Distance in pixels from the top edge of the frame to the top and bottom edges and from the left edge ...
Definition: frame.h:368
internal.h
AV_PIX_FMT_GBRP12
#define AV_PIX_FMT_GBRP12
Definition: pixfmt.h:559
av_malloc_array
#define av_malloc_array(a, b)
Definition: tableprint_vlc.h:32
common.h
AVCPBProperties::max_bitrate
int64_t max_bitrate
Maximum bitrate of the stream, in bits per second.
Definition: defs.h:287
value
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf default value
Definition: writing_filters.txt:86
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
AVCodec::name
const char * name
Name of the codec implementation.
Definition: codec.h:179
av_inv_q
static av_always_inline AVRational av_inv_q(AVRational q)
Invert a rational.
Definition: rational.h:159
av_buffer_replace
int av_buffer_replace(AVBufferRef **pdst, const AVBufferRef *src)
Ensure dst refers to the same data as src.
Definition: buffer.c:233
AVCOL_SPC_UNSPECIFIED
@ AVCOL_SPC_UNSPECIFIED
Definition: pixfmt.h:703
AVCodecContext::height
int height
Definition: avcodec.h:592
AVCodecContext::pix_fmt
enum AVPixelFormat pix_fmt
Pixel format, see AV_PIX_FMT_xxx.
Definition: avcodec.h:631
AVCOL_RANGE_MPEG
@ AVCOL_RANGE_MPEG
Narrow or limited range content.
Definition: pixfmt.h:760
av_calloc
void * av_calloc(size_t nmemb, size_t size)
Definition: mem.c:264
defaults
static const FFCodecDefault defaults[]
Definition: libvpxenc.c:2003
avcodec.h
delta_q
#define delta_q(name)
Definition: cbs_av1.c:657
AV_PKT_DATA_MATROSKA_BLOCKADDITIONAL
@ AV_PKT_DATA_MATROSKA_BLOCKADDITIONAL
Data found in BlockAdditional element of matroska container.
Definition: packet.h:188
ret
ret
Definition: filter_design.txt:187
AVClass::class_name
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
Definition: log.h:81
frame
these buffered frames must be flushed immediately if a new input produces new the filter must not call request_frame to get more It must just process the frame or queue it The task of requesting more frames is left to the filter s request_frame method or the application If a filter has several the filter must be ready for frames arriving randomly on any input any filter with several inputs will most likely require some kind of queuing mechanism It is perfectly acceptable to have a limited queue and to drop frames when the inputs are too unbalanced request_frame For filters that do not use the this method is called when a frame is wanted on an output For a it should directly call filter_frame on the corresponding output For a if there are queued frames already one of these frames should be pushed If the filter should request a frame on one of its repeatedly until at least one frame has been pushed Return or at least make progress towards producing a frame
Definition: filter_design.txt:265
AVCPBProperties::buffer_size
int64_t buffer_size
The size of the buffer to which the ratecontrol is applied, in bits.
Definition: defs.h:303
VPxEncoderContext::cpu_used
int cpu_used
Definition: libvpxenc.c:94
VPxEncoderContext::alpha_coded_frame_list
struct FrameListData * alpha_coded_frame_list
Definition: libvpxenc.c:92
av_fifo_alloc2
AVFifo * av_fifo_alloc2(size_t nb_elems, size_t elem_size, unsigned int flags)
Allocate and initialize an AVFifo with a given element size.
Definition: fifo.c:47
AV_PIX_FMT_YUV420P12
#define AV_PIX_FMT_YUV420P12
Definition: pixfmt.h:543
SIZE_SPECIFIER
#define SIZE_SPECIFIER
Definition: internal.h:119
AV_FRAME_DATA_DYNAMIC_HDR_PLUS
@ AV_FRAME_DATA_DYNAMIC_HDR_PLUS
HDR dynamic metadata associated with a video frame.
Definition: frame.h:159
AVCodecContext
main external API structure.
Definition: avcodec.h:431
av_packet_new_side_data
uint8_t * av_packet_new_side_data(AVPacket *pkt, enum AVPacketSideDataType type, size_t size)
Allocate new information of a packet.
Definition: packet.c:231
ff_get_encode_buffer
int ff_get_encode_buffer(AVCodecContext *avctx, AVPacket *avpkt, int64_t size, int flags)
Get a buffer for a packet.
Definition: encode.c:105
AVCodecContext::qmin
int qmin
minimum quantizer
Definition: avcodec.h:1234
AVRational::den
int den
Denominator.
Definition: rational.h:60
storeframe
static int storeframe(AVCodecContext *avctx, struct FrameListData *cx_frame, struct FrameListData *alpha_cx_frame, AVPacket *pkt)
Store coded frame information in format suitable for return from encode2().
Definition: libvpxenc.c:1320
AV_PIX_FMT_NONE
@ AV_PIX_FMT_NONE
Definition: pixfmt.h:72
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Underlying C type is int.
Definition: opt.h:259
AVCodecContext::profile
int profile
profile
Definition: avcodec.h:1618
av_get_token
char * av_get_token(const char **buf, const char *term)
Unescape the given string until a non escaped terminating char, and return the token corresponding to...
Definition: avstring.c:143
ctlidstr
static const char *const ctlidstr[]
String mappings for enum vp8e_enc_control_id.
Definition: libvpxenc.c:155
av_base64_encode
char * av_base64_encode(char *out, int out_size, const uint8_t *in, int in_size)
Encode data to base64 and null-terminate.
Definition: base64.c:147
AV_CODEC_CAP_DELAY
#define AV_CODEC_CAP_DELAY
Encoder or decoder requires flushing with NULL input at the end in order to give the complete and cor...
Definition: codec.h:76
Windows::Graphics::DirectX::Direct3D11::p
IDirect3DDxgiInterfaceAccess _COM_Outptr_ void ** p
Definition: vsrc_gfxcapture_winrt.hpp:53
VPxEncoderContext::frame_parallel
int frame_parallel
Definition: libvpxenc.c:130
ff_libvpx_vp8_encoder
const FFCodec ff_libvpx_vp8_encoder
AV_PIX_FMT_YUV444P
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:78
VPxEncoderContext::error_resilient
int error_resilient
Definition: libvpxenc.c:112
AV_PIX_FMT_GBRP
@ AV_PIX_FMT_GBRP
planar GBR 4:4:4 24bpp
Definition: pixfmt.h:165
OFFSET
#define OFFSET(x)
Definition: libvpxenc.c:1890
desc
const char * desc
Definition: libsvtav1.c:78
AV_PICTURE_TYPE_P
@ AV_PICTURE_TYPE_P
Predicted.
Definition: avutil.h:279
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:200
coded_frame_add
static void coded_frame_add(void *list, struct FrameListData *cx_frame)
Definition: libvpxenc.c:314
AV_PIX_FMT_YUV422P
@ AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Definition: pixfmt.h:77
mem.h
AVBufferRef
A reference to a data buffer.
Definition: buffer.h:82
FF_CODEC_CAP_AUTO_THREADS
#define FF_CODEC_CAP_AUTO_THREADS
Codec handles avctx->thread_count == 0 (auto) internally.
Definition: codec_internal.h:72
AVFrameSideData
Structure to hold side data for an AVFrame.
Definition: frame.h:282
AVPixFmtDescriptor
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
Definition: pixdesc.h:69
set_temporal_layer_pattern
static void set_temporal_layer_pattern(int layering_mode, vpx_codec_enc_cfg_t *cfg, int *layer_flags, int *flag_periodicity)
Definition: libvpxenc.c:556
dump_enc_cfg
static av_cold void dump_enc_cfg(AVCodecContext *avctx, const struct vpx_codec_enc_cfg *cfg, int level)
Definition: libvpxenc.c:216
AVDictionaryEntry
Definition: dict.h:90
VPxEncoderContext::arnr_max_frames
int arnr_max_frames
Definition: libvpxenc.c:105
AVCodecContext::slices
int slices
Number of slices.
Definition: avcodec.h:1021
AVPacket
This structure stores compressed data.
Definition: packet.h:565
AVCodecContext::priv_data
void * priv_data
Definition: avcodec.h:458
VPxEncoderContext::vpx_cs
int vpx_cs
Definition: libvpxenc.c:134
AV_OPT_TYPE_BOOL
@ AV_OPT_TYPE_BOOL
Underlying C type is int.
Definition: opt.h:327
av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:35
set_roi_map
static int set_roi_map(AVCodecContext *avctx, const AVFrameSideData *sd, int frame_width, int frame_height, vpx_roi_map_t *roi_map, int block_size, int segment_cnt)
Definition: libvpxenc.c:1475
queue_frames
static int queue_frames(AVCodecContext *avctx, struct vpx_codec_ctx *encoder, struct FrameListData **frame_list, AVPacket *pkt_out)
Queue multiple output frames from the encoder, returning the front-most.
Definition: libvpxenc.c:1380
AVCodecContext::width
int width
picture width / height.
Definition: avcodec.h:592
AV_FRAME_DATA_REGIONS_OF_INTEREST
@ AV_FRAME_DATA_REGIONS_OF_INTEREST
Regions Of Interest, the data is an array of AVRegionOfInterest type, the number of array element is ...
Definition: frame.h:165
AV_CODEC_ID_VP8
@ AV_CODEC_ID_VP8
Definition: codec_id.h:192
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
FrameListData::sz
size_t sz
length of compressed data
Definition: libaomenc.c:60
av_fifo_freep2
void av_fifo_freep2(AVFifo **f)
Free an AVFifo and reset pointer to NULL.
Definition: fifo.c:286
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
libvpx.h
AV_PIX_FMT_YUV440P12
#define AV_PIX_FMT_YUV440P12
Definition: pixfmt.h:545
free_coded_frame
static av_cold void free_coded_frame(struct FrameListData *cx_frame)
Definition: libvpxenc.c:324
VPxEncoderContext::arnr_strength
int arnr_strength
Definition: libvpxenc.c:106
vp8_init
static av_cold int vp8_init(AVFormatContext *s, int st_index, PayloadContext *vp8)
Definition: rtpdec_vp8.c:263
ff_encode_add_cpb_side_data
AVCPBProperties * ff_encode_add_cpb_side_data(AVCodecContext *avctx)
Add a CPB properties side data to an encoding context.
Definition: encode.c:887
stride
#define stride
Definition: h264pred_template.c:536
AVDictionaryEntry::value
char * value
Definition: dict.h:92
planes
static const struct @544 planes[]
avstring.h
width
#define width
Definition: dsp.h:89
FF_QP2LAMBDA
#define FF_QP2LAMBDA
factor to convert from H.263 QP to lambda
Definition: avutil.h:226
AVCOL_SPC_BT709
@ AVCOL_SPC_BT709
also ITU-R BT1361 / IEC 61966-2-4 xvYCC709 / derived in SMPTE RP 177 Annex B
Definition: pixfmt.h:702
VE
#define VE
Definition: libvpxenc.c:1891
AVRegionOfInterest::qoffset
AVRational qoffset
Quantisation offset.
Definition: frame.h:395
AV_OPT_TYPE_CONST
@ AV_OPT_TYPE_CONST
Special option type for declaring named constants.
Definition: opt.h:299
snprintf
#define snprintf
Definition: snprintf.h:34
av_log2
int av_log2(unsigned v)
Definition: intmath.c:26
VPxEncoderContext::sse
uint64_t sse[4]
Definition: libvpxenc.c:89
AVCodecConfig
AVCodecConfig
Definition: avcodec.h:2530
av_dict_iterate
const AVDictionaryEntry * av_dict_iterate(const AVDictionary *m, const AVDictionaryEntry *prev)
Iterate over a dictionary.
Definition: dict.c:42
skip
static void BS_FUNC() skip(BSCTX *bc, unsigned int n)
Skip n bits in the buffer.
Definition: bitstream_template.h:383
src
#define src
Definition: vp8dsp.c:248
AV_FIFO_FLAG_AUTO_GROW
#define AV_FIFO_FLAG_AUTO_GROW
Automatically resize the FIFO on writes, so that the data fits.
Definition: fifo.h:63
ff_vp9_profiles
const AVProfile ff_vp9_profiles[]
Definition: profiles.c:155
AV_CODEC_FLAG_PASS1
#define AV_CODEC_FLAG_PASS1
Use internal 2pass ratecontrol in first pass mode.
Definition: avcodec.h:290
VPxEncoderContext::min_gf_interval
int min_gf_interval
Definition: libvpxenc.c:140
FrameListData::have_sse
int have_sse
true if we have pending sse[]
Definition: libaomenc.c:67