Go to the documentation of this file.
   36 #define NUM_DATA_BUFS 13 
   56 #define OFFSET(x) offsetof(VIFContext, x) 
   69         0.00745626912, 0.0142655009, 0.0250313189, 0.0402820669, 0.0594526194,
 
   70         0.0804751068, 0.0999041125, 0.113746084, 0.118773937, 0.113746084,
 
   71         0.0999041125, 0.0804751068, 0.0594526194, 0.0402820669, 0.0250313189,
 
   72         0.0142655009, 0.00745626912
 
   75         0.0189780835, 0.0558981746, 0.120920904, 0.192116052, 0.224173605,
 
   76         0.192116052, 0.120920904, 0.0558981746, 0.0189780835
 
   79         0.054488685, 0.244201347, 0.402619958, 0.244201347, 0.054488685
 
   82         0.166378498, 0.667243004, 0.166378498
 
   98                      int src_stride, 
int dst_stride)
 
  100     const int dst_px_stride = dst_stride / 2;
 
  102     for (
int i = 0; 
i < 
h / 2; 
i++) {
 
  103         for (
int j = 0; j < 
w / 2; j++)
 
  104             dst[
i * dst_px_stride + j] = 
src[(
i * 2) * src_stride + (j * 2)];
 
  109                           const float *mu1_mu2, 
const float *xx_filt,
 
  110                           const float *yy_filt, 
const float *xy_filt,
 
  111                           float *num, 
float *den, 
int w, 
int h)
 
  113     static const float sigma_nsq = 2;
 
  114     float mu1_sq_val, mu2_sq_val, mu1_mu2_val, xx_filt_val, yy_filt_val, xy_filt_val;
 
  115     float sigma1_sq, sigma2_sq, sigma12, 
g, sv_sq, eps = 1.0e-10
f;
 
  116     float gain_limit = 100.f;
 
  117     float num_val, den_val;
 
  118     float accum_num = 0.0f;
 
  119     float accum_den = 0.0f;
 
  121     for (
int i = 0; 
i < 
h; 
i++) {
 
  122         float accum_inner_num = 0.f;
 
  123         float accum_inner_den = 0.f;
 
  125         for (
int j = 0; j < 
w; j++) {
 
  126             mu1_sq_val  = mu1_sq[
i * 
w + j];
 
  127             mu2_sq_val  = mu2_sq[
i * 
w + j];
 
  128             mu1_mu2_val = mu1_mu2[
i * 
w + j];
 
  129             xx_filt_val = xx_filt[
i * 
w + j];
 
  130             yy_filt_val = yy_filt[
i * 
w + j];
 
  131             xy_filt_val = xy_filt[
i * 
w + j];
 
  133             sigma1_sq = xx_filt_val - mu1_sq_val;
 
  134             sigma2_sq = yy_filt_val - mu2_sq_val;
 
  135             sigma12   = xy_filt_val - mu1_mu2_val;
 
  137             sigma1_sq = 
FFMAX(sigma1_sq, 0.0
f);
 
  138             sigma2_sq = 
FFMAX(sigma2_sq, 0.0
f);
 
  139             sigma12   = 
FFMAX(sigma12,   0.0
f);
 
  141             g = sigma12 / (sigma1_sq + eps);
 
  142             sv_sq = sigma2_sq - 
g * sigma12;
 
  144             if (sigma1_sq < eps) {
 
  150             if (sigma2_sq < eps) {
 
  159             sv_sq = 
FFMAX(sv_sq, eps);
 
  163             num_val = 
log2f(1.0
f + 
g * 
g * sigma1_sq / (sv_sq + sigma_nsq));
 
  164             den_val = 
log2f(1.0
f + sigma1_sq / sigma_nsq);
 
  167                 num_val = den_val = 1.f;
 
  169             accum_inner_num += num_val;
 
  170             accum_inner_den += den_val;
 
  173         accum_num += accum_inner_num;
 
  174         accum_den += accum_inner_den;
 
  181 static void vif_xx_yy_xy(
const float *x, 
const float *y, 
float *xx, 
float *yy,
 
  182                          float *xy, 
int w, 
int h)
 
  184     for (
int i = 0; 
i < 
h; 
i++) {
 
  185         for (
int j = 0; j < 
w; j++) {
 
  188             float xxval = xval * xval;
 
  189             float yyval = yval * yval;
 
  190             float xyval = xval * yval;
 
  209     const float *
src = 
td->src;
 
  210     float *dst = 
td->dst;
 
  213     int src_stride = 
td->src_stride;
 
  214     int dst_stride = 
td->dst_stride;
 
  215     int filt_w = 
td->filter_width;
 
  216     float *
temp = 
td->temp[jobnr];
 
  217     const int slice_start = (
h * jobnr) / nb_jobs;
 
  218     const int slice_end = (
h * (jobnr+1)) / nb_jobs;
 
  222         for (
int j = 0; j < 
w; j++) {
 
  225             if (
i >= filt_w / 2 && 
i < 
h - filt_w / 2 - 1) {
 
  226                 for (
int filt_i = 0; filt_i < filt_w; filt_i++) {
 
  227                     const float filt_coeff = 
filter[filt_i];
 
  229                     int ii = 
i - filt_w / 2 + filt_i;
 
  231                     img_coeff = 
src[ii * src_stride + j];
 
  232                     sum += filt_coeff * img_coeff;
 
  235                 for (
int filt_i = 0; filt_i < filt_w; filt_i++) {
 
  236                     const float filt_coeff = 
filter[filt_i];
 
  237                     int ii = 
i - filt_w / 2 + filt_i;
 
  240                     ii = ii < 0 ? -ii : (ii >= 
h ? 2 * 
h - ii - 1 : ii);
 
  242                     img_coeff = 
src[ii * src_stride + j];
 
  243                     sum += filt_coeff * img_coeff;
 
  251         for (
int j = 0; j < 
w; j++) {
 
  254             if (j >= filt_w / 2 && j < 
w - filt_w / 2 - 1) {
 
  255                 for (
int filt_j = 0; filt_j < filt_w; filt_j++) {
 
  256                     const float filt_coeff = 
filter[filt_j];
 
  257                     int jj = j - filt_w / 2 + filt_j;
 
  260                     img_coeff = 
temp[jj];
 
  261                     sum += filt_coeff * img_coeff;
 
  264                 for (
int filt_j = 0; filt_j < filt_w; filt_j++) {
 
  265                     const float filt_coeff = 
filter[filt_j];
 
  266                     int jj = j - filt_w / 2 + filt_j;
 
  269                     jj = jj < 0 ? -jj : (jj >= 
w ? 2 * 
w - jj - 1 : jj);
 
  271                     img_coeff = 
temp[jj];
 
  272                     sum += filt_coeff * img_coeff;
 
  276             dst[
i * dst_stride + j] = sum;
 
  284                         const float *
ref, 
const float *
main, 
int w, 
int h,
 
  285                         int ref_stride, 
int main_stride, 
float *score,
 
  290     float *ref_scale = data_buf[0];
 
  291     float *main_scale = data_buf[1];
 
  292     float *ref_sq = data_buf[2];
 
  293     float *main_sq = data_buf[3];
 
  294     float *ref_main = data_buf[4];
 
  295     float *mu1 = data_buf[5];
 
  296     float *mu2 = data_buf[6];
 
  297     float *mu1_sq = data_buf[7];
 
  298     float *mu2_sq = data_buf[8];
 
  299     float *mu1_mu2 = data_buf[9];
 
  300     float *ref_sq_filt = data_buf[10];
 
  301     float *main_sq_filt = data_buf[11];
 
  302     float *ref_main_filt = data_buf[12];
 
  304     const float *curr_ref_scale  = 
ref;
 
  305     const float *curr_main_scale = 
main;
 
  306     int curr_ref_stride = ref_stride;
 
  307     int curr_main_stride = main_stride;
 
  315         const int nb_threads = 
FFMIN(
h, gnb_threads);
 
  320         td.filter_width = filter_width;
 
  323             td.src = curr_ref_scale;
 
  327             td.src_stride = curr_ref_stride;
 
  332             td.src = curr_main_scale;
 
  334             td.src_stride = curr_main_stride;
 
  337             vif_dec2(mu1, ref_scale, buf_valid_w, buf_valid_h, 
w, 
w);
 
  338             vif_dec2(mu2, main_scale, buf_valid_w, buf_valid_h, 
w, 
w);
 
  346             curr_ref_scale = ref_scale;
 
  347             curr_main_scale = main_scale;
 
  350             curr_main_stride = 
w;
 
  353         td.src = curr_ref_scale;
 
  357         td.src_stride = curr_ref_stride;
 
  362         td.src = curr_main_scale;
 
  364         td.src_stride = curr_main_stride;
 
  369         vif_xx_yy_xy(curr_ref_scale, curr_main_scale, ref_sq, main_sq, ref_main, 
w, 
h);
 
  372         td.dst = ref_sq_filt;
 
  377         td.dst = main_sq_filt;
 
  382         td.dst = ref_main_filt;
 
  385         vif_statistic(mu1_sq, mu2_sq, mu1_mu2, ref_sq_filt, main_sq_filt,
 
  386                       ref_main_filt, &num, &den, 
w, 
h);
 
  388         score[
scale] = den <= FLT_EPSILON ? 1.f : num / den;
 
  394 #define offset_fn(type, bits)                            \ 
  395 static void offset_##bits##bit(VIFContext *s,            \ 
  396                                const AVFrame *ref,       \ 
  397                                AVFrame *main, int stride)\ 
  402     int ref_stride = ref->linesize[0];                   \ 
  403     int main_stride = main->linesize[0];                 \ 
  405     const type *ref_ptr = (const type *) ref->data[0];   \ 
  406     const type *main_ptr = (const type *) main->data[0]; \ 
  408     const float factor = s->factor;         \ 
  410     float *ref_ptr_data = s->ref_data;      \ 
  411     float *main_ptr_data = s->main_data;    \ 
  413     for (int i = 0; i < h; i++) {           \ 
  414         for (int j = 0; j < w; j++) {       \ 
  415             ref_ptr_data[j] = ref_ptr[j] * factor - 128.f;   \ 
  416             main_ptr_data[j] = main_ptr[j] * factor - 128.f; \ 
  418         ref_ptr += ref_stride / sizeof(type);   \ 
  420         main_ptr += main_stride / sizeof(type); \ 
  421         main_ptr_data += w;                     \ 
  441     s->factor = 1.f / (1 << (
s->desc->comp[0].depth - 8));
 
  442     if (
s->desc->comp[0].depth <= 8) {
 
  449                  s->width, 
s->height, 
s->width, 
s->width,
 
  450                  score, 
s->data_buf, 
s->temp, 
s->nb_threads);
 
  452     set_meta(metadata, 
"lavfi.vif.scale.0", score[0]);
 
  453     set_meta(metadata, 
"lavfi.vif.scale.1", score[1]);
 
  454     set_meta(metadata, 
"lavfi.vif.scale.2", score[2]);
 
  455     set_meta(metadata, 
"lavfi.vif.scale.3", score[3]);
 
  457     for (
int i = 0; 
i < 4; 
i++) {
 
  458         s->vif_min[
i]  = 
FFMIN(
s->vif_min[
i], score[
i]);
 
  459         s->vif_max[
i]  = 
FFMAX(
s->vif_max[
i], score[
i]);
 
  460         s->vif_sum[
i] += score[
i];
 
  475 #define PF(suf) AV_PIX_FMT_YUV420##suf,  AV_PIX_FMT_YUV422##suf,  AV_PIX_FMT_YUV444##suf 
  485     if (
ctx->inputs[0]->w != 
ctx->inputs[1]->w ||
 
  486         ctx->inputs[0]->h != 
ctx->inputs[1]->h) {
 
  492     s->width = 
ctx->inputs[0]->w;
 
  493     s->height = 
ctx->inputs[0]->h;
 
  496     for (
int i = 0; 
i < 4; 
i++) {
 
  497         s->vif_min[
i] =  DBL_MAX;
 
  498         s->vif_max[
i] = -DBL_MAX;
 
  502         if (!(
s->data_buf[
i] = 
av_calloc(
s->width, 
s->height * 
sizeof(
float))))
 
  506     if (!(
s->ref_data = 
av_calloc(
s->width, 
s->height * 
sizeof(
float))))
 
  509     if (!(
s->main_data = 
av_calloc(
s->width, 
s->height * 
sizeof(
float))))
 
  512     if (!(
s->temp = 
av_calloc(
s->nb_threads, 
sizeof(
s->temp[0]))))
 
  515     for (
int i = 0; 
i < 
s->nb_threads; 
i++) {
 
  536         out_frame = main_frame;
 
  555     outlink->
w = mainlink->
w;
 
  556     outlink->
h = mainlink->
h;
 
  588     if (
s->nb_frames > 0) {
 
  589         for (
int i = 0; 
i < 4; 
i++)
 
  591                    i, 
s->vif_sum[
i] / 
s->nb_frames, 
s->vif_min[
i], 
s->vif_max[
i]);
 
  600     for (
int i = 0; 
i < 
s->nb_threads && 
s->temp; 
i++)
 
  630     .preinit       = vif_framesync_preinit,
 
  633     .priv_class    = &vif_class,
 
  
static const AVFilterPad vif_outputs[]
AVRational time_base
Time base for the incoming frames.
int ff_framesync_configure(FFFrameSync *fs)
Configure a frame sync structure.
AVPixelFormat
Pixel format.
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
void ff_framesync_uninit(FFFrameSync *fs)
Free all memory currently allocated.
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
static int process_frame(FFFrameSync *fs)
#define FILTER_PIXFMTS_ARRAY(array)
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
#define offset_fn(type, bits)
static void vif_xx_yy_xy(const float *x, const float *y, float *xx, float *yy, float *xy, int w, int h)
This structure describes decoded (raw) audio or video data.
int64_t pts
Presentation timestamp in time_base units (time when frame should be shown to user).
static av_cold void uninit(AVFilterContext *ctx)
static const float vif_filter1d_table[4][17]
@ AV_PIX_FMT_YUV440P
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
filter_frame For filters that do not use the this method is called when a frame is pushed to the filter s input It can be called at any time except in a reentrant way If the input frame is enough to produce then the filter should push the output frames on the output link immediately As an exception to the previous rule if the input frame is enough to produce several output frames then the filter needs output only at least one per link The additional frames can be left buffered in the filter
const char * name
Filter name.
static int vif_filter1d(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
static enum AVPixelFormat pix_fmts[]
static const uint8_t vif_filter1d_width1[4]
A link between two filters.
const AVPixFmtDescriptor * desc
@ EXT_STOP
Completely stop all streams with this one.
static av_always_inline float scale(float x, float s)
static void vif_dec2(const float *src, float *dst, int w, int h, int src_stride, int dst_stride)
#define AV_PIX_FMT_GRAY16
unsigned sync
Synchronization level: frames on input at the highest sync level will generate output frame events.
A filter pad used for either input or output.
@ AV_PIX_FMT_YUVJ411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples) full scale (JPEG), deprecated in favor ...
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
@ AV_PIX_FMT_YUVJ422P
planar YUV 4:2:2, 16bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV422P and setting col...
static const AVFrame * ref_frame(const struct pl_frame_mix *mix)
static int slice_end(AVCodecContext *avctx, AVFrame *pict)
Handle slice ends.
AVRational sample_aspect_ratio
agreed upon sample aspect ratio
AVRational frame_rate
Frame rate of the stream on the link, or 1/0 if unknown or variable; if left to 0/0,...
#define AV_PIX_FMT_GRAY14
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
static AVFrame * do_vif(AVFilterContext *ctx, AVFrame *main, const AVFrame *ref)
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
#define FILTER_INPUTS(array)
@ AV_PIX_FMT_YUVJ444P
planar YUV 4:4:4, 24bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV444P and setting col...
#define AV_PIX_FMT_GRAY10
Describe the class of an AVClass context structure.
#define fs(width, name, subs,...)
@ AV_PIX_FMT_YUVJ420P
planar YUV 4:2:0, 12bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV420P and setting col...
@ AV_PIX_FMT_GRAY8
Y , 8bpp.
int main(int argc, char **argv)
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
AVFilterContext * src
source filter
#define AV_LOG_INFO
Standard information.
static int compute_vif2(AVFilterContext *ctx, const float *ref, const float *main, int w, int h, int ref_stride, int main_stride, float *score, float *const data_buf[NUM_DATA_BUFS], float **temp, int gnb_threads)
#define i(width, name, range_min, range_max)
int w
agreed upon image width
int ff_filter_get_nb_threads(AVFilterContext *ctx)
Get number of threads for current filter instance.
Used for passing data between threads.
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf default value
@ AV_PIX_FMT_YUVJ440P
planar YUV 4:4:0 full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV440P and setting color_range
const char * name
Pad name.
static int config_output(AVFilterLink *outlink)
void * av_calloc(size_t nmemb, size_t size)
static void vif_statistic(const float *mu1_sq, const float *mu2_sq, const float *mu1_mu2, const float *xx_filt, const float *yy_filt, const float *xy_filt, float *num, float *den, int w, int h)
int ff_framesync_init(FFFrameSync *fs, AVFilterContext *parent, unsigned nb_in)
Initialize a frame sync structure.
static void set_meta(AVDictionary **metadata, int chan, const char *key, const char *fmt, float val)
enum FFFrameSyncExtMode before
Extrapolation mode for timestamps before the first frame.
int h
agreed upon image height
static const AVFilterPad vif_inputs[]
#define AVFILTER_FLAG_METADATA_ONLY
The filter is a "metadata" filter - it does not modify the frame data in any way.
static int ref[MAX_W *MAX_W]
AVRational time_base
Define the time base used by the PTS of the frames/samples which will pass through this link.
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
float * data_buf[NUM_DATA_BUFS]
static int activate(AVFilterContext *ctx)
#define AVFILTER_FLAG_SLICE_THREADS
The filter supports multithreading by splitting frames into multiple parts and processing them concur...
@ AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
#define FILTER_OUTPUTS(array)
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
@ AV_PIX_FMT_YUV411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
#define AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
Same as AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC, except that the filter will have its filter_frame() c...
@ AV_PIX_FMT_YUV410P
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)
enum FFFrameSyncExtMode after
Extrapolation mode for timestamps after the last frame.
int ff_framesync_activate(FFFrameSync *fs)
Examine the frames in the filter's input and try to produce output.
int ff_framesync_dualinput_get(FFFrameSync *fs, AVFrame **f0, AVFrame **f1)
static const AVOption vif_options[]
#define AV_PIX_FMT_GRAY12
static av_always_inline int ff_filter_execute(AVFilterContext *ctx, avfilter_action_func *func, void *arg, int *ret, int nb_jobs)
FRAMESYNC_DEFINE_CLASS(vif, VIFContext, fs)
static int config_input_ref(AVFilterLink *inlink)