Go to the documentation of this file.
   53 #define OFFSET(x) offsetof(VMAFMotionContext, x) 
   54 #define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM 
   64                           int h, ptrdiff_t _img1_stride, ptrdiff_t _img2_stride)
 
   66     ptrdiff_t img1_stride = _img1_stride / 
sizeof(*img1);
 
   67     ptrdiff_t img2_stride = _img2_stride / 
sizeof(*img2);
 
   71     for (
i = 0; 
i < 
h; 
i++) {
 
   72         for (j = 0; j < 
w; j++) {
 
   83                           uint16_t *dst, 
int w, 
int h, ptrdiff_t _src_stride,
 
   84                           ptrdiff_t _dst_stride)
 
   86     ptrdiff_t src_stride = _src_stride / 
sizeof(*src);
 
   87     ptrdiff_t dst_stride = _dst_stride / 
sizeof(*dst);
 
   88     int radius = filt_w / 2;
 
   89     int borders_left = radius;
 
   90     int borders_right = 
w - (filt_w - radius);
 
   94     for (
i = 0; 
i < 
h; 
i++) {
 
   95         for (j = 0; j < borders_left; j++) {
 
   97             for (k = 0; k < filt_w; k++) {
 
   98                 int j_tap = 
FFABS(j - radius + k);
 
  100                     j_tap = 
w - (j_tap - 
w + 1);
 
  102                 sum += 
filter[k] * 
src[
i * src_stride + j_tap];
 
  107         for (j = borders_left; j < borders_right; j++) {
 
  109             for (k = 0; k < filt_w; k++) {
 
  110                 sum += 
filter[k] * 
src[
i * src_stride + j - radius + k];
 
  115         for (j = borders_right; j < 
w; j++) {
 
  117             for (k = 0; k < filt_w; k++) {
 
  118                 int j_tap = 
FFABS(j - radius + k);
 
  120                     j_tap = 
w - (j_tap - 
w + 1);
 
  122                 sum += 
filter[k] * 
src[
i * src_stride + j_tap];
 
  129 #define conv_y_fn(type, bits) \ 
  130 static void convolution_y_##bits##bit(const uint16_t *filter, int filt_w, \ 
  131                                       const uint8_t *_src, uint16_t *dst, \ 
  132                                       int w, int h, ptrdiff_t _src_stride, \ 
  133                                       ptrdiff_t _dst_stride) \ 
  135     const type *src = (const type *) _src; \ 
  136     ptrdiff_t src_stride = _src_stride / sizeof(*src); \ 
  137     ptrdiff_t dst_stride = _dst_stride / sizeof(*dst); \ 
  138     int radius = filt_w / 2; \ 
  139     int borders_top = radius; \ 
  140     int borders_bottom = h - (filt_w - radius); \ 
  144     for (i = 0; i < borders_top; i++) { \ 
  145         for (j = 0; j < w; j++) { \ 
  147             for (k = 0; k < filt_w; k++) { \ 
  148                 int i_tap = FFABS(i - radius + k); \ 
  150                     i_tap = h - (i_tap - h + 1); \ 
  152                 sum += filter[k] * src[i_tap * src_stride + j]; \ 
  154             dst[i * dst_stride + j] = sum >> bits; \ 
  157     for (i = borders_top; i < borders_bottom; i++) { \ 
  158         for (j = 0; j < w; j++) { \ 
  160             for (k = 0; k < filt_w; k++) { \ 
  161                 sum += filter[k] * src[(i - radius + k) * src_stride + j]; \ 
  163             dst[i * dst_stride + j] = sum >> bits; \ 
  166     for (i = borders_bottom; i < h; i++) { \ 
  167         for (j = 0; j < w; j++) { \ 
  169             for (k = 0; k < filt_w; k++) { \ 
  170                 int i_tap = FFABS(i - radius + k); \ 
  172                     i_tap = h - (i_tap - h + 1); \ 
  174                 sum += filter[k] * src[i_tap * src_stride + j]; \ 
  176             dst[i * dst_stride + j] = sum >> bits; \ 
  186     dsp->convolution_y = bpp == 10 ? convolution_y_10bit : convolution_y_8bit;
 
  194     s->vmafdsp.convolution_y(
s->filter, 5, 
ref->data[0], 
s->temp_data,
 
  195                              s->width, 
s->height, 
ref->linesize[0], 
s->stride);
 
  196     s->vmafdsp.convolution_x(
s->filter, 5, 
s->temp_data, 
s->blur_data[0],
 
  197                              s->width, 
s->height, 
s->stride, 
s->stride);
 
  202         uint64_t sad = 
s->vmafdsp.sad(
s->blur_data[1], 
s->blur_data[0],
 
  203                                       s->width, 
s->height, 
s->stride, 
s->stride);
 
  208     FFSWAP(uint16_t *, 
s->blur_data[0], 
s->blur_data[1]);
 
  210     s->motion_sum += score;
 
  228     set_meta(&
ref->metadata, 
"lavfi.vmafmotion.score", score);
 
  230         fprintf(
s->stats_file,
 
  231                 "n:%"PRId64
" motion:%0.2lf\n", 
s->data.nb_frames, score);
 
  248     s->stride = 
FFALIGN(
w * 
sizeof(uint16_t), 32);
 
  250     data_sz = (size_t) 
s->stride * 
h;
 
  257     for (
i = 0; 
i < 5; 
i++) {
 
  261     vmafmotiondsp_init(&
s->vmafdsp, 
desc->comp[0].depth);
 
  276             (
desc->comp[0].depth == 8 || 
desc->comp[0].depth == 10) &&
 
  290                               ctx->inputs[0]->h, 
ctx->inputs[0]->format);
 
  299     return s->nb_frames > 0 ? 
s->motion_sum / 
s->nb_frames : 0.0;
 
  313     if (
s->stats_file_str) {
 
  314         if (!strcmp(
s->stats_file_str, 
"-")) {
 
  315             s->stats_file = stdout;
 
  318             if (!
s->stats_file) {
 
  323                        s->stats_file_str, buf);
 
  337     if (
s->data.nb_frames > 0) {
 
  341     if (
s->stats_file && 
s->stats_file != stdout)
 
  342         fclose(
s->stats_file);
 
  355     .
name          = 
"vmafmotion",
 
  360     .priv_class    = &vmafmotion_class,
 
  
AVPixelFormat
Pixel format.
 
Filter design: in this document, the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: the query_formats method should set, for each input and each output, the list of supported formats. For video, that means pixel format. For audio, that means channel layout, sample format (the sample packing is implied by the sample format) and sample rate. The lists are not just lists, they are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining list, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
 
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
 
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
 
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
 
This structure describes decoded (raw) audio or video data.
 
#define FILTER_QUERY_FUNC(func)
 
filter_frame: For filters that do not use the activate() callback, this method is called when a frame is pushed to the filter's input. It can be called at any time except in a reentrant way. If the input frame is enough to produce output, then the filter should push the output frames on the output link immediately. As an exception to the previous rule, if the input frame is enough to produce several output frames, then the filter needs to output only at least one per link. The additional frames can be left buffered in the filter
 
const char * name
Filter name.
 
A link between two filters.
 
double ff_vmafmotion_process(VMAFMotionData *s, AVFrame *ref)
 
static int filter_frame(AVFilterLink *inlink, AVFrame *ref)
 
int av_strerror(int errnum, char *errbuf, size_t errbuf_size)
Put a description of the AVERROR code errnum in errbuf.
 
#define AV_PIX_FMT_FLAG_HWACCEL
Pixel format is an HW accelerated format.
 
static void convolution_x(const uint16_t *filter, int filt_w, const uint16_t *src, uint16_t *dst, int w, int h, ptrdiff_t _src_stride, ptrdiff_t _dst_stride)
 
static int config_input_ref(AVFilterLink *inlink)
 
A filter pad used for either input or output.
 
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
 
const AVFilterPad ff_video_default_filterpad[1]
An AVFilterPad array whose only entry has name "default" and is of type AVMEDIA_TYPE_VIDEO.
 
Filter design: in this document, the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: the query_formats method should set, for each input and each output, the list of supported formats. For video, that means pixel format. For audio, that means channel layout, sample format (the sample packing is implied by the sample format) and sample rate. The lists are not just lists, they are references to shared objects.
 
int ff_vmafmotion_init(VMAFMotionData *s, int w, int h, enum AVPixelFormat fmt)
 
#define FILTER_INPUTS(array)
 
static uint8_t img1[WIDTH *HEIGHT]
 
#define FFABS(a)
Absolute value. Note: INT_MIN / INT64_MIN result in undefined behavior, as they are not representable as absolute values of their type.
 
Describe the class of an AVClass context structure.
 
AVFILTER_DEFINE_CLASS(vmafmotion)
 
double ff_vmafmotion_uninit(VMAFMotionData *s)
 
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
 
#define AV_PIX_FMT_FLAG_RGB
The pixel format contains RGB-like data (as opposed to YUV/grayscale).
 
static uint8_t img2[WIDTH *HEIGHT]
 
#define AV_PIX_FMT_FLAG_BITSTREAM
All values of a component are bit-wise packed end to end.
 
static av_cold int init(AVFilterContext *ctx)
 
const AVFilter ff_vf_vmafmotion
 
#define AV_LOG_INFO
Standard information.
 
static uint64_t image_sad(const uint16_t *img1, const uint16_t *img2, int w, int h, ptrdiff_t _img1_stride, ptrdiff_t _img2_stride)
 
#define i(width, name, range_min, range_max)
 
It's the only field you need to keep, assuming you have a context. There is some magic you don't need to care about around this; just let it vf default value
 
#define AV_PIX_FMT_FLAG_BE
Pixel format is big-endian.
 
const char * name
Pad name.
 
FILE * avpriv_fopen_utf8(const char *path, const char *mode)
Open a file using a UTF-8 filename.
 
#define FFSWAP(type, a, b)
 
static int query_formats(AVFilterContext *ctx)
 
static const float FILTER_5[5]
 
#define AVFILTER_FLAG_METADATA_ONLY
The filter is a "metadata" filter - it does not modify the frame data in any way.
 
static int ref[MAX_W *MAX_W]
 
#define AV_PIX_FMT_FLAG_PLANAR
At least one pixel component is not in the first data plane.
 
static void do_vmafmotion(AVFilterContext *ctx, AVFrame *ref)
 
static const AVFilterPad vmafmotion_inputs[]
 
#define conv_y_fn(type, bits)
 
static const AVOption vmafmotion_options[]
 
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
 
#define FILTER_OUTPUTS(array)
 
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
 
static av_cold void uninit(AVFilterContext *ctx)
 
#define flags(name, subs,...)
 
#define AV_PIX_FMT_FLAG_PAL
Pixel format has a palette in data[1], values are indexes in this palette.
 
static void set_meta(AVDictionary **metadata, const char *key, float d)