FFmpeg
vf_xmedian.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2019 Paul B Mahol
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 #include "config_components.h"
22 
23 #include "libavutil/avstring.h"
24 #include "libavutil/imgutils.h"
25 #include "libavutil/intreadwrite.h"
26 #include "libavutil/opt.h"
27 #include "libavutil/pixdesc.h"
28 #include "libavutil/qsort.h"
29 
30 #include "avfilter.h"
31 #include "formats.h"
32 #include "internal.h"
33 #include "framesync.h"
34 #include "video.h"
35 
36 typedef struct XMedianContext {
37  const AVClass *class;
39  int nb_inputs;
40  int nb_frames;
42  int planes;
43  float percentile;
44 
45  int xmedian;
46  int radius;
47  int index;
48  int depth;
49  int max;
50  int nb_planes;
51  int linesizes[4];
52  int width[4];
53  int height[4];
54 
55  uint8_t **data;
56  int *linesize;
57 
60 
61  int (*median_frames)(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs);
63 
64 static const enum AVPixelFormat pixel_fmts[] = {
92 };
93 
95 {
96  XMedianContext *s = ctx->priv;
97 
98  if (!s->xmedian)
99  s->nb_inputs = s->radius * 2 + 1;
100 
101  if (s->nb_inputs & 1)
102  s->index = s->radius * 2.f * s->percentile;
103  else
104  s->index = av_clip(s->radius * 2.f * s->percentile, 1, s->nb_inputs - 1);
105  s->frames = av_calloc(s->nb_inputs, sizeof(*s->frames));
106  if (!s->frames)
107  return AVERROR(ENOMEM);
108 
109  return 0;
110 }
111 
112 typedef struct ThreadData {
113  AVFrame **in, *out;
114 } ThreadData;
115 
/* Sort comparator for 8-bit samples: sign of (*p1 - *p2). */
static int compare8(const void *p1, const void *p2)
{
    const uint8_t *a = p1;
    const uint8_t *b = p2;
    const int left = *a, right = *b;

    return FFDIFFSIGN(left, right);
}
122 
/* Sort comparator for 16-bit samples: sign of (*p1 - *p2). */
static int compare16(const void *p1, const void *p2)
{
    const uint16_t *a = p1;
    const uint16_t *b = p2;
    const int left = *a, right = *b;

    return FFDIFFSIGN(left, right);
}
129 
130 #define MEDIAN_SLICE(name, type, comparei) \
131 static int median_frames ## name(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs) \
132 { \
133  XMedianContext *s = ctx->priv; \
134  ThreadData *td = arg; \
135  AVFrame **in = td->in; \
136  AVFrame *out = td->out; \
137  const int nb_inputs = s->nb_inputs; \
138  uint8_t **srcf = s->data + jobnr * nb_inputs; \
139  int *linesize = s->linesize + jobnr * nb_inputs; \
140  const int radius = s->radius; \
141  const int index = s->index; \
142  type values[256]; \
143  \
144  for (int p = 0; p < s->nb_planes; p++) { \
145  const int slice_start = (s->height[p] * jobnr) / nb_jobs; \
146  const int slice_end = (s->height[p] * (jobnr+1)) / nb_jobs; \
147  const int width = s->width[p]; \
148  type *dst = (type *)(out->data[p] + slice_start * out->linesize[p]); \
149  ptrdiff_t dst_linesize = out->linesize[p] / sizeof(type); \
150  \
151  if (!((1 << p) & s->planes)) { \
152  av_image_copy_plane((uint8_t *)dst, out->linesize[p], \
153  in[radius]->data[p] + slice_start * in[radius]->linesize[p], \
154  in[radius]->linesize[p], \
155  s->linesizes[p], slice_end - slice_start); \
156  continue; \
157  } \
158  \
159  for (int i = 0; i < nb_inputs; i++) \
160  linesize[i] = in[i]->linesize[p]; \
161  \
162  for (int i = 0; i < nb_inputs; i++) \
163  srcf[i] = in[i]->data[p] + slice_start * linesize[i]; \
164  \
165  for (int y = slice_start; y < slice_end; y++) { \
166  for (int x = 0; x < width; x++) { \
167  for (int i = 0; i < nb_inputs; i++) { \
168  const type *src = (const type *)srcf[i]; \
169  values[i] = src[x]; \
170  } \
171  \
172  AV_QSORT(values, nb_inputs, type, comparei); \
173  if (nb_inputs & 1) \
174  dst[x] = values[index]; \
175  else \
176  dst[x] = (values[index] + values[index - 1]) >> 1; \
177  } \
178  \
179  dst += dst_linesize; \
180  for (int i = 0; i < nb_inputs; i++) \
181  srcf[i] += linesize[i]; \
182  } \
183  } \
184  \
185  return 0; \
186 }
187 
188 MEDIAN_SLICE(8, uint8_t, compare8)
189 MEDIAN_SLICE(16, uint16_t, compare16)
190 
192 {
193  if (s->nb_inputs & 1)
194  s->index = s->radius * 2.f * s->percentile;
195  else
196  s->index = av_clip(s->radius * 2.f * s->percentile, 1, s->nb_inputs - 1);
197 }
198 
200 {
201  AVFilterContext *ctx = fs->parent;
202  AVFilterLink *outlink = ctx->outputs[0];
203  XMedianContext *s = fs->opaque;
204  AVFrame **in = s->frames;
205  AVFrame *out;
206  ThreadData td;
207  int i, ret;
208 
209  update_index(s);
210 
211  for (i = 0; i < s->nb_inputs; i++) {
212  if ((ret = ff_framesync_get_frame(&s->fs, i, &in[i], 0)) < 0)
213  return ret;
214  }
215 
216  if (ctx->is_disabled) {
217  out = av_frame_clone(in[0]);
218  } else {
219  out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
220  }
221  if (!out)
222  return AVERROR(ENOMEM);
223  out->pts = av_rescale_q(s->fs.pts, s->fs.time_base, outlink->time_base);
224 
225  if (!ctx->is_disabled) {
226  td.in = in;
227  td.out = out;
228  ff_filter_execute(ctx, s->median_frames, &td, NULL,
229  FFMIN(s->height[1], s->nb_threads));
230  }
231 
232  return ff_filter_frame(outlink, out);
233 }
234 
235 static int config_output(AVFilterLink *outlink)
236 {
237  AVFilterContext *ctx = outlink->src;
238  XMedianContext *s = ctx->priv;
239  AVRational frame_rate = ctx->inputs[0]->frame_rate;
240  AVRational sar = ctx->inputs[0]->sample_aspect_ratio;
241  AVFilterLink *inlink = ctx->inputs[0];
242  int height = ctx->inputs[0]->h;
243  int width = ctx->inputs[0]->w;
244  FFFrameSyncIn *in;
245  int i, ret;
246 
247  for (int i = 1; i < s->nb_inputs && s->xmedian; i++) {
248  if (ctx->inputs[i]->h != height || ctx->inputs[i]->w != width) {
249  av_log(ctx, AV_LOG_ERROR, "Input %d size (%dx%d) does not match input %d size (%dx%d).\n", i, ctx->inputs[i]->w, ctx->inputs[i]->h, 0, width, height);
250  return AVERROR(EINVAL);
251  }
252  }
253 
254  s->desc = av_pix_fmt_desc_get(outlink->format);
255  if (!s->desc)
256  return AVERROR_BUG;
257  s->nb_planes = av_pix_fmt_count_planes(outlink->format);
258  s->depth = s->desc->comp[0].depth;
259  s->max = (1 << s->depth) - 1;
260  s->nb_threads = ff_filter_get_nb_threads(ctx);
261 
262  if (s->depth <= 8)
263  s->median_frames = median_frames8;
264  else
265  s->median_frames = median_frames16;
266 
267  if ((ret = av_image_fill_linesizes(s->linesizes, inlink->format, inlink->w)) < 0)
268  return ret;
269 
270  s->width[1] = s->width[2] = AV_CEIL_RSHIFT(inlink->w, s->desc->log2_chroma_w);
271  s->width[0] = s->width[3] = inlink->w;
272  s->height[1] = s->height[2] = AV_CEIL_RSHIFT(inlink->h, s->desc->log2_chroma_h);
273  s->height[0] = s->height[3] = inlink->h;
274 
275  s->data = av_calloc(s->nb_threads * s->nb_inputs, sizeof(*s->data));
276  if (!s->data)
277  return AVERROR(ENOMEM);
278 
279  s->linesize = av_calloc(s->nb_threads * s->nb_inputs, sizeof(*s->linesize));
280  if (!s->linesize)
281  return AVERROR(ENOMEM);
282 
283  if (!s->xmedian)
284  return 0;
285 
286  outlink->w = width;
287  outlink->h = height;
288  outlink->frame_rate = frame_rate;
289  outlink->sample_aspect_ratio = sar;
290 
291  if ((ret = ff_framesync_init(&s->fs, ctx, s->nb_inputs)) < 0)
292  return ret;
293 
294  in = s->fs.in;
295  s->fs.opaque = s;
296  s->fs.on_event = process_frame;
297 
298  for (i = 0; i < s->nb_inputs; i++) {
299  AVFilterLink *inlink = ctx->inputs[i];
300 
301  in[i].time_base = inlink->time_base;
302  in[i].sync = 1;
303  in[i].before = EXT_STOP;
304  in[i].after = EXT_INFINITY;
305  }
306 
307  ret = ff_framesync_configure(&s->fs);
308  outlink->time_base = s->fs.time_base;
309 
310  return ret;
311 }
312 
314 {
315  XMedianContext *s = ctx->priv;
316 
317  ff_framesync_uninit(&s->fs);
318 
319  for (int i = 0; i < s->nb_frames && s->frames && !s->xmedian; i++)
320  av_frame_free(&s->frames[i]);
321  av_freep(&s->frames);
322  av_freep(&s->data);
323  av_freep(&s->linesize);
324 }
325 
327 {
328  XMedianContext *s = ctx->priv;
329  return ff_framesync_activate(&s->fs);
330 }
331 
332 #if CONFIG_XMEDIAN_FILTER
333 static av_cold int xmedian_init(AVFilterContext *ctx)
334 {
335  XMedianContext *s = ctx->priv;
336  int ret;
337 
338  s->xmedian = 1;
339 
340  s->radius = s->nb_inputs / 2;
341 
342  for (int i = 0; i < s->nb_inputs; i++) {
343  AVFilterPad pad = { 0 };
344 
345  pad.type = AVMEDIA_TYPE_VIDEO;
346  pad.name = av_asprintf("input%d", i);
347  if (!pad.name)
348  return AVERROR(ENOMEM);
349 
350  if ((ret = ff_append_inpad_free_name(ctx, &pad)) < 0)
351  return ret;
352  }
353 
354  return init(ctx);
355 }
356 
/* Helpers for the option tables. The flag sets are parenthesized so they
 * expand as a single value inside any larger expression. */
#define OFFSET(x) offsetof(XMedianContext, x)
#define FLAGS (AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_FILTERING_PARAM)
#define TFLAGS (AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_RUNTIME_PARAM)
360 
361 static const AVOption xmedian_options[] = {
362  { "inputs", "set number of inputs", OFFSET(nb_inputs), AV_OPT_TYPE_INT, {.i64=3}, 3, 255, .flags = FLAGS },
363  { "planes", "set planes to filter", OFFSET(planes), AV_OPT_TYPE_INT, {.i64=15}, 0, 15, .flags =TFLAGS },
364  { "percentile", "set percentile", OFFSET(percentile),AV_OPT_TYPE_FLOAT,{.dbl=0.5}, 0, 1, .flags =TFLAGS },
365  { NULL },
366 };
367 
368 static const AVFilterPad outputs[] = {
369  {
370  .name = "default",
371  .type = AVMEDIA_TYPE_VIDEO,
372  .config_props = config_output,
373  },
374 };
375 
377 
378 const AVFilter ff_vf_xmedian = {
379  .name = "xmedian",
380  .description = NULL_IF_CONFIG_SMALL("Pick median pixels from several video inputs."),
381  .priv_size = sizeof(XMedianContext),
382  .priv_class = &xmedian_class,
385  .preinit = xmedian_framesync_preinit,
386  .init = xmedian_init,
387  .uninit = uninit,
388  .activate = activate,
391  .process_command = ff_filter_process_command,
392 };
393 
394 #endif /* CONFIG_XMEDIAN_FILTER */
395 
396 #if CONFIG_TMEDIAN_FILTER
397 static int tmedian_filter_frame(AVFilterLink *inlink, AVFrame *in)
398 {
399  AVFilterContext *ctx = inlink->dst;
400  AVFilterLink *outlink = ctx->outputs[0];
401  XMedianContext *s = ctx->priv;
402  ThreadData td;
403  AVFrame *out;
404 
405  update_index(s);
406 
407  if (s->nb_frames < s->nb_inputs) {
408  s->frames[s->nb_frames] = in;
409  s->nb_frames++;
410  if (s->nb_frames < s->nb_inputs)
411  return 0;
412  } else {
413  av_frame_free(&s->frames[0]);
414  memmove(&s->frames[0], &s->frames[1], sizeof(*s->frames) * (s->nb_inputs - 1));
415  s->frames[s->nb_inputs - 1] = in;
416  }
417 
418  if (ctx->is_disabled) {
419  out = av_frame_clone(s->frames[0]);
420  if (!out)
421  return AVERROR(ENOMEM);
422  return ff_filter_frame(outlink, out);
423  }
424 
425  out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
426  if (!out)
427  return AVERROR(ENOMEM);
428  out->pts = s->frames[0]->pts;
429 
430  td.out = out;
431  td.in = s->frames;
432  ff_filter_execute(ctx, s->median_frames, &td, NULL,
433  FFMIN(s->height[1], s->nb_threads));
434 
435  return ff_filter_frame(outlink, out);
436 }
437 
438 static const AVOption tmedian_options[] = {
439  { "radius", "set median filter radius", OFFSET(radius), AV_OPT_TYPE_INT, {.i64=1}, 1, 127, .flags = FLAGS },
440  { "planes", "set planes to filter", OFFSET(planes), AV_OPT_TYPE_INT, {.i64=15}, 0, 15, .flags =TFLAGS },
441  { "percentile", "set percentile", OFFSET(percentile), AV_OPT_TYPE_FLOAT, {.dbl=0.5}, 0, 1, .flags =TFLAGS },
442  { NULL },
443 };
444 
445 static const AVFilterPad tmedian_inputs[] = {
446  {
447  .name = "default",
448  .type = AVMEDIA_TYPE_VIDEO,
449  .filter_frame = tmedian_filter_frame,
450  },
451 };
452 
453 static const AVFilterPad tmedian_outputs[] = {
454  {
455  .name = "default",
456  .type = AVMEDIA_TYPE_VIDEO,
457  .config_props = config_output,
458  },
459 };
460 
461 AVFILTER_DEFINE_CLASS(tmedian);
462 
463 const AVFilter ff_vf_tmedian = {
464  .name = "tmedian",
465  .description = NULL_IF_CONFIG_SMALL("Pick median pixels from successive frames."),
466  .priv_size = sizeof(XMedianContext),
467  .priv_class = &tmedian_class,
468  FILTER_INPUTS(tmedian_inputs),
469  FILTER_OUTPUTS(tmedian_outputs),
471  .init = init,
472  .uninit = uninit,
474  .process_command = ff_filter_process_command,
475 };
476 
477 #endif /* CONFIG_TMEDIAN_FILTER */
ff_get_video_buffer
AVFrame * ff_get_video_buffer(AVFilterLink *link, int w, int h)
Request a picture buffer with a specific set of permissions.
Definition: video.c:101
AV_PIX_FMT_YUVA422P16
#define AV_PIX_FMT_YUVA422P16
Definition: pixfmt.h:449
AV_PIX_FMT_GBRAP16
#define AV_PIX_FMT_GBRAP16
Definition: pixfmt.h:428
FFFrameSyncIn::time_base
AVRational time_base
Time base for the incoming frames.
Definition: framesync.h:96
ff_framesync_configure
int ff_framesync_configure(FFFrameSync *fs)
Configure a frame sync structure.
Definition: framesync.c:119
td
#define td
Definition: regdef.h:70
AVPixelFormat
AVPixelFormat
Pixel format.
Definition: pixfmt.h:64
av_clip
#define av_clip
Definition: common.h:95
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
ff_framesync_uninit
void ff_framesync_uninit(FFFrameSync *fs)
Free all memory currently allocated.
Definition: framesync.c:285
out
FILE * out
Definition: movenc.c:54
ff_filter_frame
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
Definition: avfilter.c:999
av_pix_fmt_desc_get
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:2662
ff_framesync_get_frame
int ff_framesync_get_frame(FFFrameSync *fs, unsigned in, AVFrame **rframe, unsigned get)
Get the current frame in an input.
Definition: framesync.c:248
FILTER_PIXFMTS_ARRAY
#define FILTER_PIXFMTS_ARRAY(array)
Definition: internal.h:170
MEDIAN_SLICE
#define MEDIAN_SLICE(name, type, comparei)
Definition: vf_xmedian.c:130
inlink
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
Definition: filter_design.txt:212
av_asprintf
char * av_asprintf(const char *fmt,...)
Definition: avstring.c:116
XMedianContext::median_frames
int(* median_frames)(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
Definition: vf_xmedian.c:61
av_frame_free
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
Definition: frame.c:111
AV_PIX_FMT_YUVA422P9
#define AV_PIX_FMT_YUVA422P9
Definition: pixfmt.h:441
XMedianContext::linesize
int * linesize
Definition: vf_xmedian.c:56
AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:325
pixdesc.h
AV_PIX_FMT_YUVA420P16
#define AV_PIX_FMT_YUVA420P16
Definition: pixfmt.h:448
AV_PIX_FMT_YUVA420P10
#define AV_PIX_FMT_YUVA420P10
Definition: pixfmt.h:443
AVOption
AVOption.
Definition: opt.h:251
AV_PIX_FMT_YUV420P10
#define AV_PIX_FMT_YUV420P10
Definition: pixfmt.h:406
FRAMESYNC_DEFINE_CLASS
#define FRAMESYNC_DEFINE_CLASS(name, context, field)
Definition: framesync.h:328
FLAGS
#define FLAGS
Definition: cmdutils.c:509
XMedianContext::nb_frames
int nb_frames
Definition: vf_xmedian.c:40
AV_PIX_FMT_YUV440P
@ AV_PIX_FMT_YUV440P
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
Definition: pixfmt.h:99
AVFilter::name
const char * name
Filter name.
Definition: avfilter.h:175
FFFrameSync
Frame sync structure.
Definition: framesync.h:146
EXT_INFINITY
@ EXT_INFINITY
Extend the frame to infinity.
Definition: framesync.h:75
ThreadData::out
AVFrame * out
Definition: af_adeclick.c:473
video.h
ThreadData::in
AVFrame * in
Definition: af_adecorrelate.c:154
AV_PIX_FMT_YUVA422P10
#define AV_PIX_FMT_YUVA422P10
Definition: pixfmt.h:444
AV_PIX_FMT_GRAY9
#define AV_PIX_FMT_GRAY9
Definition: pixfmt.h:386
formats.h
av_pix_fmt_count_planes
int av_pix_fmt_count_planes(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:2702
AV_PIX_FMT_YUVA420P9
#define AV_PIX_FMT_YUVA420P9
Definition: pixfmt.h:440
EXT_STOP
@ EXT_STOP
Completely stop all streams with this one.
Definition: framesync.h:65
AV_PIX_FMT_GBRP14
#define AV_PIX_FMT_GBRP14
Definition: pixfmt.h:424
AV_PIX_FMT_GBRAP
@ AV_PIX_FMT_GBRAP
planar GBRA 4:4:4:4 32bpp
Definition: pixfmt.h:205
XMedianContext::planes
int planes
Definition: vf_xmedian.c:42
XMedianContext::fs
FFFrameSync fs
Definition: vf_xmedian.c:59
AV_PIX_FMT_GBRP10
#define AV_PIX_FMT_GBRP10
Definition: pixfmt.h:422
AV_PIX_FMT_YUVA444P16
#define AV_PIX_FMT_YUVA444P16
Definition: pixfmt.h:450
FFFrameSyncIn
Input stream structure.
Definition: framesync.h:81
AV_PIX_FMT_YUV422P9
#define AV_PIX_FMT_YUV422P9
Definition: pixfmt.h:404
AV_PIX_FMT_GRAY16
#define AV_PIX_FMT_GRAY16
Definition: pixfmt.h:390
FFFrameSyncIn::sync
unsigned sync
Synchronization level: frames on input at the highest sync level will generate output frame events.
Definition: framesync.h:139
AVFILTER_FLAG_DYNAMIC_INPUTS
#define AVFILTER_FLAG_DYNAMIC_INPUTS
The number of the filter inputs is not determined just by AVFilter.inputs.
Definition: avfilter.h:116
config_output
static int config_output(AVFilterLink *outlink)
Definition: vf_xmedian.c:235
AVFilterPad
A filter pad used for either input or output.
Definition: internal.h:49
FFDIFFSIGN
#define FFDIFFSIGN(x, y)
Comparator.
Definition: macros.h:45
AV_PIX_FMT_YUV444P10
#define AV_PIX_FMT_YUV444P10
Definition: pixfmt.h:409
AV_PIX_FMT_YUVJ411P
@ AV_PIX_FMT_YUVJ411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples) full scale (JPEG), deprecated in favor ...
Definition: pixfmt.h:248
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
av_cold
#define av_cold
Definition: attributes.h:90
AV_PIX_FMT_YUV422P16
#define AV_PIX_FMT_YUV422P16
Definition: pixfmt.h:418
AV_PIX_FMT_YUVJ422P
@ AV_PIX_FMT_YUVJ422P
planar YUV 4:2:2, 16bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV422P and setting col...
Definition: pixfmt.h:79
AV_PIX_FMT_GBRAP10
#define AV_PIX_FMT_GBRAP10
Definition: pixfmt.h:426
width
#define width
av_image_fill_linesizes
int av_image_fill_linesizes(int linesizes[4], enum AVPixelFormat pix_fmt, int width)
Fill plane linesizes for an image with pixel format pix_fmt and width width.
Definition: imgutils.c:89
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:256
AV_PIX_FMT_GBRAP12
#define AV_PIX_FMT_GBRAP12
Definition: pixfmt.h:427
AV_PIX_FMT_YUVA420P
@ AV_PIX_FMT_YUVA420P
planar YUV 4:2:0, 20bpp, (1 Cr & Cb sample per 2x2 Y & A samples)
Definition: pixfmt.h:101
AV_PIX_FMT_YUV444P16
#define AV_PIX_FMT_YUV444P16
Definition: pixfmt.h:419
AV_CEIL_RSHIFT
#define AV_CEIL_RSHIFT(a, b)
Definition: common.h:50
XMedianContext::depth
int depth
Definition: vf_xmedian.c:48
outputs
static const AVFilterPad outputs[]
Definition: af_acontrast.c:172
AV_PIX_FMT_YUVA444P12
#define AV_PIX_FMT_YUVA444P12
Definition: pixfmt.h:447
AV_PIX_FMT_YUV420P9
#define AV_PIX_FMT_YUV420P9
Definition: pixfmt.h:403
AV_PIX_FMT_YUV420P16
#define AV_PIX_FMT_YUV420P16
Definition: pixfmt.h:417
process_frame
static int process_frame(FFFrameSync *fs)
Definition: vf_xmedian.c:199
ctx
AVFormatContext * ctx
Definition: movenc.c:48
AV_PIX_FMT_GRAY14
#define AV_PIX_FMT_GRAY14
Definition: pixfmt.h:389
av_frame_clone
AVFrame * av_frame_clone(const AVFrame *src)
Create a new frame that references the same data as src.
Definition: frame.c:464
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:142
AV_PIX_FMT_YUV420P
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:66
FILTER_INPUTS
#define FILTER_INPUTS(array)
Definition: internal.h:190
AV_PIX_FMT_YUVJ444P
@ AV_PIX_FMT_YUVJ444P
planar YUV 4:4:4, 24bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV444P and setting col...
Definition: pixfmt.h:80
arg
const char * arg
Definition: jacosubdec.c:67
XMedianContext::data
uint8_t ** data
Definition: vf_xmedian.c:55
AV_PIX_FMT_GRAY10
#define AV_PIX_FMT_GRAY10
Definition: pixfmt.h:387
AV_PIX_FMT_GBRP16
#define AV_PIX_FMT_GBRP16
Definition: pixfmt.h:425
XMedianContext::width
int width[4]
Definition: vf_xmedian.c:52
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:66
NULL
#define NULL
Definition: coverity.c:32
fs
#define fs(width, name, subs,...)
Definition: cbs_vp9.c:258
init
static av_cold int init(AVFilterContext *ctx)
Definition: vf_xmedian.c:94
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
ff_append_inpad_free_name
int ff_append_inpad_free_name(AVFilterContext *f, AVFilterPad *p)
Definition: avfilter.c:123
AV_PIX_FMT_YUVJ420P
@ AV_PIX_FMT_YUVJ420P
planar YUV 4:2:0, 12bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV420P and setting col...
Definition: pixfmt.h:78
AV_PIX_FMT_YUV440P10
#define AV_PIX_FMT_YUV440P10
Definition: pixfmt.h:408
AV_PIX_FMT_YUV422P10
#define AV_PIX_FMT_YUV422P10
Definition: pixfmt.h:407
AV_PIX_FMT_GRAY8
@ AV_PIX_FMT_GRAY8
Y , 8bpp.
Definition: pixfmt.h:74
AV_PIX_FMT_GBRP9
#define AV_PIX_FMT_GBRP9
Definition: pixfmt.h:421
XMedianContext::height
int height[4]
Definition: vf_xmedian.c:53
XMedianContext::nb_threads
int nb_threads
Definition: vf_xmedian.c:41
planes
static const struct @328 planes[]
TFLAGS
#define TFLAGS
Definition: af_afade.c:60
qsort.h
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:117
AV_PIX_FMT_YUV422P12
#define AV_PIX_FMT_YUV422P12
Definition: pixfmt.h:411
AV_PIX_FMT_YUV444P12
#define AV_PIX_FMT_YUV444P12
Definition: pixfmt.h:413
ff_filter_process_command
int ff_filter_process_command(AVFilterContext *ctx, const char *cmd, const char *arg, char *res, int res_len, int flags)
Generic processing of user supplied commands that are set in the same way as the filter options.
Definition: avfilter.c:863
compare8
static int compare8(const void *p1, const void *p2)
Definition: vf_xmedian.c:116
height
#define height
AV_PIX_FMT_YUVA444P
@ AV_PIX_FMT_YUVA444P
planar YUV 4:4:4 32bpp, (1 Cr & Cb sample per 1x1 Y & A samples)
Definition: pixfmt.h:167
AV_PIX_FMT_YUVA444P10
#define AV_PIX_FMT_YUVA444P10
Definition: pixfmt.h:445
ff_vf_xmedian
const AVFilter ff_vf_xmedian
XMedianContext::desc
const AVPixFmtDescriptor * desc
Definition: vf_xmedian.c:38
update_index
static void update_index(XMedianContext *s)
Definition: vf_xmedian.c:191
compare16
static int compare16(const void *p1, const void *p2)
Definition: vf_xmedian.c:123
XMedianContext
Definition: vf_xmedian.c:36
internal.h
AVFILTER_DEFINE_CLASS
#define AVFILTER_DEFINE_CLASS(fname)
Definition: internal.h:325
AV_OPT_TYPE_FLOAT
@ AV_OPT_TYPE_FLOAT
Definition: opt.h:228
XMedianContext::index
int index
Definition: vf_xmedian.c:47
pixel_fmts
static enum AVPixelFormat pixel_fmts[]
Definition: vf_xmedian.c:64
ff_vf_tmedian
const AVFilter ff_vf_tmedian
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:269
AV_PIX_FMT_GBRP12
#define AV_PIX_FMT_GBRP12
Definition: pixfmt.h:423
XMedianContext::linesizes
int linesizes[4]
Definition: vf_xmedian.c:51
ff_filter_get_nb_threads
int ff_filter_get_nb_threads(AVFilterContext *ctx)
Get number of threads for current filter instance.
Definition: avfilter.c:783
XMedianContext::max
int max
Definition: vf_xmedian.c:49
ThreadData
Used for passing data between threads.
Definition: dsddec.c:68
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
AV_PIX_FMT_YUVJ440P
@ AV_PIX_FMT_YUVJ440P
planar YUV 4:4:0 full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV440P and setting color_range
Definition: pixfmt.h:100
AVFilterPad::name
const char * name
Pad name.
Definition: internal.h:55
av_calloc
void * av_calloc(size_t nmemb, size_t size)
Definition: mem.c:272
AV_PIX_FMT_YUV444P9
#define AV_PIX_FMT_YUV444P9
Definition: pixfmt.h:405
AVFilter
Filter definition.
Definition: avfilter.h:171
ret
ret
Definition: filter_design.txt:187
AVFilterPad::type
enum AVMediaType type
AVFilterPad type.
Definition: internal.h:60
XMedianContext::nb_inputs
int nb_inputs
Definition: vf_xmedian.c:39
AV_PIX_FMT_YUVA444P9
#define AV_PIX_FMT_YUVA444P9
Definition: pixfmt.h:442
ff_framesync_init
int ff_framesync_init(FFFrameSync *fs, AVFilterContext *parent, unsigned nb_in)
Initialize a frame sync structure.
Definition: framesync.c:79
AV_PIX_FMT_YUV420P12
#define AV_PIX_FMT_YUV420P12
Definition: pixfmt.h:410
XMedianContext::frames
AVFrame ** frames
Definition: vf_xmedian.c:58
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... 
..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. 
bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector 
Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
AV_PIX_FMT_YUV422P14
#define AV_PIX_FMT_YUV422P14
Definition: pixfmt.h:415
OFFSET
it's the only field you need to keep assuming you have a context There is some magic you don't need to care about around this just let it vf default minimum maximum flags name is the option keep it simple and lowercase description are in without and describe what they for example set the foo of the bar offset is the offset of the field in your see the OFFSET() macro
FFFrameSyncIn::before
enum FFFrameSyncExtMode before
Extrapolation mode for timestamps before the first frame.
Definition: framesync.h:86
XMedianContext::percentile
float percentile
Definition: vf_xmedian.c:43
framesync.h
XMedianContext::radius
int radius
Definition: vf_xmedian.c:46
AV_PIX_FMT_NONE
@ AV_PIX_FMT_NONE
Definition: pixfmt.h:65
AV_PIX_FMT_YUVA422P12
#define AV_PIX_FMT_YUVA422P12
Definition: pixfmt.h:446
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Definition: opt.h:225
avfilter.h
uninit
static av_cold void uninit(AVFilterContext *ctx)
Definition: vf_xmedian.c:313
AV_PIX_FMT_YUV444P
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:71
activate
static int activate(AVFilterContext *ctx)
Definition: vf_xmedian.c:326
AVFilterContext
An instance of a filter.
Definition: avfilter.h:408
XMedianContext::nb_planes
int nb_planes
Definition: vf_xmedian.c:50
AV_PIX_FMT_GBRP
@ AV_PIX_FMT_GBRP
planar GBR 4:4:4 24bpp
Definition: pixfmt.h:158
AVFILTER_FLAG_SLICE_THREADS
#define AVFILTER_FLAG_SLICE_THREADS
The filter supports multithreading by splitting frames into multiple parts and processing them concur...
Definition: avfilter.h:127
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
AV_PIX_FMT_YUV422P
@ AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Definition: pixfmt.h:70
AVPixFmtDescriptor
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
Definition: pixdesc.h:69
FILTER_OUTPUTS
#define FILTER_OUTPUTS(array)
Definition: internal.h:191
av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:34
XMedianContext::xmedian
int xmedian
Definition: vf_xmedian.c:45
AV_PIX_FMT_YUV411P
@ AV_PIX_FMT_YUV411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
Definition: pixfmt.h:73
AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
#define AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
Same as AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC, except that the filter will have its filter_frame() c...
Definition: avfilter.h:160
imgutils.h
AVERROR_BUG
#define AVERROR_BUG
Internal bug, also see AVERROR_BUG2.
Definition: error.h:52
AV_PIX_FMT_YUV410P
@ AV_PIX_FMT_YUV410P
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)
Definition: pixfmt.h:72
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
FFFrameSyncIn::after
enum FFFrameSyncExtMode after
Extrapolation mode for timestamps after the last frame.
Definition: framesync.h:91
AV_PIX_FMT_YUV440P12
#define AV_PIX_FMT_YUV440P12
Definition: pixfmt.h:412
AV_PIX_FMT_YUV444P14
#define AV_PIX_FMT_YUV444P14
Definition: pixfmt.h:416
ff_framesync_activate
int ff_framesync_activate(FFFrameSync *fs)
Examine the frames in the filter's input and try to produce output.
Definition: framesync.c:336
avstring.h
AV_PIX_FMT_GRAY12
#define AV_PIX_FMT_GRAY12
Definition: pixfmt.h:388
ff_filter_execute
static av_always_inline int ff_filter_execute(AVFilterContext *ctx, avfilter_action_func *func, void *arg, int *ret, int nb_jobs)
Definition: internal.h:142
int
int
Definition: ffmpeg_filter.c:153
AV_PIX_FMT_YUVA422P
@ AV_PIX_FMT_YUVA422P
planar YUV 4:2:2 24bpp, (1 Cr & Cb sample per 2x1 Y & A samples)
Definition: pixfmt.h:166
AV_PIX_FMT_YUV420P14
#define AV_PIX_FMT_YUV420P14
Definition: pixfmt.h:414