FFmpeg
vf_xmedian.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2019 Paul B Mahol
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 #include "config_components.h"
22 
23 #include "libavutil/avstring.h"
24 #include "libavutil/imgutils.h"
25 #include "libavutil/opt.h"
26 #include "libavutil/pixdesc.h"
27 #include "libavutil/qsort.h"
28 
29 #include "avfilter.h"
30 #include "internal.h"
31 #include "framesync.h"
32 #include "video.h"
33 
34 typedef struct XMedianContext {
35  const AVClass *class;
37  int nb_inputs;
38  int nb_frames;
40  int planes;
41  float percentile;
42 
43  int xmedian;
44  int radius;
45  int index;
46  int depth;
47  int max;
48  int nb_planes;
49  int linesizes[4];
50  int width[4];
51  int height[4];
52 
53  uint8_t **data;
54  int *linesize;
55 
58 
59  int (*median_frames)(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs);
61 
/*
 * Pixel formats supported by the filters in this file.
 * NOTE(review): this listing jumps from original line 62 straight to line 90,
 * so the initializer entries are not visible here; the list is presumably
 * terminated by AV_PIX_FMT_NONE - confirm against the complete file.
 */
62 static const enum AVPixelFormat pixel_fmts[] = {
90 };
91 
93 {
94  XMedianContext *s = ctx->priv;
95 
96  if (!s->xmedian)
97  s->nb_inputs = s->radius * 2 + 1;
98 
99  if (s->nb_inputs & 1)
100  s->index = s->radius * 2.f * s->percentile;
101  else
102  s->index = av_clip(s->radius * 2.f * s->percentile, 1, s->nb_inputs - 1);
103  s->frames = av_calloc(s->nb_inputs, sizeof(*s->frames));
104  if (!s->frames)
105  return AVERROR(ENOMEM);
106 
107  return 0;
108 }
109 
110 typedef struct ThreadData {
111  AVFrame **in, *out;
112 } ThreadData;
113 
/* Three-way comparison of two 8-bit samples: returns -1, 0 or 1. */
static int compare8(const void *p1, const void *p2)
{
    const int lhs = *(const uint8_t *)p1;
    const int rhs = *(const uint8_t *)p2;

    /* Same result as FFDIFFSIGN(lhs, rhs), written out. */
    return (lhs > rhs) - (lhs < rhs);
}
120 
/* Three-way comparison of two 16-bit samples: returns -1, 0 or 1. */
static int compare16(const void *p1, const void *p2)
{
    const int lhs = *(const uint16_t *)p1;
    const int rhs = *(const uint16_t *)p2;

    /* Same result as FFDIFFSIGN(lhs, rhs), written out. */
    return (lhs > rhs) - (lhs < rhs);
}
127 
128 #define MEDIAN_SLICE(name, type, comparei) \
129 static int median_frames ## name(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs) \
130 { \
131  XMedianContext *s = ctx->priv; \
132  ThreadData *td = arg; \
133  AVFrame **in = td->in; \
134  AVFrame *out = td->out; \
135  const int nb_inputs = s->nb_inputs; \
136  uint8_t **srcf = s->data + jobnr * nb_inputs; \
137  int *linesize = s->linesize + jobnr * nb_inputs; \
138  const int radius = s->radius; \
139  const int index = s->index; \
140  type values[256]; \
141  \
142  for (int p = 0; p < s->nb_planes; p++) { \
143  const int slice_start = (s->height[p] * jobnr) / nb_jobs; \
144  const int slice_end = (s->height[p] * (jobnr+1)) / nb_jobs; \
145  const int width = s->width[p]; \
146  type *dst = (type *)(out->data[p] + slice_start * out->linesize[p]); \
147  ptrdiff_t dst_linesize = out->linesize[p] / sizeof(type); \
148  \
149  if (!((1 << p) & s->planes)) { \
150  av_image_copy_plane((uint8_t *)dst, out->linesize[p], \
151  in[radius]->data[p] + slice_start * in[radius]->linesize[p], \
152  in[radius]->linesize[p], \
153  s->linesizes[p], slice_end - slice_start); \
154  continue; \
155  } \
156  \
157  for (int i = 0; i < nb_inputs; i++) \
158  linesize[i] = in[i]->linesize[p]; \
159  \
160  for (int i = 0; i < nb_inputs; i++) \
161  srcf[i] = in[i]->data[p] + slice_start * linesize[i]; \
162  \
163  for (int y = slice_start; y < slice_end; y++) { \
164  for (int x = 0; x < width; x++) { \
165  for (int i = 0; i < nb_inputs; i++) { \
166  const type *src = (const type *)srcf[i]; \
167  values[i] = src[x]; \
168  } \
169  \
170  AV_QSORT(values, nb_inputs, type, comparei); \
171  if (nb_inputs & 1) \
172  dst[x] = values[index]; \
173  else \
174  dst[x] = (values[index] + values[index - 1]) >> 1; \
175  } \
176  \
177  dst += dst_linesize; \
178  for (int i = 0; i < nb_inputs; i++) \
179  srcf[i] += linesize[i]; \
180  } \
181  } \
182  \
183  return 0; \
184 }
185 
186 MEDIAN_SLICE(8, uint8_t, compare8)
187 MEDIAN_SLICE(16, uint16_t, compare16)
188 
190 {
191  if (s->nb_inputs & 1)
192  s->index = s->radius * 2.f * s->percentile;
193  else
194  s->index = av_clip(s->radius * 2.f * s->percentile, 1, s->nb_inputs - 1);
195 }
196 
198 {
199  AVFilterContext *ctx = fs->parent;
200  AVFilterLink *outlink = ctx->outputs[0];
201  XMedianContext *s = fs->opaque;
202  AVFrame **in = s->frames;
203  AVFrame *out;
204  ThreadData td;
205  int i, ret;
206 
207  update_index(s);
208 
209  for (i = 0; i < s->nb_inputs; i++) {
210  if ((ret = ff_framesync_get_frame(&s->fs, i, &in[i], 0)) < 0)
211  return ret;
212  }
213 
214  if (ctx->is_disabled) {
215  out = av_frame_clone(in[0]);
216  } else {
217  out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
218  }
219  if (!out)
220  return AVERROR(ENOMEM);
221  out->pts = av_rescale_q(s->fs.pts, s->fs.time_base, outlink->time_base);
222 
223  if (!ctx->is_disabled) {
224  td.in = in;
225  td.out = out;
226  ff_filter_execute(ctx, s->median_frames, &td, NULL,
227  FFMIN(s->height[1], s->nb_threads));
228  }
229 
230  return ff_filter_frame(outlink, out);
231 }
232 
233 static int config_output(AVFilterLink *outlink)
234 {
235  AVFilterContext *ctx = outlink->src;
236  XMedianContext *s = ctx->priv;
237  AVRational frame_rate = ctx->inputs[0]->frame_rate;
238  AVRational sar = ctx->inputs[0]->sample_aspect_ratio;
239  AVFilterLink *inlink = ctx->inputs[0];
240  int height = ctx->inputs[0]->h;
241  int width = ctx->inputs[0]->w;
242  FFFrameSyncIn *in;
243  int i, ret;
244 
245  for (int i = 1; i < s->nb_inputs && s->xmedian; i++) {
246  if (ctx->inputs[i]->h != height || ctx->inputs[i]->w != width) {
247  av_log(ctx, AV_LOG_ERROR, "Input %d size (%dx%d) does not match input %d size (%dx%d).\n", i, ctx->inputs[i]->w, ctx->inputs[i]->h, 0, width, height);
248  return AVERROR(EINVAL);
249  }
250  }
251 
252  s->desc = av_pix_fmt_desc_get(outlink->format);
253  if (!s->desc)
254  return AVERROR_BUG;
255  s->nb_planes = av_pix_fmt_count_planes(outlink->format);
256  s->depth = s->desc->comp[0].depth;
257  s->max = (1 << s->depth) - 1;
258  s->nb_threads = ff_filter_get_nb_threads(ctx);
259 
260  if (s->depth <= 8)
261  s->median_frames = median_frames8;
262  else
263  s->median_frames = median_frames16;
264 
265  if ((ret = av_image_fill_linesizes(s->linesizes, inlink->format, inlink->w)) < 0)
266  return ret;
267 
268  s->width[1] = s->width[2] = AV_CEIL_RSHIFT(inlink->w, s->desc->log2_chroma_w);
269  s->width[0] = s->width[3] = inlink->w;
270  s->height[1] = s->height[2] = AV_CEIL_RSHIFT(inlink->h, s->desc->log2_chroma_h);
271  s->height[0] = s->height[3] = inlink->h;
272 
273  s->data = av_calloc(s->nb_threads * s->nb_inputs, sizeof(*s->data));
274  if (!s->data)
275  return AVERROR(ENOMEM);
276 
277  s->linesize = av_calloc(s->nb_threads * s->nb_inputs, sizeof(*s->linesize));
278  if (!s->linesize)
279  return AVERROR(ENOMEM);
280 
281  if (!s->xmedian)
282  return 0;
283 
284  outlink->w = width;
285  outlink->h = height;
286  outlink->frame_rate = frame_rate;
287  outlink->sample_aspect_ratio = sar;
288 
289  if ((ret = ff_framesync_init(&s->fs, ctx, s->nb_inputs)) < 0)
290  return ret;
291 
292  in = s->fs.in;
293  s->fs.opaque = s;
294  s->fs.on_event = process_frame;
295 
296  for (i = 0; i < s->nb_inputs; i++) {
297  AVFilterLink *inlink = ctx->inputs[i];
298 
299  in[i].time_base = inlink->time_base;
300  in[i].sync = 1;
301  in[i].before = EXT_STOP;
302  in[i].after = EXT_INFINITY;
303  }
304 
305  ret = ff_framesync_configure(&s->fs);
306  outlink->time_base = s->fs.time_base;
307 
308  return ret;
309 }
310 
312 {
313  XMedianContext *s = ctx->priv;
314 
315  ff_framesync_uninit(&s->fs);
316 
317  for (int i = 0; i < s->nb_frames && s->frames && !s->xmedian; i++)
318  av_frame_free(&s->frames[i]);
319  av_freep(&s->frames);
320  av_freep(&s->data);
321  av_freep(&s->linesize);
322 }
323 
325 {
326  XMedianContext *s = ctx->priv;
327  return ff_framesync_activate(&s->fs);
328 }
329 
/* Single video output pad; its properties are set up by config_output(). */
330 static const AVFilterPad outputs[] = {
331  {
332  .name = "default",
333  .type = AVMEDIA_TYPE_VIDEO,
334  .config_props = config_output,
335  },
336 };
337 
338 #if CONFIG_XMEDIAN_FILTER
339 static av_cold int xmedian_init(AVFilterContext *ctx)
340 {
341  XMedianContext *s = ctx->priv;
342  int ret;
343 
344  s->xmedian = 1;
345 
346  s->radius = s->nb_inputs / 2;
347 
348  for (int i = 0; i < s->nb_inputs; i++) {
349  AVFilterPad pad = { 0 };
350 
351  pad.type = AVMEDIA_TYPE_VIDEO;
352  pad.name = av_asprintf("input%d", i);
353  if (!pad.name)
354  return AVERROR(ENOMEM);
355 
356  if ((ret = ff_append_inpad_free_name(ctx, &pad)) < 0)
357  return ret;
358  }
359 
360  return init(ctx);
361 }
362 
363 #define OFFSET(x) offsetof(XMedianContext, x)
364 #define FLAGS AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_FILTERING_PARAM
365 #define TFLAGS AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_RUNTIME_PARAM
366 
367 static const AVOption xmedian_options[] = {
368  { "inputs", "set number of inputs", OFFSET(nb_inputs), AV_OPT_TYPE_INT, {.i64=3}, 3, 255, .flags = FLAGS },
369  { "planes", "set planes to filter", OFFSET(planes), AV_OPT_TYPE_INT, {.i64=15}, 0, 15, .flags =TFLAGS },
370  { "percentile", "set percentile", OFFSET(percentile),AV_OPT_TYPE_FLOAT,{.dbl=0.5}, 0, 1, .flags =TFLAGS },
371  { NULL },
372 };
373 
375 
/*
 * Filter definition for "xmedian".
 * NOTE(review): this listing skips original lines 374, 381-382 and 387-388,
 * so the declaration that provides xmedian_class and
 * xmedian_framesync_preinit, and some initializer entries, are not visible
 * here - confirm against the complete file.
 */
376 const AVFilter ff_vf_xmedian = {
377  .name = "xmedian",
378  .description = NULL_IF_CONFIG_SMALL("Pick median pixels from several video inputs."),
379  .priv_size = sizeof(XMedianContext),
380  .priv_class = &xmedian_class,
383  .preinit = xmedian_framesync_preinit,
384  .init = xmedian_init,
385  .uninit = uninit,
386  .activate = activate,
389  .process_command = ff_filter_process_command,
390 };
391 
392 #endif /* CONFIG_XMEDIAN_FILTER */
393 
394 #if CONFIG_TMEDIAN_FILTER
395 static int tmedian_filter_frame(AVFilterLink *inlink, AVFrame *in)
396 {
397  AVFilterContext *ctx = inlink->dst;
398  AVFilterLink *outlink = ctx->outputs[0];
399  XMedianContext *s = ctx->priv;
400  ThreadData td;
401  AVFrame *out;
402 
403  update_index(s);
404 
405  if (s->nb_frames < s->nb_inputs) {
406  s->frames[s->nb_frames] = in;
407  s->nb_frames++;
408  if (s->nb_frames < s->nb_inputs)
409  return 0;
410  } else {
411  av_frame_free(&s->frames[0]);
412  memmove(&s->frames[0], &s->frames[1], sizeof(*s->frames) * (s->nb_inputs - 1));
413  s->frames[s->nb_inputs - 1] = in;
414  }
415 
416  if (ctx->is_disabled) {
417  out = av_frame_clone(s->frames[0]);
418  if (!out)
419  return AVERROR(ENOMEM);
420  return ff_filter_frame(outlink, out);
421  }
422 
423  out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
424  if (!out)
425  return AVERROR(ENOMEM);
426  out->pts = s->frames[0]->pts;
427 
428  td.out = out;
429  td.in = s->frames;
430  ff_filter_execute(ctx, s->median_frames, &td, NULL,
431  FFMIN(s->height[1], s->nb_threads));
432 
433  return ff_filter_frame(outlink, out);
434 }
435 
436 static const AVOption tmedian_options[] = {
437  { "radius", "set median filter radius", OFFSET(radius), AV_OPT_TYPE_INT, {.i64=1}, 1, 127, .flags = FLAGS },
438  { "planes", "set planes to filter", OFFSET(planes), AV_OPT_TYPE_INT, {.i64=15}, 0, 15, .flags =TFLAGS },
439  { "percentile", "set percentile", OFFSET(percentile), AV_OPT_TYPE_FLOAT, {.dbl=0.5}, 0, 1, .flags =TFLAGS },
440  { NULL },
441 };
442 
/* Single video input pad of tmedian; frames are handled by tmedian_filter_frame(). */
443 static const AVFilterPad tmedian_inputs[] = {
444  {
445  .name = "default",
446  .type = AVMEDIA_TYPE_VIDEO,
447  .filter_frame = tmedian_filter_frame,
448  },
449 };
450 
451 AVFILTER_DEFINE_CLASS(tmedian);
452 
/*
 * Filter definition for "tmedian"; it shares init() and uninit() with
 * xmedian.
 * NOTE(review): this listing skips original lines 459-460 and 463, so some
 * initializer entries are not visible here - confirm against the complete
 * file.
 */
453 const AVFilter ff_vf_tmedian = {
454  .name = "tmedian",
455  .description = NULL_IF_CONFIG_SMALL("Pick median pixels from successive frames."),
456  .priv_size = sizeof(XMedianContext),
457  .priv_class = &tmedian_class,
458  FILTER_INPUTS(tmedian_inputs),
461  .init = init,
462  .uninit = uninit,
464  .process_command = ff_filter_process_command,
465 };
466 
467 #endif /* CONFIG_TMEDIAN_FILTER */
ff_get_video_buffer
AVFrame * ff_get_video_buffer(AVFilterLink *link, int w, int h)
Request a picture buffer with a specific set of permissions.
Definition: video.c:112
AV_PIX_FMT_YUVA422P16
#define AV_PIX_FMT_YUVA422P16
Definition: pixfmt.h:522
AV_PIX_FMT_GBRAP16
#define AV_PIX_FMT_GBRAP16
Definition: pixfmt.h:501
FFFrameSyncIn::time_base
AVRational time_base
Time base for the incoming frames.
Definition: framesync.h:117
ff_framesync_configure
int ff_framesync_configure(FFFrameSync *fs)
Configure a frame sync structure.
Definition: framesync.c:134
td
#define td
Definition: regdef.h:70
AVPixelFormat
AVPixelFormat
Pixel format.
Definition: pixfmt.h:71
av_clip
#define av_clip
Definition: common.h:98
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
ff_framesync_uninit
void ff_framesync_uninit(FFFrameSync *fs)
Free all memory currently allocated.
Definition: framesync.c:304
out
FILE * out
Definition: movenc.c:54
ff_filter_frame
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
Definition: avfilter.c:1018
av_pix_fmt_desc_get
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:2962
ff_framesync_get_frame
int ff_framesync_get_frame(FFFrameSync *fs, unsigned in, AVFrame **rframe, unsigned get)
Get the current frame in an input.
Definition: framesync.c:267
FILTER_PIXFMTS_ARRAY
#define FILTER_PIXFMTS_ARRAY(array)
Definition: internal.h:162
MEDIAN_SLICE
#define MEDIAN_SLICE(name, type, comparei)
Definition: vf_xmedian.c:128
inlink
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
Definition: filter_design.txt:212
av_asprintf
char * av_asprintf(const char *fmt,...)
Definition: avstring.c:115
XMedianContext::median_frames
int(* median_frames)(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
Definition: vf_xmedian.c:59
av_frame_free
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
Definition: frame.c:130
AV_PIX_FMT_YUVA422P9
#define AV_PIX_FMT_YUVA422P9
Definition: pixfmt.h:514
XMedianContext::linesize
int * linesize
Definition: vf_xmedian.c:54
AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:344
pixdesc.h
AV_PIX_FMT_YUVA420P16
#define AV_PIX_FMT_YUVA420P16
Definition: pixfmt.h:521
AV_PIX_FMT_YUVA420P10
#define AV_PIX_FMT_YUVA420P10
Definition: pixfmt.h:516
AVOption
AVOption.
Definition: opt.h:346
AV_PIX_FMT_YUV420P10
#define AV_PIX_FMT_YUV420P10
Definition: pixfmt.h:478
FRAMESYNC_DEFINE_CLASS
#define FRAMESYNC_DEFINE_CLASS(name, context, field)
Definition: framesync.h:351
FLAGS
#define FLAGS
Definition: cmdutils.c:584
XMedianContext::nb_frames
int nb_frames
Definition: vf_xmedian.c:38
AV_PIX_FMT_YUV440P
@ AV_PIX_FMT_YUV440P
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
Definition: pixfmt.h:106
AVFilter::name
const char * name
Filter name.
Definition: avfilter.h:170
FFFrameSync
Frame sync structure.
Definition: framesync.h:168
EXT_INFINITY
@ EXT_INFINITY
Extend the frame to infinity.
Definition: framesync.h:75
ThreadData::out
AVFrame * out
Definition: af_adeclick.c:526
video.h
ThreadData::in
AVFrame * in
Definition: af_adecorrelate.c:153
AV_PIX_FMT_YUVA422P10
#define AV_PIX_FMT_YUVA422P10
Definition: pixfmt.h:517
AV_PIX_FMT_GRAY9
#define AV_PIX_FMT_GRAY9
Definition: pixfmt.h:458
av_pix_fmt_count_planes
int av_pix_fmt_count_planes(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:3002
AV_PIX_FMT_YUVA420P9
#define AV_PIX_FMT_YUVA420P9
Definition: pixfmt.h:513
EXT_STOP
@ EXT_STOP
Completely stop all streams with this one.
Definition: framesync.h:65
AV_PIX_FMT_GBRP14
#define AV_PIX_FMT_GBRP14
Definition: pixfmt.h:496
AV_PIX_FMT_GBRAP
@ AV_PIX_FMT_GBRAP
planar GBRA 4:4:4:4 32bpp
Definition: pixfmt.h:212
XMedianContext::planes
int planes
Definition: vf_xmedian.c:40
XMedianContext::fs
FFFrameSync fs
Definition: vf_xmedian.c:57
AV_PIX_FMT_GBRP10
#define AV_PIX_FMT_GBRP10
Definition: pixfmt.h:494
AV_PIX_FMT_YUVA444P16
#define AV_PIX_FMT_YUVA444P16
Definition: pixfmt.h:523
FFFrameSyncIn
Input stream structure.
Definition: framesync.h:102
AV_PIX_FMT_YUV422P9
#define AV_PIX_FMT_YUV422P9
Definition: pixfmt.h:476
AV_PIX_FMT_GRAY16
#define AV_PIX_FMT_GRAY16
Definition: pixfmt.h:462
FFFrameSyncIn::sync
unsigned sync
Synchronization level: frames on input at the highest sync level will generate output frame events.
Definition: framesync.h:160
AVFILTER_FLAG_DYNAMIC_INPUTS
#define AVFILTER_FLAG_DYNAMIC_INPUTS
The number of the filter inputs is not determined just by AVFilter.inputs.
Definition: avfilter.h:106
config_output
static int config_output(AVFilterLink *outlink)
Definition: vf_xmedian.c:233
AVFilterPad
A filter pad used for either input or output.
Definition: internal.h:33
FFDIFFSIGN
#define FFDIFFSIGN(x, y)
Comparator.
Definition: macros.h:45
AV_PIX_FMT_YUV444P10
#define AV_PIX_FMT_YUV444P10
Definition: pixfmt.h:481
AV_PIX_FMT_YUVJ411P
@ AV_PIX_FMT_YUVJ411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples) full scale (JPEG), deprecated in favor ...
Definition: pixfmt.h:283
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
av_cold
#define av_cold
Definition: attributes.h:90
AV_PIX_FMT_YUV422P16
#define AV_PIX_FMT_YUV422P16
Definition: pixfmt.h:490
AV_PIX_FMT_YUVJ422P
@ AV_PIX_FMT_YUVJ422P
planar YUV 4:2:2, 16bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV422P and setting col...
Definition: pixfmt.h:86
AV_PIX_FMT_GBRAP10
#define AV_PIX_FMT_GBRAP10
Definition: pixfmt.h:498
width
#define width
av_image_fill_linesizes
int av_image_fill_linesizes(int linesizes[4], enum AVPixelFormat pix_fmt, int width)
Fill plane linesizes for an image with pixel format pix_fmt and width width.
Definition: imgutils.c:89
s
#define s(width, name)
Definition: cbs_vp9.c:198
AV_PIX_FMT_GBRAP12
#define AV_PIX_FMT_GBRAP12
Definition: pixfmt.h:499
AV_PIX_FMT_YUVA420P
@ AV_PIX_FMT_YUVA420P
planar YUV 4:2:0, 20bpp, (1 Cr & Cb sample per 2x2 Y & A samples)
Definition: pixfmt.h:108
AV_PIX_FMT_YUV444P16
#define AV_PIX_FMT_YUV444P16
Definition: pixfmt.h:491
AV_CEIL_RSHIFT
#define AV_CEIL_RSHIFT(a, b)
Definition: common.h:58
XMedianContext::depth
int depth
Definition: vf_xmedian.c:46
AV_PIX_FMT_YUVA444P12
#define AV_PIX_FMT_YUVA444P12
Definition: pixfmt.h:520
AV_PIX_FMT_YUV420P9
#define AV_PIX_FMT_YUV420P9
Definition: pixfmt.h:475
AV_PIX_FMT_YUV420P16
#define AV_PIX_FMT_YUV420P16
Definition: pixfmt.h:489
process_frame
static int process_frame(FFFrameSync *fs)
Definition: vf_xmedian.c:197
ctx
AVFormatContext * ctx
Definition: movenc.c:48
AV_PIX_FMT_GRAY14
#define AV_PIX_FMT_GRAY14
Definition: pixfmt.h:461
av_frame_clone
AVFrame * av_frame_clone(const AVFrame *src)
Create a new frame that references the same data as src.
Definition: frame.c:563
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:142
AV_PIX_FMT_YUV420P
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:73
FILTER_INPUTS
#define FILTER_INPUTS(array)
Definition: internal.h:182
AV_PIX_FMT_YUVJ444P
@ AV_PIX_FMT_YUVJ444P
planar YUV 4:4:4, 24bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV444P and setting col...
Definition: pixfmt.h:87
arg
const char * arg
Definition: jacosubdec.c:67
XMedianContext::data
uint8_t ** data
Definition: vf_xmedian.c:53
AV_PIX_FMT_GRAY10
#define AV_PIX_FMT_GRAY10
Definition: pixfmt.h:459
AV_PIX_FMT_GBRP16
#define AV_PIX_FMT_GBRP16
Definition: pixfmt.h:497
XMedianContext::width
int width[4]
Definition: vf_xmedian.c:50
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:66
NULL
#define NULL
Definition: coverity.c:32
fs
#define fs(width, name, subs,...)
Definition: cbs_vp9.c:200
init
static av_cold int init(AVFilterContext *ctx)
Definition: vf_xmedian.c:92
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
ff_append_inpad_free_name
int ff_append_inpad_free_name(AVFilterContext *f, AVFilterPad *p)
Definition: avfilter.c:131
AV_PIX_FMT_YUVJ420P
@ AV_PIX_FMT_YUVJ420P
planar YUV 4:2:0, 12bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV420P and setting col...
Definition: pixfmt.h:85
AV_PIX_FMT_YUV440P10
#define AV_PIX_FMT_YUV440P10
Definition: pixfmt.h:480
AV_PIX_FMT_YUV422P10
#define AV_PIX_FMT_YUV422P10
Definition: pixfmt.h:479
AV_PIX_FMT_GRAY8
@ AV_PIX_FMT_GRAY8
Y , 8bpp.
Definition: pixfmt.h:81
AV_PIX_FMT_GBRP9
#define AV_PIX_FMT_GBRP9
Definition: pixfmt.h:493
XMedianContext::height
int height[4]
Definition: vf_xmedian.c:51
XMedianContext::nb_threads
int nb_threads
Definition: vf_xmedian.c:39
TFLAGS
#define TFLAGS
Definition: af_afade.c:65
qsort.h
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:106
AV_PIX_FMT_YUV422P12
#define AV_PIX_FMT_YUV422P12
Definition: pixfmt.h:483
AV_PIX_FMT_YUV444P12
#define AV_PIX_FMT_YUV444P12
Definition: pixfmt.h:485
ff_filter_process_command
int ff_filter_process_command(AVFilterContext *ctx, const char *cmd, const char *arg, char *res, int res_len, int flags)
Generic processing of user supplied commands that are set in the same way as the filter options.
Definition: avfilter.c:890
compare8
static int compare8(const void *p1, const void *p2)
Definition: vf_xmedian.c:114
height
#define height
AV_PIX_FMT_YUVA444P
@ AV_PIX_FMT_YUVA444P
planar YUV 4:4:4 32bpp, (1 Cr & Cb sample per 1x1 Y & A samples)
Definition: pixfmt.h:174
AV_PIX_FMT_YUVA444P10
#define AV_PIX_FMT_YUVA444P10
Definition: pixfmt.h:518
ff_vf_xmedian
const AVFilter ff_vf_xmedian
XMedianContext::desc
const AVPixFmtDescriptor * desc
Definition: vf_xmedian.c:36
update_index
static void update_index(XMedianContext *s)
Definition: vf_xmedian.c:189
compare16
static int compare16(const void *p1, const void *p2)
Definition: vf_xmedian.c:121
XMedianContext
Definition: vf_xmedian.c:34
internal.h
AVFILTER_DEFINE_CLASS
#define AVFILTER_DEFINE_CLASS(fname)
Definition: internal.h:323
AV_OPT_TYPE_FLOAT
@ AV_OPT_TYPE_FLOAT
Definition: opt.h:238
XMedianContext::index
int index
Definition: vf_xmedian.c:45
pixel_fmts
static enum AVPixelFormat pixel_fmts[]
Definition: vf_xmedian.c:62
ff_vf_tmedian
const AVFilter ff_vf_tmedian
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:255
AV_PIX_FMT_GBRP12
#define AV_PIX_FMT_GBRP12
Definition: pixfmt.h:495
XMedianContext::linesizes
int linesizes[4]
Definition: vf_xmedian.c:49
ff_filter_get_nb_threads
int ff_filter_get_nb_threads(AVFilterContext *ctx)
Get number of threads for current filter instance.
Definition: avfilter.c:825
XMedianContext::max
int max
Definition: vf_xmedian.c:47
ThreadData
Used for passing data between threads.
Definition: dsddec.c:69
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
AV_PIX_FMT_YUVJ440P
@ AV_PIX_FMT_YUVJ440P
planar YUV 4:4:0 full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV440P and setting color_range
Definition: pixfmt.h:107
AVFilterPad::name
const char * name
Pad name.
Definition: internal.h:39
av_calloc
void * av_calloc(size_t nmemb, size_t size)
Definition: mem.c:262
AV_PIX_FMT_YUV444P9
#define AV_PIX_FMT_YUV444P9
Definition: pixfmt.h:477
AVFilter
Filter definition.
Definition: avfilter.h:166
ret
ret
Definition: filter_design.txt:187
AVFilterPad::type
enum AVMediaType type
AVFilterPad type.
Definition: internal.h:44
XMedianContext::nb_inputs
int nb_inputs
Definition: vf_xmedian.c:37
AV_PIX_FMT_YUVA444P9
#define AV_PIX_FMT_YUVA444P9
Definition: pixfmt.h:515
ff_framesync_init
int ff_framesync_init(FFFrameSync *fs, AVFilterContext *parent, unsigned nb_in)
Initialize a frame sync structure.
Definition: framesync.c:86
AV_PIX_FMT_YUV420P12
#define AV_PIX_FMT_YUV420P12
Definition: pixfmt.h:482
XMedianContext::frames
AVFrame ** frames
Definition: vf_xmedian.c:56
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... 
..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. 
bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector 
Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
AV_PIX_FMT_YUV422P14
#define AV_PIX_FMT_YUV422P14
Definition: pixfmt.h:487
OFFSET
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf default minimum maximum flags name is the option keep it simple and lowercase description are in without and describe what they for example set the foo of the bar offset is the offset of the field in your see the OFFSET() macro
FFFrameSyncIn::before
enum FFFrameSyncExtMode before
Extrapolation mode for timestamps before the first frame.
Definition: framesync.h:107
XMedianContext::percentile
float percentile
Definition: vf_xmedian.c:41
framesync.h
XMedianContext::radius
int radius
Definition: vf_xmedian.c:44
AV_PIX_FMT_NONE
@ AV_PIX_FMT_NONE
Definition: pixfmt.h:72
AV_PIX_FMT_YUVA422P12
#define AV_PIX_FMT_YUVA422P12
Definition: pixfmt.h:519
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Definition: opt.h:235
avfilter.h
uninit
static av_cold void uninit(AVFilterContext *ctx)
Definition: vf_xmedian.c:311
AV_PIX_FMT_YUV444P
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:78
activate
static int activate(AVFilterContext *ctx)
Definition: vf_xmedian.c:324
AVFilterContext
An instance of a filter.
Definition: avfilter.h:407
XMedianContext::nb_planes
int nb_planes
Definition: vf_xmedian.c:48
AV_PIX_FMT_GBRP
@ AV_PIX_FMT_GBRP
planar GBR 4:4:4 24bpp
Definition: pixfmt.h:165
AVFILTER_FLAG_SLICE_THREADS
#define AVFILTER_FLAG_SLICE_THREADS
The filter supports multithreading by splitting frames into multiple parts and processing them concur...
Definition: avfilter.h:117
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
AV_PIX_FMT_YUV422P
@ AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Definition: pixfmt.h:77
AVPixFmtDescriptor
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
Definition: pixdesc.h:69
planes
static const struct @386 planes[]
FILTER_OUTPUTS
#define FILTER_OUTPUTS(array)
Definition: internal.h:183
outputs
static const AVFilterPad outputs[]
Definition: vf_xmedian.c:330
av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:34
XMedianContext::xmedian
int xmedian
Definition: vf_xmedian.c:43
AV_PIX_FMT_YUV411P
@ AV_PIX_FMT_YUV411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
Definition: pixfmt.h:80
AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
#define AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
Same as AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC, except that the filter will have its filter_frame() c...
Definition: avfilter.h:155
imgutils.h
AVERROR_BUG
#define AVERROR_BUG
Internal bug, also see AVERROR_BUG2.
Definition: error.h:52
AV_PIX_FMT_YUV410P
@ AV_PIX_FMT_YUV410P
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)
Definition: pixfmt.h:79
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
FFFrameSyncIn::after
enum FFFrameSyncExtMode after
Extrapolation mode for timestamps after the last frame.
Definition: framesync.h:112
AV_PIX_FMT_YUV440P12
#define AV_PIX_FMT_YUV440P12
Definition: pixfmt.h:484
AV_PIX_FMT_YUV444P14
#define AV_PIX_FMT_YUV444P14
Definition: pixfmt.h:488
ff_framesync_activate
int ff_framesync_activate(FFFrameSync *fs)
Examine the frames in the filter's input and try to produce output.
Definition: framesync.c:355
avstring.h
AV_PIX_FMT_GRAY12
#define AV_PIX_FMT_GRAY12
Definition: pixfmt.h:460
ff_filter_execute
static av_always_inline int ff_filter_execute(AVFilterContext *ctx, avfilter_action_func *func, void *arg, int *ret, int nb_jobs)
Definition: internal.h:134
int
int
Definition: ffmpeg_filter.c:409
AV_PIX_FMT_YUVA422P
@ AV_PIX_FMT_YUVA422P
planar YUV 4:2:2 24bpp, (1 Cr & Cb sample per 2x1 Y & A samples)
Definition: pixfmt.h:173
AV_PIX_FMT_YUV420P14
#define AV_PIX_FMT_YUV420P14
Definition: pixfmt.h:486