FFmpeg
vf_xmedian.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2019 Paul B Mahol
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 #include "config_components.h"
22 
23 #include "libavutil/avstring.h"
24 #include "libavutil/imgutils.h"
25 #include "libavutil/mem.h"
26 #include "libavutil/opt.h"
27 #include "libavutil/pixdesc.h"
28 #include "libavutil/qsort.h"
29 
30 #include "avfilter.h"
31 #include "internal.h"
32 #include "framesync.h"
33 #include "video.h"
34 
/*
 * Private context shared by the xmedian and tmedian filters.
 * NOTE(review): this listing skips some member lines (the embedded numbering
 * jumps over 37, 40, 57-58 and 61); members such as desc, nb_threads, frames
 * and fs are used elsewhere in the file but are not visible here.
 */
35 typedef struct XMedianContext {
36  const AVClass *class;
/* number of frames combined per output pixel; "inputs" option for xmedian,
 * derived as radius * 2 + 1 in init() otherwise */
38  int nb_inputs;
/* how many entries of frames[] are currently filled (tmedian window) */
39  int nb_frames;
/* bitmask: bit p set means plane p is filtered, otherwise it is copied */
41  int planes;
/* "percentile" option, 0..1; scales the picked position in the sorted samples */
42  float percentile;
43 
/* set to 1 by xmedian_init(); left at 0 for tmedian */
44  int xmedian;
/* "radius" option for tmedian; nb_inputs / 2 for xmedian */
45  int radius;
/* position inside the sorted sample array that is written to the output */
46  int index;
/* bit depth of component 0 of the output pixel format */
47  int depth;
/* (1 << depth) - 1 */
48  int max;
49  int nb_planes;
/* per-plane values filled by av_image_fill_linesizes(); used as the copy
 * width for planes that are not filtered */
50  int linesizes[4];
/* per-plane dimensions; planes 1 and 2 use the chroma-shifted size */
51  int width[4];
52  int height[4];
53 
/* scratch arrays of nb_threads * nb_inputs entries; every slice job uses the
 * nb_inputs entries starting at jobnr * nb_inputs */
54  uint8_t **data;
55  int *linesize;
56 
59 
/* slice worker selected in config_output(): 8-bit or 16-bit variant */
60  int (*median_frames)(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs);
62 
/*
 * Pixel format list of this file.
 * NOTE(review): the initializer entries (embedded lines 64-90) are not part of
 * this listing; presumably this is the set of planar formats both filters
 * accept - confirm against the complete source.
 */
63 static const enum AVPixelFormat pixel_fmts[] = {
91 };
92 
/*
 * Body of init() (the signature line is not part of this listing).
 * Derives nb_inputs for tmedian, computes the initial sample index and
 * allocates the frame pointer array.
 * Returns 0 on success or AVERROR(ENOMEM) if the array cannot be allocated.
 */
94 {
95  XMedianContext *s = ctx->priv;
96 
/* tmedian: the window spans radius frames on each side of the centre one */
97  if (!s->xmedian)
98  s->nb_inputs = s->radius * 2 + 1;
99 
/* same computation as update_index(): with an even input count the index is
 * kept >= 1 because the slice worker also reads values[index - 1] */
100  if (s->nb_inputs & 1)
101  s->index = s->radius * 2.f * s->percentile;
102  else
103  s->index = av_clip(s->radius * 2.f * s->percentile, 1, s->nb_inputs - 1);
104  s->frames = av_calloc(s->nb_inputs, sizeof(*s->frames));
105  if (!s->frames)
106  return AVERROR(ENOMEM);
107 
108  return 0;
109 }
110 
111 typedef struct ThreadData {
112  AVFrame **in, *out;
113 } ThreadData;
114 
/*
 * Three-way comparison of two 8-bit samples for AV_QSORT.
 * Returns -1, 0 or 1 when *p1 is smaller than, equal to or larger than *p2.
 */
static int compare8(const void *p1, const void *p2)
{
    const uint8_t a = *(const uint8_t *)p1;
    const uint8_t b = *(const uint8_t *)p2;

    if (a < b)
        return -1;
    return a > b;
}
121 
/*
 * Three-way comparison of two 16-bit samples for AV_QSORT.
 * Returns -1, 0 or 1 when *p1 is smaller than, equal to or larger than *p2.
 */
static int compare16(const void *p1, const void *p2)
{
    const uint16_t a = *(const uint16_t *)p1;
    const uint16_t b = *(const uint16_t *)p2;

    if (a < b)
        return -1;
    return a > b;
}
128 
/*
 * MEDIAN_SLICE(name, type, comparei) expands to median_frames<name>(), a slice
 * job with the signature stored in XMedianContext::median_frames.
 *
 * For every plane, job jobnr of nb_jobs handles the rows
 * [height * jobnr / nb_jobs, height * (jobnr + 1) / nb_jobs).
 *  - A plane whose bit is clear in s->planes is copied unchanged from
 *    in[radius].
 *  - Otherwise one sample per input frame is gathered into values[] for each
 *    pixel, the array is sorted with AV_QSORT using comparei, and the output
 *    is values[index] when nb_inputs is odd, or the floor of the mean of
 *    values[index] and values[index - 1] when it is even.
 *
 * srcf and linesize are the job's private nb_inputs-entry windows into
 * s->data and s->linesize, so jobs do not share row pointers.
 * values[] holds 256 entries; the option tables in this file limit the number
 * of combined frames to 255.
 * The generated function always returns 0.
 */
129 #define MEDIAN_SLICE(name, type, comparei) \
130 static int median_frames ## name(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs) \
131 { \
132  XMedianContext *s = ctx->priv; \
133  ThreadData *td = arg; \
134  AVFrame **in = td->in; \
135  AVFrame *out = td->out; \
136  const int nb_inputs = s->nb_inputs; \
137  uint8_t **srcf = s->data + jobnr * nb_inputs; \
138  int *linesize = s->linesize + jobnr * nb_inputs; \
139  const int radius = s->radius; \
140  const int index = s->index; \
141  type values[256]; \
142  \
143  for (int p = 0; p < s->nb_planes; p++) { \
144  const int slice_start = (s->height[p] * jobnr) / nb_jobs; \
145  const int slice_end = (s->height[p] * (jobnr+1)) / nb_jobs; \
146  const int width = s->width[p]; \
147  type *dst = (type *)(out->data[p] + slice_start * out->linesize[p]); \
148  ptrdiff_t dst_linesize = out->linesize[p] / sizeof(type); \
149  \
150  if (!((1 << p) & s->planes)) { \
151  av_image_copy_plane((uint8_t *)dst, out->linesize[p], \
152  in[radius]->data[p] + slice_start * in[radius]->linesize[p], \
153  in[radius]->linesize[p], \
154  s->linesizes[p], slice_end - slice_start); \
155  continue; \
156  } \
157  \
158  for (int i = 0; i < nb_inputs; i++) \
159  linesize[i] = in[i]->linesize[p]; \
160  \
161  for (int i = 0; i < nb_inputs; i++) \
162  srcf[i] = in[i]->data[p] + slice_start * linesize[i]; \
163  \
164  for (int y = slice_start; y < slice_end; y++) { \
165  for (int x = 0; x < width; x++) { \
166  for (int i = 0; i < nb_inputs; i++) { \
167  const type *src = (const type *)srcf[i]; \
168  values[i] = src[x]; \
169  } \
170  \
171  AV_QSORT(values, nb_inputs, type, comparei); \
172  if (nb_inputs & 1) \
173  dst[x] = values[index]; \
174  else \
175  dst[x] = (values[index] + values[index - 1]) >> 1; \
176  } \
177  \
178  dst += dst_linesize; \
179  for (int i = 0; i < nb_inputs; i++) \
180  srcf[i] += linesize[i]; \
181  } \
182  } \
183  \
184  return 0; \
185 }
186 
/* Instantiate the worker for 8-bit samples (median_frames8) and for samples
 * stored in 16-bit words (median_frames16). */
187 MEDIAN_SLICE(8, uint8_t, compare8)
188 MEDIAN_SLICE(16, uint16_t, compare16)
189 
/*
 * Body of update_index() (the signature line is not part of this listing).
 * Recomputes s->index from the current radius and percentile; the per-frame
 * entry points call it before filtering.
 */
191 {
/* odd count: radius * 2 * percentile, truncated on assignment to int */
192  if (s->nb_inputs & 1)
193  s->index = s->radius * 2.f * s->percentile;
/* even count: clipped to [1, nb_inputs - 1] so values[index - 1] stays valid */
194  else
195  s->index = av_clip(s->radius * 2.f * s->percentile, 1, s->nb_inputs - 1);
196 }
197 
/*
 * Body of process_frame() (the signature line is not part of this listing).
 * Installed as the framesync on_event callback in config_output(): gathers the
 * current frame of every input, produces one output frame and sends it
 * downstream.
 * Returns the error from ff_framesync_get_frame(), AVERROR(ENOMEM) if no
 * output frame can be obtained, or the result of ff_filter_frame().
 */
199 {
200  AVFilterContext *ctx = fs->parent;
201  AVFilterLink *outlink = ctx->outputs[0];
202  XMedianContext *s = fs->opaque;
203  AVFrame **in = s->frames;
204  AVFrame *out;
205  ThreadData td;
206  int i, ret;
207 
/* refresh the sample index from the current percentile value */
208  update_index(s);
209 
/* fill s->frames[] with the frame framesync currently holds for each input */
210  for (i = 0; i < s->nb_inputs; i++) {
211  if ((ret = ff_framesync_get_frame(&s->fs, i, &in[i], 0)) < 0)
212  return ret;
213  }
214 
/* when the filter is disabled the first input is passed through as a clone */
215  if (ctx->is_disabled) {
216  out = av_frame_clone(in[0]);
217  } else {
218  out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
219  }
220  if (!out)
221  return AVERROR(ENOMEM);
/* convert the framesync timestamp into the output link's time base */
222  out->pts = av_rescale_q(s->fs.pts, s->fs.time_base, outlink->time_base);
223 
224  if (!ctx->is_disabled) {
225  td.in = in;
226  td.out = out;
/* job count is limited by the height of plane 1 and by nb_threads;
 * NOTE(review): the return value of ff_filter_execute() is not checked */
227  ff_filter_execute(ctx, s->median_frames, &td, NULL,
228  FFMIN(s->height[1], s->nb_threads));
229  }
230 
231  return ff_filter_frame(outlink, out);
232 }
233 
234 static int config_output(AVFilterLink *outlink)
235 {
236  AVFilterContext *ctx = outlink->src;
237  XMedianContext *s = ctx->priv;
238  AVRational frame_rate = ctx->inputs[0]->frame_rate;
239  AVRational sar = ctx->inputs[0]->sample_aspect_ratio;
240  AVFilterLink *inlink = ctx->inputs[0];
241  int height = ctx->inputs[0]->h;
242  int width = ctx->inputs[0]->w;
243  FFFrameSyncIn *in;
244  int i, ret;
245 
246  for (int i = 1; i < s->nb_inputs && s->xmedian; i++) {
247  if (ctx->inputs[i]->h != height || ctx->inputs[i]->w != width) {
248  av_log(ctx, AV_LOG_ERROR, "Input %d size (%dx%d) does not match input %d size (%dx%d).\n", i, ctx->inputs[i]->w, ctx->inputs[i]->h, 0, width, height);
249  return AVERROR(EINVAL);
250  }
251  }
252 
253  s->desc = av_pix_fmt_desc_get(outlink->format);
254  if (!s->desc)
255  return AVERROR_BUG;
256  s->nb_planes = av_pix_fmt_count_planes(outlink->format);
257  s->depth = s->desc->comp[0].depth;
258  s->max = (1 << s->depth) - 1;
259  s->nb_threads = ff_filter_get_nb_threads(ctx);
260 
261  if (s->depth <= 8)
262  s->median_frames = median_frames8;
263  else
264  s->median_frames = median_frames16;
265 
266  if ((ret = av_image_fill_linesizes(s->linesizes, inlink->format, inlink->w)) < 0)
267  return ret;
268 
269  s->width[1] = s->width[2] = AV_CEIL_RSHIFT(inlink->w, s->desc->log2_chroma_w);
270  s->width[0] = s->width[3] = inlink->w;
271  s->height[1] = s->height[2] = AV_CEIL_RSHIFT(inlink->h, s->desc->log2_chroma_h);
272  s->height[0] = s->height[3] = inlink->h;
273 
274  s->data = av_calloc(s->nb_threads * s->nb_inputs, sizeof(*s->data));
275  if (!s->data)
276  return AVERROR(ENOMEM);
277 
278  s->linesize = av_calloc(s->nb_threads * s->nb_inputs, sizeof(*s->linesize));
279  if (!s->linesize)
280  return AVERROR(ENOMEM);
281 
282  if (!s->xmedian)
283  return 0;
284 
285  outlink->w = width;
286  outlink->h = height;
287  outlink->frame_rate = frame_rate;
288  outlink->sample_aspect_ratio = sar;
289 
290  if ((ret = ff_framesync_init(&s->fs, ctx, s->nb_inputs)) < 0)
291  return ret;
292 
293  in = s->fs.in;
294  s->fs.opaque = s;
295  s->fs.on_event = process_frame;
296 
297  for (i = 0; i < s->nb_inputs; i++) {
298  AVFilterLink *inlink = ctx->inputs[i];
299 
300  in[i].time_base = inlink->time_base;
301  in[i].sync = 1;
302  in[i].before = EXT_STOP;
303  in[i].after = EXT_INFINITY;
304  }
305 
306  ret = ff_framesync_configure(&s->fs);
307  outlink->time_base = s->fs.time_base;
308 
309  return ret;
310 }
311 
/*
 * Body of uninit() (the signature line is not part of this listing).
 * Tears down frame synchronisation and releases everything the context
 * allocated.
 */
313 {
314  XMedianContext *s = ctx->priv;
315 
316  ff_framesync_uninit(&s->fs);
317 
/* buffered frames are freed here only in tmedian mode (!s->xmedian);
 * presumably the xmedian entries belong to framesync - confirm */
318  for (int i = 0; i < s->nb_frames && s->frames && !s->xmedian; i++)
319  av_frame_free(&s->frames[i]);
320  av_freep(&s->frames);
321  av_freep(&s->data);
322  av_freep(&s->linesize);
323 }
324 
/*
 * Body of activate() (the signature line is not part of this listing).
 * Forwards scheduling to the framesync helper and returns its result.
 */
326 {
327  XMedianContext *s = ctx->priv;
328  return ff_framesync_activate(&s->fs);
329 }
330 
331 static const AVFilterPad outputs[] = {
332  {
333  .name = "default",
334  .type = AVMEDIA_TYPE_VIDEO,
335  .config_props = config_output,
336  },
337 };
338 
339 #if CONFIG_XMEDIAN_FILTER
340 static av_cold int xmedian_init(AVFilterContext *ctx)
341 {
342  XMedianContext *s = ctx->priv;
343  int ret;
344 
345  s->xmedian = 1;
346 
347  s->radius = s->nb_inputs / 2;
348 
349  for (int i = 0; i < s->nb_inputs; i++) {
350  AVFilterPad pad = { 0 };
351 
352  pad.type = AVMEDIA_TYPE_VIDEO;
353  pad.name = av_asprintf("input%d", i);
354  if (!pad.name)
355  return AVERROR(ENOMEM);
356 
357  if ((ret = ff_append_inpad_free_name(ctx, &pad)) < 0)
358  return ret;
359  }
360 
361  return init(ctx);
362 }
363 
364 #define OFFSET(x) offsetof(XMedianContext, x)
365 #define FLAGS AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_FILTERING_PARAM
366 #define TFLAGS AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_RUNTIME_PARAM
367 
368 static const AVOption xmedian_options[] = {
369  { "inputs", "set number of inputs", OFFSET(nb_inputs), AV_OPT_TYPE_INT, {.i64=3}, 3, 255, .flags = FLAGS },
370  { "planes", "set planes to filter", OFFSET(planes), AV_OPT_TYPE_INT, {.i64=15}, 0, 15, .flags =TFLAGS },
371  { "percentile", "set percentile", OFFSET(percentile),AV_OPT_TYPE_FLOAT,{.dbl=0.5}, 0, 1, .flags =TFLAGS },
372  { NULL },
373 };
374 
376 
/*
 * Filter definition of "xmedian".
 * NOTE(review): the embedded numbering jumps from 381 to 384 and from 387 to
 * 390, so some initializers of this definition are not visible in this
 * listing.
 */
377 const AVFilter ff_vf_xmedian = {
378  .name = "xmedian",
379  .description = NULL_IF_CONFIG_SMALL("Pick median pixels from several video inputs."),
380  .priv_size = sizeof(XMedianContext),
381  .priv_class = &xmedian_class,
384  .preinit = xmedian_framesync_preinit,
/* xmedian_init() creates the input pads before running the shared init() */
385  .init = xmedian_init,
386  .uninit = uninit,
387  .activate = activate,
390  .process_command = ff_filter_process_command,
391 };
392 
393 #endif /* CONFIG_XMEDIAN_FILTER */
394 
395 #if CONFIG_TMEDIAN_FILTER
396 static int tmedian_filter_frame(AVFilterLink *inlink, AVFrame *in)
397 {
398  AVFilterContext *ctx = inlink->dst;
399  AVFilterLink *outlink = ctx->outputs[0];
400  XMedianContext *s = ctx->priv;
401  ThreadData td;
402  AVFrame *out;
403 
404  update_index(s);
405 
406  if (s->nb_frames < s->nb_inputs) {
407  s->frames[s->nb_frames] = in;
408  s->nb_frames++;
409  if (s->nb_frames < s->nb_inputs)
410  return 0;
411  } else {
412  av_frame_free(&s->frames[0]);
413  memmove(&s->frames[0], &s->frames[1], sizeof(*s->frames) * (s->nb_inputs - 1));
414  s->frames[s->nb_inputs - 1] = in;
415  }
416 
417  if (ctx->is_disabled) {
418  out = av_frame_clone(s->frames[0]);
419  if (!out)
420  return AVERROR(ENOMEM);
421  return ff_filter_frame(outlink, out);
422  }
423 
424  out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
425  if (!out)
426  return AVERROR(ENOMEM);
427  out->pts = s->frames[0]->pts;
428 
429  td.out = out;
430  td.in = s->frames;
431  ff_filter_execute(ctx, s->median_frames, &td, NULL,
432  FFMIN(s->height[1], s->nb_threads));
433 
434  return ff_filter_frame(outlink, out);
435 }
436 
437 static const AVOption tmedian_options[] = {
438  { "radius", "set median filter radius", OFFSET(radius), AV_OPT_TYPE_INT, {.i64=1}, 1, 127, .flags = FLAGS },
439  { "planes", "set planes to filter", OFFSET(planes), AV_OPT_TYPE_INT, {.i64=15}, 0, 15, .flags =TFLAGS },
440  { "percentile", "set percentile", OFFSET(percentile), AV_OPT_TYPE_FLOAT, {.dbl=0.5}, 0, 1, .flags =TFLAGS },
441  { NULL },
442 };
443 
444 static const AVFilterPad tmedian_inputs[] = {
445  {
446  .name = "default",
447  .type = AVMEDIA_TYPE_VIDEO,
448  .filter_frame = tmedian_filter_frame,
449  },
450 };
451 
/* presumably defines tmedian_class from tmedian_options - confirm against the
 * AVFILTER_DEFINE_CLASS macro */
452 AVFILTER_DEFINE_CLASS(tmedian);
453 
/*
 * Filter definition of "tmedian".
 * NOTE(review): the embedded numbering jumps from 459 to 462 and from 463 to
 * 465, so some initializers of this definition are not visible in this
 * listing.
 */
454 const AVFilter ff_vf_tmedian = {
455  .name = "tmedian",
456  .description = NULL_IF_CONFIG_SMALL("Pick median pixels from successive frames."),
457  .priv_size = sizeof(XMedianContext),
458  .priv_class = &tmedian_class,
459  FILTER_INPUTS(tmedian_inputs),
/* tmedian uses the shared init() directly; nb_inputs is derived from radius there */
462  .init = init,
463  .uninit = uninit,
465  .process_command = ff_filter_process_command,
466 };
467 
468 #endif /* CONFIG_TMEDIAN_FILTER */
ff_get_video_buffer
AVFrame * ff_get_video_buffer(AVFilterLink *link, int w, int h)
Request a picture buffer with a specific set of permissions.
Definition: video.c:112
AV_PIX_FMT_YUVA422P16
#define AV_PIX_FMT_YUVA422P16
Definition: pixfmt.h:522
AV_PIX_FMT_GBRAP16
#define AV_PIX_FMT_GBRAP16
Definition: pixfmt.h:501
FFFrameSyncIn::time_base
AVRational time_base
Time base for the incoming frames.
Definition: framesync.h:117
ff_framesync_configure
int ff_framesync_configure(FFFrameSync *fs)
Configure a frame sync structure.
Definition: framesync.c:134
td
#define td
Definition: regdef.h:70
AVPixelFormat
AVPixelFormat
Pixel format.
Definition: pixfmt.h:71
av_clip
#define av_clip
Definition: common.h:99
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
ff_framesync_uninit
void ff_framesync_uninit(FFFrameSync *fs)
Free all memory currently allocated.
Definition: framesync.c:304
out
FILE * out
Definition: movenc.c:55
ff_filter_frame
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
Definition: avfilter.c:1015
av_pix_fmt_desc_get
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:2965
ff_framesync_get_frame
int ff_framesync_get_frame(FFFrameSync *fs, unsigned in, AVFrame **rframe, unsigned get)
Get the current frame in an input.
Definition: framesync.c:267
FILTER_PIXFMTS_ARRAY
#define FILTER_PIXFMTS_ARRAY(array)
Definition: internal.h:162
MEDIAN_SLICE
#define MEDIAN_SLICE(name, type, comparei)
Definition: vf_xmedian.c:129
inlink
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
Definition: filter_design.txt:212
av_asprintf
char * av_asprintf(const char *fmt,...)
Definition: avstring.c:115
XMedianContext::median_frames
int(* median_frames)(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
Definition: vf_xmedian.c:60
av_frame_free
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
Definition: frame.c:160
AV_PIX_FMT_YUVA422P9
#define AV_PIX_FMT_YUVA422P9
Definition: pixfmt.h:514
XMedianContext::linesize
int * linesize
Definition: vf_xmedian.c:55
AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:374
pixdesc.h
AV_PIX_FMT_YUVA420P16
#define AV_PIX_FMT_YUVA420P16
Definition: pixfmt.h:521
AV_PIX_FMT_YUVA420P10
#define AV_PIX_FMT_YUVA420P10
Definition: pixfmt.h:516
AVOption
AVOption.
Definition: opt.h:346
AV_PIX_FMT_YUV420P10
#define AV_PIX_FMT_YUV420P10
Definition: pixfmt.h:478
FRAMESYNC_DEFINE_CLASS
#define FRAMESYNC_DEFINE_CLASS(name, context, field)
Definition: framesync.h:351
FLAGS
#define FLAGS
Definition: cmdutils.c:581
XMedianContext::nb_frames
int nb_frames
Definition: vf_xmedian.c:39
AV_PIX_FMT_YUV440P
@ AV_PIX_FMT_YUV440P
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
Definition: pixfmt.h:106
AVFilter::name
const char * name
Filter name.
Definition: avfilter.h:170
FFFrameSync
Frame sync structure.
Definition: framesync.h:168
EXT_INFINITY
@ EXT_INFINITY
Extend the frame to infinity.
Definition: framesync.h:75
ThreadData::out
AVFrame * out
Definition: af_adeclick.c:527
video.h
ThreadData::in
AVFrame * in
Definition: af_adecorrelate.c:154
AV_PIX_FMT_YUVA422P10
#define AV_PIX_FMT_YUVA422P10
Definition: pixfmt.h:517
AV_PIX_FMT_GRAY9
#define AV_PIX_FMT_GRAY9
Definition: pixfmt.h:458
av_pix_fmt_count_planes
int av_pix_fmt_count_planes(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:3005
AV_PIX_FMT_YUVA420P9
#define AV_PIX_FMT_YUVA420P9
Definition: pixfmt.h:513
EXT_STOP
@ EXT_STOP
Completely stop all streams with this one.
Definition: framesync.h:65
AV_PIX_FMT_GBRP14
#define AV_PIX_FMT_GBRP14
Definition: pixfmt.h:496
AV_PIX_FMT_GBRAP
@ AV_PIX_FMT_GBRAP
planar GBRA 4:4:4:4 32bpp
Definition: pixfmt.h:212
XMedianContext::planes
int planes
Definition: vf_xmedian.c:41
XMedianContext::fs
FFFrameSync fs
Definition: vf_xmedian.c:58
AV_PIX_FMT_GBRP10
#define AV_PIX_FMT_GBRP10
Definition: pixfmt.h:494
AV_PIX_FMT_YUVA444P16
#define AV_PIX_FMT_YUVA444P16
Definition: pixfmt.h:523
FFFrameSyncIn
Input stream structure.
Definition: framesync.h:102
AV_PIX_FMT_YUV422P9
#define AV_PIX_FMT_YUV422P9
Definition: pixfmt.h:476
AV_PIX_FMT_GRAY16
#define AV_PIX_FMT_GRAY16
Definition: pixfmt.h:462
FFFrameSyncIn::sync
unsigned sync
Synchronization level: frames on input at the highest sync level will generate output frame events.
Definition: framesync.h:160
AVFILTER_FLAG_DYNAMIC_INPUTS
#define AVFILTER_FLAG_DYNAMIC_INPUTS
The number of the filter inputs is not determined just by AVFilter.inputs.
Definition: avfilter.h:106
config_output
static int config_output(AVFilterLink *outlink)
Definition: vf_xmedian.c:234
AVFilterPad
A filter pad used for either input or output.
Definition: internal.h:33
FFDIFFSIGN
#define FFDIFFSIGN(x, y)
Comparator.
Definition: macros.h:45
AV_PIX_FMT_YUV444P10
#define AV_PIX_FMT_YUV444P10
Definition: pixfmt.h:481
AV_PIX_FMT_YUVJ411P
@ AV_PIX_FMT_YUVJ411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples) full scale (JPEG), deprecated in favor ...
Definition: pixfmt.h:283
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
av_cold
#define av_cold
Definition: attributes.h:90
AV_PIX_FMT_YUV422P16
#define AV_PIX_FMT_YUV422P16
Definition: pixfmt.h:490
AV_PIX_FMT_YUVJ422P
@ AV_PIX_FMT_YUVJ422P
planar YUV 4:2:2, 16bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV422P and setting col...
Definition: pixfmt.h:86
AV_PIX_FMT_GBRAP10
#define AV_PIX_FMT_GBRAP10
Definition: pixfmt.h:498
width
#define width
av_image_fill_linesizes
int av_image_fill_linesizes(int linesizes[4], enum AVPixelFormat pix_fmt, int width)
Fill plane linesizes for an image with pixel format pix_fmt and width width.
Definition: imgutils.c:89
s
#define s(width, name)
Definition: cbs_vp9.c:198
AV_PIX_FMT_GBRAP12
#define AV_PIX_FMT_GBRAP12
Definition: pixfmt.h:499
AV_PIX_FMT_YUVA420P
@ AV_PIX_FMT_YUVA420P
planar YUV 4:2:0, 20bpp, (1 Cr & Cb sample per 2x2 Y & A samples)
Definition: pixfmt.h:108
AV_PIX_FMT_YUV444P16
#define AV_PIX_FMT_YUV444P16
Definition: pixfmt.h:491
AV_CEIL_RSHIFT
#define AV_CEIL_RSHIFT(a, b)
Definition: common.h:59
XMedianContext::depth
int depth
Definition: vf_xmedian.c:47
AV_PIX_FMT_YUVA444P12
#define AV_PIX_FMT_YUVA444P12
Definition: pixfmt.h:520
AV_PIX_FMT_YUV420P9
#define AV_PIX_FMT_YUV420P9
Definition: pixfmt.h:475
AV_PIX_FMT_YUV420P16
#define AV_PIX_FMT_YUV420P16
Definition: pixfmt.h:489
process_frame
static int process_frame(FFFrameSync *fs)
Definition: vf_xmedian.c:198
ctx
AVFormatContext * ctx
Definition: movenc.c:49
AV_PIX_FMT_GRAY14
#define AV_PIX_FMT_GRAY14
Definition: pixfmt.h:461
av_frame_clone
AVFrame * av_frame_clone(const AVFrame *src)
Create a new frame that references the same data as src.
Definition: frame.c:593
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:142
AV_PIX_FMT_YUV420P
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:73
FILTER_INPUTS
#define FILTER_INPUTS(array)
Definition: internal.h:182
AV_PIX_FMT_YUVJ444P
@ AV_PIX_FMT_YUVJ444P
planar YUV 4:4:4, 24bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV444P and setting col...
Definition: pixfmt.h:87
arg
const char * arg
Definition: jacosubdec.c:67
XMedianContext::data
uint8_t ** data
Definition: vf_xmedian.c:54
AV_PIX_FMT_GRAY10
#define AV_PIX_FMT_GRAY10
Definition: pixfmt.h:459
AV_PIX_FMT_GBRP16
#define AV_PIX_FMT_GBRP16
Definition: pixfmt.h:497
XMedianContext::width
int width[4]
Definition: vf_xmedian.c:51
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:66
NULL
#define NULL
Definition: coverity.c:32
fs
#define fs(width, name, subs,...)
Definition: cbs_vp9.c:200
init
static av_cold int init(AVFilterContext *ctx)
Definition: vf_xmedian.c:93
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
ff_append_inpad_free_name
int ff_append_inpad_free_name(AVFilterContext *f, AVFilterPad *p)
Definition: avfilter.c:132
AV_PIX_FMT_YUVJ420P
@ AV_PIX_FMT_YUVJ420P
planar YUV 4:2:0, 12bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV420P and setting col...
Definition: pixfmt.h:85
AV_PIX_FMT_YUV440P10
#define AV_PIX_FMT_YUV440P10
Definition: pixfmt.h:480
AV_PIX_FMT_YUV422P10
#define AV_PIX_FMT_YUV422P10
Definition: pixfmt.h:479
AV_PIX_FMT_GRAY8
@ AV_PIX_FMT_GRAY8
Y , 8bpp.
Definition: pixfmt.h:81
AV_PIX_FMT_GBRP9
#define AV_PIX_FMT_GBRP9
Definition: pixfmt.h:493
XMedianContext::height
int height[4]
Definition: vf_xmedian.c:52
XMedianContext::nb_threads
int nb_threads
Definition: vf_xmedian.c:40
TFLAGS
#define TFLAGS
Definition: af_afade.c:65
qsort.h
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:94
AV_PIX_FMT_YUV422P12
#define AV_PIX_FMT_YUV422P12
Definition: pixfmt.h:483
AV_PIX_FMT_YUV444P12
#define AV_PIX_FMT_YUV444P12
Definition: pixfmt.h:485
ff_filter_process_command
int ff_filter_process_command(AVFilterContext *ctx, const char *cmd, const char *arg, char *res, int res_len, int flags)
Generic processing of user supplied commands that are set in the same way as the filter options.
Definition: avfilter.c:887
compare8
static int compare8(const void *p1, const void *p2)
Definition: vf_xmedian.c:115
height
#define height
AV_PIX_FMT_YUVA444P
@ AV_PIX_FMT_YUVA444P
planar YUV 4:4:4 32bpp, (1 Cr & Cb sample per 1x1 Y & A samples)
Definition: pixfmt.h:174
AV_PIX_FMT_YUVA444P10
#define AV_PIX_FMT_YUVA444P10
Definition: pixfmt.h:518
ff_vf_xmedian
const AVFilter ff_vf_xmedian
XMedianContext::desc
const AVPixFmtDescriptor * desc
Definition: vf_xmedian.c:37
update_index
static void update_index(XMedianContext *s)
Definition: vf_xmedian.c:190
compare16
static int compare16(const void *p1, const void *p2)
Definition: vf_xmedian.c:122
XMedianContext
Definition: vf_xmedian.c:35
internal.h
AVFILTER_DEFINE_CLASS
#define AVFILTER_DEFINE_CLASS(fname)
Definition: internal.h:323
AV_OPT_TYPE_FLOAT
@ AV_OPT_TYPE_FLOAT
Definition: opt.h:238
XMedianContext::index
int index
Definition: vf_xmedian.c:46
pixel_fmts
static enum AVPixelFormat pixel_fmts[]
Definition: vf_xmedian.c:63
ff_vf_tmedian
const AVFilter ff_vf_tmedian
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:256
AV_PIX_FMT_GBRP12
#define AV_PIX_FMT_GBRP12
Definition: pixfmt.h:495
XMedianContext::linesizes
int linesizes[4]
Definition: vf_xmedian.c:50
ff_filter_get_nb_threads
int ff_filter_get_nb_threads(AVFilterContext *ctx)
Get number of threads for current filter instance.
Definition: avfilter.c:827
XMedianContext::max
int max
Definition: vf_xmedian.c:48
ThreadData
Used for passing data between threads.
Definition: dsddec.c:71
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
AV_PIX_FMT_YUVJ440P
@ AV_PIX_FMT_YUVJ440P
planar YUV 4:4:0 full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV440P and setting color_range
Definition: pixfmt.h:107
AVFilterPad::name
const char * name
Pad name.
Definition: internal.h:39
av_calloc
void * av_calloc(size_t nmemb, size_t size)
Definition: mem.c:264
AV_PIX_FMT_YUV444P9
#define AV_PIX_FMT_YUV444P9
Definition: pixfmt.h:477
AVFilter
Filter definition.
Definition: avfilter.h:166
ret
ret
Definition: filter_design.txt:187
AVFilterPad::type
enum AVMediaType type
AVFilterPad type.
Definition: internal.h:44
XMedianContext::nb_inputs
int nb_inputs
Definition: vf_xmedian.c:38
AV_PIX_FMT_YUVA444P9
#define AV_PIX_FMT_YUVA444P9
Definition: pixfmt.h:515
ff_framesync_init
int ff_framesync_init(FFFrameSync *fs, AVFilterContext *parent, unsigned nb_in)
Initialize a frame sync structure.
Definition: framesync.c:86
AV_PIX_FMT_YUV420P12
#define AV_PIX_FMT_YUV420P12
Definition: pixfmt.h:482
XMedianContext::frames
AVFrame ** frames
Definition: vf_xmedian.c:57
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... 
..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. 
bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector 
Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
AV_PIX_FMT_YUV422P14
#define AV_PIX_FMT_YUV422P14
Definition: pixfmt.h:487
OFFSET
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf default minimum maximum flags name is the option keep it simple and lowercase description are in without and describe what they for example set the foo of the bar offset is the offset of the field in your see the OFFSET() macro
FFFrameSyncIn::before
enum FFFrameSyncExtMode before
Extrapolation mode for timestamps before the first frame.
Definition: framesync.h:107
XMedianContext::percentile
float percentile
Definition: vf_xmedian.c:42
framesync.h
XMedianContext::radius
int radius
Definition: vf_xmedian.c:45
AV_PIX_FMT_NONE
@ AV_PIX_FMT_NONE
Definition: pixfmt.h:72
AV_PIX_FMT_YUVA422P12
#define AV_PIX_FMT_YUVA422P12
Definition: pixfmt.h:519
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Definition: opt.h:235
avfilter.h
uninit
static av_cold void uninit(AVFilterContext *ctx)
Definition: vf_xmedian.c:312
planes
static const struct @400 planes[]
AV_PIX_FMT_YUV444P
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:78
activate
static int activate(AVFilterContext *ctx)
Definition: vf_xmedian.c:325
AVFilterContext
An instance of a filter.
Definition: avfilter.h:407
XMedianContext::nb_planes
int nb_planes
Definition: vf_xmedian.c:49
AV_PIX_FMT_GBRP
@ AV_PIX_FMT_GBRP
planar GBR 4:4:4 24bpp
Definition: pixfmt.h:165
AVFILTER_FLAG_SLICE_THREADS
#define AVFILTER_FLAG_SLICE_THREADS
The filter supports multithreading by splitting frames into multiple parts and processing them concur...
Definition: avfilter.h:117
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
AV_PIX_FMT_YUV422P
@ AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Definition: pixfmt.h:77
mem.h
AVPixFmtDescriptor
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
Definition: pixdesc.h:69
FILTER_OUTPUTS
#define FILTER_OUTPUTS(array)
Definition: internal.h:183
outputs
static const AVFilterPad outputs[]
Definition: vf_xmedian.c:331
av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:34
XMedianContext::xmedian
int xmedian
Definition: vf_xmedian.c:44
AV_PIX_FMT_YUV411P
@ AV_PIX_FMT_YUV411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
Definition: pixfmt.h:80
AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
#define AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
Same as AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC, except that the filter will have its filter_frame() c...
Definition: avfilter.h:155
imgutils.h
AVERROR_BUG
#define AVERROR_BUG
Internal bug, also see AVERROR_BUG2.
Definition: error.h:52
AV_PIX_FMT_YUV410P
@ AV_PIX_FMT_YUV410P
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)
Definition: pixfmt.h:79
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
FFFrameSyncIn::after
enum FFFrameSyncExtMode after
Extrapolation mode for timestamps after the last frame.
Definition: framesync.h:112
AV_PIX_FMT_YUV440P12
#define AV_PIX_FMT_YUV440P12
Definition: pixfmt.h:484
AV_PIX_FMT_YUV444P14
#define AV_PIX_FMT_YUV444P14
Definition: pixfmt.h:488
ff_framesync_activate
int ff_framesync_activate(FFFrameSync *fs)
Examine the frames in the filter's input and try to produce output.
Definition: framesync.c:355
avstring.h
AV_PIX_FMT_GRAY12
#define AV_PIX_FMT_GRAY12
Definition: pixfmt.h:460
ff_filter_execute
static av_always_inline int ff_filter_execute(AVFilterContext *ctx, avfilter_action_func *func, void *arg, int *ret, int nb_jobs)
Definition: internal.h:134
int
int
Definition: ffmpeg_filter.c:424
AV_PIX_FMT_YUVA422P
@ AV_PIX_FMT_YUVA422P
planar YUV 4:2:2 24bpp, (1 Cr & Cb sample per 2x1 Y & A samples)
Definition: pixfmt.h:173
AV_PIX_FMT_YUV420P14
#define AV_PIX_FMT_YUV420P14
Definition: pixfmt.h:486