FFmpeg
vf_xmedian.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2019 Paul B Mahol
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 #include "config_components.h"
22 
23 #include "libavutil/avstring.h"
24 #include "libavutil/imgutils.h"
25 #include "libavutil/intreadwrite.h"
26 #include "libavutil/opt.h"
27 #include "libavutil/pixdesc.h"
28 #include "libavutil/qsort.h"
29 
30 #include "avfilter.h"
31 #include "formats.h"
32 #include "internal.h"
33 #include "framesync.h"
34 #include "video.h"
35 
36 typedef struct XMedianContext {
37  const AVClass *class;
39  int nb_inputs;
40  int nb_frames;
42  int planes;
43  float percentile;
44 
45  int xmedian;
46  int radius;
47  int index;
48  int depth;
49  int max;
50  int nb_planes;
51  int linesizes[4];
52  int width[4];
53  int height[4];
54 
55  uint8_t **data;
56  int *linesize;
57 
60 
61  int (*median_frames)(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs);
63 
64 static const enum AVPixelFormat pixel_fmts[] = {
92 };
93 
95 {
96  XMedianContext *s = ctx->priv;
97 
98  if (!s->xmedian)
99  s->nb_inputs = s->radius * 2 + 1;
100 
101  if (s->nb_inputs & 1)
102  s->index = s->radius * 2.f * s->percentile;
103  else
104  s->index = av_clip(s->radius * 2.f * s->percentile, 1, s->nb_inputs - 1);
105  s->frames = av_calloc(s->nb_inputs, sizeof(*s->frames));
106  if (!s->frames)
107  return AVERROR(ENOMEM);
108 
109  return 0;
110 }
111 
112 typedef struct ThreadData {
113  AVFrame **in, *out;
114 } ThreadData;
115 
/* Three-way comparison of two uint8_t samples, used as the AV_QSORT comparator. */
static int compare8(const void *p1, const void *p2)
{
    const uint8_t *a = p1;
    const uint8_t *b = p2;
    const int lhs = *a;
    const int rhs = *b;

    return FFDIFFSIGN(lhs, rhs);
}
122 
/* Three-way comparison of two uint16_t samples, used as the AV_QSORT comparator. */
static int compare16(const void *p1, const void *p2)
{
    const uint16_t *a = p1;
    const uint16_t *b = p2;
    const int lhs = *a;
    const int rhs = *b;

    return FFDIFFSIGN(lhs, rhs);
}
129 
130 #define MEDIAN_SLICE(name, type, comparei) \
131 static int median_frames ## name(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs) \
132 { \
133  XMedianContext *s = ctx->priv; \
134  ThreadData *td = arg; \
135  AVFrame **in = td->in; \
136  AVFrame *out = td->out; \
137  const int nb_inputs = s->nb_inputs; \
138  uint8_t **srcf = s->data + jobnr * nb_inputs; \
139  int *linesize = s->linesize + jobnr * nb_inputs; \
140  const int radius = s->radius; \
141  const int index = s->index; \
142  type values[256]; \
143  \
144  for (int p = 0; p < s->nb_planes; p++) { \
145  const int slice_start = (s->height[p] * jobnr) / nb_jobs; \
146  const int slice_end = (s->height[p] * (jobnr+1)) / nb_jobs; \
147  const int width = s->width[p]; \
148  type *dst = (type *)(out->data[p] + slice_start * out->linesize[p]); \
149  ptrdiff_t dst_linesize = out->linesize[p] / sizeof(type); \
150  \
151  if (!((1 << p) & s->planes)) { \
152  av_image_copy_plane((uint8_t *)dst, out->linesize[p], \
153  in[radius]->data[p] + slice_start * in[radius]->linesize[p], \
154  in[radius]->linesize[p], \
155  s->linesizes[p], slice_end - slice_start); \
156  continue; \
157  } \
158  \
159  for (int i = 0; i < nb_inputs; i++) \
160  linesize[i] = in[i]->linesize[p]; \
161  \
162  for (int i = 0; i < nb_inputs; i++) \
163  srcf[i] = in[i]->data[p] + slice_start * linesize[i]; \
164  \
165  for (int y = slice_start; y < slice_end; y++) { \
166  for (int x = 0; x < width; x++) { \
167  for (int i = 0; i < nb_inputs; i++) { \
168  const type *src = (const type *)srcf[i]; \
169  values[i] = src[x]; \
170  } \
171  \
172  AV_QSORT(values, nb_inputs, type, comparei); \
173  if (nb_inputs & 1) \
174  dst[x] = values[index]; \
175  else \
176  dst[x] = (values[index] + values[index - 1]) >> 1; \
177  } \
178  \
179  dst += dst_linesize; \
180  for (int i = 0; i < nb_inputs; i++) \
181  srcf[i] += linesize[i]; \
182  } \
183  } \
184  \
185  return 0; \
186 }
187 
188 MEDIAN_SLICE(8, uint8_t, compare8)
189 MEDIAN_SLICE(16, uint16_t, compare16)
190 
192 {
193  if (s->nb_inputs & 1)
194  s->index = s->radius * 2.f * s->percentile;
195  else
196  s->index = av_clip(s->radius * 2.f * s->percentile, 1, s->nb_inputs - 1);
197 }
198 
200 {
201  AVFilterContext *ctx = fs->parent;
202  AVFilterLink *outlink = ctx->outputs[0];
203  XMedianContext *s = fs->opaque;
204  AVFrame **in = s->frames;
205  AVFrame *out;
206  ThreadData td;
207  int i, ret;
208 
209  update_index(s);
210 
211  for (i = 0; i < s->nb_inputs; i++) {
212  if ((ret = ff_framesync_get_frame(&s->fs, i, &in[i], 0)) < 0)
213  return ret;
214  }
215 
216  if (ctx->is_disabled) {
217  out = av_frame_clone(in[0]);
218  } else {
219  out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
220  }
221  if (!out)
222  return AVERROR(ENOMEM);
223  out->pts = av_rescale_q(s->fs.pts, s->fs.time_base, outlink->time_base);
224 
225  if (!ctx->is_disabled) {
226  td.in = in;
227  td.out = out;
228  ff_filter_execute(ctx, s->median_frames, &td, NULL,
229  FFMIN(s->height[1], s->nb_threads));
230  }
231 
232  return ff_filter_frame(outlink, out);
233 }
234 
235 static int config_output(AVFilterLink *outlink)
236 {
237  AVFilterContext *ctx = outlink->src;
238  XMedianContext *s = ctx->priv;
239  AVRational frame_rate = ctx->inputs[0]->frame_rate;
240  AVRational sar = ctx->inputs[0]->sample_aspect_ratio;
241  AVFilterLink *inlink = ctx->inputs[0];
242  int height = ctx->inputs[0]->h;
243  int width = ctx->inputs[0]->w;
244  FFFrameSyncIn *in;
245  int i, ret;
246 
247  for (int i = 1; i < s->nb_inputs && s->xmedian; i++) {
248  if (ctx->inputs[i]->h != height || ctx->inputs[i]->w != width) {
249  av_log(ctx, AV_LOG_ERROR, "Input %d size (%dx%d) does not match input %d size (%dx%d).\n", i, ctx->inputs[i]->w, ctx->inputs[i]->h, 0, width, height);
250  return AVERROR(EINVAL);
251  }
252  }
253 
254  s->desc = av_pix_fmt_desc_get(outlink->format);
255  if (!s->desc)
256  return AVERROR_BUG;
257  s->nb_planes = av_pix_fmt_count_planes(outlink->format);
258  s->depth = s->desc->comp[0].depth;
259  s->max = (1 << s->depth) - 1;
260  s->nb_threads = ff_filter_get_nb_threads(ctx);
261 
262  if (s->depth <= 8)
263  s->median_frames = median_frames8;
264  else
265  s->median_frames = median_frames16;
266 
267  if ((ret = av_image_fill_linesizes(s->linesizes, inlink->format, inlink->w)) < 0)
268  return ret;
269 
270  s->width[1] = s->width[2] = AV_CEIL_RSHIFT(inlink->w, s->desc->log2_chroma_w);
271  s->width[0] = s->width[3] = inlink->w;
272  s->height[1] = s->height[2] = AV_CEIL_RSHIFT(inlink->h, s->desc->log2_chroma_h);
273  s->height[0] = s->height[3] = inlink->h;
274 
275  s->data = av_calloc(s->nb_threads * s->nb_inputs, sizeof(*s->data));
276  if (!s->data)
277  return AVERROR(ENOMEM);
278 
279  s->linesize = av_calloc(s->nb_threads * s->nb_inputs, sizeof(*s->linesize));
280  if (!s->linesize)
281  return AVERROR(ENOMEM);
282 
283  if (!s->xmedian)
284  return 0;
285 
286  outlink->w = width;
287  outlink->h = height;
288  outlink->frame_rate = frame_rate;
289  outlink->sample_aspect_ratio = sar;
290 
291  if ((ret = ff_framesync_init(&s->fs, ctx, s->nb_inputs)) < 0)
292  return ret;
293 
294  in = s->fs.in;
295  s->fs.opaque = s;
296  s->fs.on_event = process_frame;
297 
298  for (i = 0; i < s->nb_inputs; i++) {
299  AVFilterLink *inlink = ctx->inputs[i];
300 
301  in[i].time_base = inlink->time_base;
302  in[i].sync = 1;
303  in[i].before = EXT_STOP;
304  in[i].after = EXT_INFINITY;
305  }
306 
307  ret = ff_framesync_configure(&s->fs);
308  outlink->time_base = s->fs.time_base;
309 
310  return ret;
311 }
312 
314 {
315  XMedianContext *s = ctx->priv;
316 
317  ff_framesync_uninit(&s->fs);
318 
319  for (int i = 0; i < s->nb_frames && s->frames && !s->xmedian; i++)
320  av_frame_free(&s->frames[i]);
321  av_freep(&s->frames);
322  av_freep(&s->data);
323  av_freep(&s->linesize);
324 }
325 
327 {
328  XMedianContext *s = ctx->priv;
329  return ff_framesync_activate(&s->fs);
330 }
331 
332 #if CONFIG_XMEDIAN_FILTER
333 static av_cold int xmedian_init(AVFilterContext *ctx)
334 {
335  XMedianContext *s = ctx->priv;
336  int ret;
337 
338  s->xmedian = 1;
339 
340  s->radius = s->nb_inputs / 2;
341 
342  for (int i = 0; i < s->nb_inputs; i++) {
343  AVFilterPad pad = { 0 };
344 
345  pad.type = AVMEDIA_TYPE_VIDEO;
346  pad.name = av_asprintf("input%d", i);
347  if (!pad.name)
348  return AVERROR(ENOMEM);
349 
350  if ((ret = ff_append_inpad_free_name(ctx, &pad)) < 0)
351  return ret;
352  }
353 
354  return init(ctx);
355 }
356 
357 #define OFFSET(x) offsetof(XMedianContext, x)
358 #define FLAGS AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_FILTERING_PARAM
359 #define TFLAGS AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_RUNTIME_PARAM
360 
361 static const AVOption xmedian_options[] = {
362  { "inputs", "set number of inputs", OFFSET(nb_inputs), AV_OPT_TYPE_INT, {.i64=3}, 3, 255, .flags = FLAGS },
363  { "planes", "set planes to filter", OFFSET(planes), AV_OPT_TYPE_INT, {.i64=15}, 0, 15, .flags =TFLAGS },
364  { "percentile", "set percentile", OFFSET(percentile),AV_OPT_TYPE_FLOAT,{.dbl=0.5}, 0, 1, .flags =TFLAGS },
365  { NULL },
366 };
367 
368 static const AVFilterPad outputs[] = {
369  {
370  .name = "default",
371  .type = AVMEDIA_TYPE_VIDEO,
372  .config_props = config_output,
373  },
374 };
375 
377 
378 const AVFilter ff_vf_xmedian = {
379  .name = "xmedian",
380  .description = NULL_IF_CONFIG_SMALL("Pick median pixels from several video inputs."),
381  .priv_size = sizeof(XMedianContext),
382  .priv_class = &xmedian_class,
385  .preinit = xmedian_framesync_preinit,
386  .init = xmedian_init,
387  .uninit = uninit,
388  .activate = activate,
391  .process_command = ff_filter_process_command,
392 };
393 
394 #endif /* CONFIG_XMEDIAN_FILTER */
395 
396 #if CONFIG_TMEDIAN_FILTER
397 static int tmedian_filter_frame(AVFilterLink *inlink, AVFrame *in)
398 {
399  AVFilterContext *ctx = inlink->dst;
400  AVFilterLink *outlink = ctx->outputs[0];
401  XMedianContext *s = ctx->priv;
402  ThreadData td;
403  AVFrame *out;
404 
405  update_index(s);
406 
407  if (s->nb_frames < s->nb_inputs) {
408  s->frames[s->nb_frames] = in;
409  s->nb_frames++;
410  if (s->nb_frames < s->nb_inputs)
411  return 0;
412  } else {
413  av_frame_free(&s->frames[0]);
414  memmove(&s->frames[0], &s->frames[1], sizeof(*s->frames) * (s->nb_inputs - 1));
415  s->frames[s->nb_inputs - 1] = in;
416  }
417 
418  if (ctx->is_disabled) {
419  out = av_frame_clone(s->frames[0]);
420  if (!out)
421  return AVERROR(ENOMEM);
422  return ff_filter_frame(outlink, out);
423  }
424 
425  out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
426  if (!out)
427  return AVERROR(ENOMEM);
428  out->pts = s->frames[0]->pts;
429 
430  td.out = out;
431  td.in = s->frames;
432  ff_filter_execute(ctx, s->median_frames, &td, NULL,
433  FFMIN(s->height[1], s->nb_threads));
434 
435  return ff_filter_frame(outlink, out);
436 }
437 
438 static const AVOption tmedian_options[] = {
439  { "radius", "set median filter radius", OFFSET(radius), AV_OPT_TYPE_INT, {.i64=1}, 1, 127, .flags = FLAGS },
440  { "planes", "set planes to filter", OFFSET(planes), AV_OPT_TYPE_INT, {.i64=15}, 0, 15, .flags =TFLAGS },
441  { "percentile", "set percentile", OFFSET(percentile), AV_OPT_TYPE_FLOAT, {.dbl=0.5}, 0, 1, .flags =TFLAGS },
442  { NULL },
443 };
444 
445 static const AVFilterPad tmedian_inputs[] = {
446  {
447  .name = "default",
448  .type = AVMEDIA_TYPE_VIDEO,
449  .filter_frame = tmedian_filter_frame,
450  },
451 };
452 
453 static const AVFilterPad tmedian_outputs[] = {
454  {
455  .name = "default",
456  .type = AVMEDIA_TYPE_VIDEO,
457  .config_props = config_output,
458  },
459 };
460 
461 AVFILTER_DEFINE_CLASS(tmedian);
462 
463 const AVFilter ff_vf_tmedian = {
464  .name = "tmedian",
465  .description = NULL_IF_CONFIG_SMALL("Pick median pixels from successive frames."),
466  .priv_size = sizeof(XMedianContext),
467  .priv_class = &tmedian_class,
468  FILTER_INPUTS(tmedian_inputs),
469  FILTER_OUTPUTS(tmedian_outputs),
471  .init = init,
472  .uninit = uninit,
474  .process_command = ff_filter_process_command,
475 };
476 
477 #endif /* CONFIG_TMEDIAN_FILTER */
ff_get_video_buffer
AVFrame * ff_get_video_buffer(AVFilterLink *link, int w, int h)
Request a picture buffer with a specific set of permissions.
Definition: video.c:101
AV_PIX_FMT_YUVA422P16
#define AV_PIX_FMT_YUVA422P16
Definition: pixfmt.h:502
AV_PIX_FMT_GBRAP16
#define AV_PIX_FMT_GBRAP16
Definition: pixfmt.h:481
FFFrameSyncIn::time_base
AVRational time_base
Time base for the incoming frames.
Definition: framesync.h:117
ff_framesync_configure
int ff_framesync_configure(FFFrameSync *fs)
Configure a frame sync structure.
Definition: framesync.c:134
td
#define td
Definition: regdef.h:70
AVPixelFormat
AVPixelFormat
Pixel format.
Definition: pixfmt.h:64
planes
static const struct @346 planes[]
av_clip
#define av_clip
Definition: common.h:95
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
ff_framesync_uninit
void ff_framesync_uninit(FFFrameSync *fs)
Free all memory currently allocated.
Definition: framesync.c:304
out
FILE * out
Definition: movenc.c:54
ff_filter_frame
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
Definition: avfilter.c:969
av_pix_fmt_desc_get
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:2888
ff_framesync_get_frame
int ff_framesync_get_frame(FFFrameSync *fs, unsigned in, AVFrame **rframe, unsigned get)
Get the current frame in an input.
Definition: framesync.c:267
FILTER_PIXFMTS_ARRAY
#define FILTER_PIXFMTS_ARRAY(array)
Definition: internal.h:174
MEDIAN_SLICE
#define MEDIAN_SLICE(name, type, comparei)
Definition: vf_xmedian.c:130
inlink
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
Definition: filter_design.txt:212
av_asprintf
char * av_asprintf(const char *fmt,...)
Definition: avstring.c:116
XMedianContext::median_frames
int(* median_frames)(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
Definition: vf_xmedian.c:61
av_frame_free
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
Definition: frame.c:99
AV_PIX_FMT_YUVA422P9
#define AV_PIX_FMT_YUVA422P9
Definition: pixfmt.h:494
XMedianContext::linesize
int * linesize
Definition: vf_xmedian.c:56
AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:330
pixdesc.h
AV_PIX_FMT_YUVA420P16
#define AV_PIX_FMT_YUVA420P16
Definition: pixfmt.h:501
AV_PIX_FMT_YUVA420P10
#define AV_PIX_FMT_YUVA420P10
Definition: pixfmt.h:496
AVOption
AVOption.
Definition: opt.h:251
AV_PIX_FMT_YUV420P10
#define AV_PIX_FMT_YUV420P10
Definition: pixfmt.h:459
FRAMESYNC_DEFINE_CLASS
#define FRAMESYNC_DEFINE_CLASS(name, context, field)
Definition: framesync.h:351
FLAGS
#define FLAGS
Definition: cmdutils.c:515
XMedianContext::nb_frames
int nb_frames
Definition: vf_xmedian.c:40
AV_PIX_FMT_YUV440P
@ AV_PIX_FMT_YUV440P
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
Definition: pixfmt.h:99
AVFilter::name
const char * name
Filter name.
Definition: avfilter.h:165
FFFrameSync
Frame sync structure.
Definition: framesync.h:168
EXT_INFINITY
@ EXT_INFINITY
Extend the frame to infinity.
Definition: framesync.h:75
ThreadData::out
AVFrame * out
Definition: af_adeclick.c:473
video.h
ThreadData::in
AVFrame * in
Definition: af_adecorrelate.c:154
AV_PIX_FMT_YUVA422P10
#define AV_PIX_FMT_YUVA422P10
Definition: pixfmt.h:497
AV_PIX_FMT_GRAY9
#define AV_PIX_FMT_GRAY9
Definition: pixfmt.h:439
formats.h
av_pix_fmt_count_planes
int av_pix_fmt_count_planes(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:2928
AV_PIX_FMT_YUVA420P9
#define AV_PIX_FMT_YUVA420P9
Definition: pixfmt.h:493
EXT_STOP
@ EXT_STOP
Completely stop all streams with this one.
Definition: framesync.h:65
AV_PIX_FMT_GBRP14
#define AV_PIX_FMT_GBRP14
Definition: pixfmt.h:477
AV_PIX_FMT_GBRAP
@ AV_PIX_FMT_GBRAP
planar GBRA 4:4:4:4 32bpp
Definition: pixfmt.h:205
XMedianContext::planes
int planes
Definition: vf_xmedian.c:42
XMedianContext::fs
FFFrameSync fs
Definition: vf_xmedian.c:59
AV_PIX_FMT_GBRP10
#define AV_PIX_FMT_GBRP10
Definition: pixfmt.h:475
AV_PIX_FMT_YUVA444P16
#define AV_PIX_FMT_YUVA444P16
Definition: pixfmt.h:503
FFFrameSyncIn
Input stream structure.
Definition: framesync.h:102
AV_PIX_FMT_YUV422P9
#define AV_PIX_FMT_YUV422P9
Definition: pixfmt.h:457
AV_PIX_FMT_GRAY16
#define AV_PIX_FMT_GRAY16
Definition: pixfmt.h:443
FFFrameSyncIn::sync
unsigned sync
Synchronization level: frames on input at the highest sync level will generate output frame events.
Definition: framesync.h:160
AVFILTER_FLAG_DYNAMIC_INPUTS
#define AVFILTER_FLAG_DYNAMIC_INPUTS
The number of the filter inputs is not determined just by AVFilter.inputs.
Definition: avfilter.h:106
config_output
static int config_output(AVFilterLink *outlink)
Definition: vf_xmedian.c:235
AVFilterPad
A filter pad used for either input or output.
Definition: internal.h:49
FFDIFFSIGN
#define FFDIFFSIGN(x, y)
Comparator.
Definition: macros.h:45
AV_PIX_FMT_YUV444P10
#define AV_PIX_FMT_YUV444P10
Definition: pixfmt.h:462
AV_PIX_FMT_YUVJ411P
@ AV_PIX_FMT_YUVJ411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples) full scale (JPEG), deprecated in favor ...
Definition: pixfmt.h:276
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
av_cold
#define av_cold
Definition: attributes.h:90
AV_PIX_FMT_YUV422P16
#define AV_PIX_FMT_YUV422P16
Definition: pixfmt.h:471
AV_PIX_FMT_YUVJ422P
@ AV_PIX_FMT_YUVJ422P
planar YUV 4:2:2, 16bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV422P and setting col...
Definition: pixfmt.h:79
AV_PIX_FMT_GBRAP10
#define AV_PIX_FMT_GBRAP10
Definition: pixfmt.h:479
width
#define width
av_image_fill_linesizes
int av_image_fill_linesizes(int linesizes[4], enum AVPixelFormat pix_fmt, int width)
Fill plane linesizes for an image with pixel format pix_fmt and width width.
Definition: imgutils.c:89
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:256
AV_PIX_FMT_GBRAP12
#define AV_PIX_FMT_GBRAP12
Definition: pixfmt.h:480
AV_PIX_FMT_YUVA420P
@ AV_PIX_FMT_YUVA420P
planar YUV 4:2:0, 20bpp, (1 Cr & Cb sample per 2x2 Y & A samples)
Definition: pixfmt.h:101
AV_PIX_FMT_YUV444P16
#define AV_PIX_FMT_YUV444P16
Definition: pixfmt.h:472
AV_CEIL_RSHIFT
#define AV_CEIL_RSHIFT(a, b)
Definition: common.h:50
XMedianContext::depth
int depth
Definition: vf_xmedian.c:48
outputs
static const AVFilterPad outputs[]
Definition: af_acontrast.c:172
AV_PIX_FMT_YUVA444P12
#define AV_PIX_FMT_YUVA444P12
Definition: pixfmt.h:500
AV_PIX_FMT_YUV420P9
#define AV_PIX_FMT_YUV420P9
Definition: pixfmt.h:456
AV_PIX_FMT_YUV420P16
#define AV_PIX_FMT_YUV420P16
Definition: pixfmt.h:470
process_frame
static int process_frame(FFFrameSync *fs)
Definition: vf_xmedian.c:199
ctx
AVFormatContext * ctx
Definition: movenc.c:48
AV_PIX_FMT_GRAY14
#define AV_PIX_FMT_GRAY14
Definition: pixfmt.h:442
av_frame_clone
AVFrame * av_frame_clone(const AVFrame *src)
Create a new frame that references the same data as src.
Definition: frame.c:465
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:142
AV_PIX_FMT_YUV420P
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:66
FILTER_INPUTS
#define FILTER_INPUTS(array)
Definition: internal.h:194
AV_PIX_FMT_YUVJ444P
@ AV_PIX_FMT_YUVJ444P
planar YUV 4:4:4, 24bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV444P and setting col...
Definition: pixfmt.h:80
arg
const char * arg
Definition: jacosubdec.c:67
XMedianContext::data
uint8_t ** data
Definition: vf_xmedian.c:55
AV_PIX_FMT_GRAY10
#define AV_PIX_FMT_GRAY10
Definition: pixfmt.h:440
AV_PIX_FMT_GBRP16
#define AV_PIX_FMT_GBRP16
Definition: pixfmt.h:478
XMedianContext::width
int width[4]
Definition: vf_xmedian.c:52
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:66
NULL
#define NULL
Definition: coverity.c:32
fs
#define fs(width, name, subs,...)
Definition: cbs_vp9.c:258
init
static av_cold int init(AVFilterContext *ctx)
Definition: vf_xmedian.c:94
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
ff_append_inpad_free_name
int ff_append_inpad_free_name(AVFilterContext *f, AVFilterPad *p)
Definition: avfilter.c:131
AV_PIX_FMT_YUVJ420P
@ AV_PIX_FMT_YUVJ420P
planar YUV 4:2:0, 12bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV420P and setting col...
Definition: pixfmt.h:78
AV_PIX_FMT_YUV440P10
#define AV_PIX_FMT_YUV440P10
Definition: pixfmt.h:461
AV_PIX_FMT_YUV422P10
#define AV_PIX_FMT_YUV422P10
Definition: pixfmt.h:460
AV_PIX_FMT_GRAY8
@ AV_PIX_FMT_GRAY8
Y , 8bpp.
Definition: pixfmt.h:74
AV_PIX_FMT_GBRP9
#define AV_PIX_FMT_GBRP9
Definition: pixfmt.h:474
XMedianContext::height
int height[4]
Definition: vf_xmedian.c:53
XMedianContext::nb_threads
int nb_threads
Definition: vf_xmedian.c:41
TFLAGS
#define TFLAGS
Definition: af_afade.c:65
qsort.h
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:115
AV_PIX_FMT_YUV422P12
#define AV_PIX_FMT_YUV422P12
Definition: pixfmt.h:464
AV_PIX_FMT_YUV444P12
#define AV_PIX_FMT_YUV444P12
Definition: pixfmt.h:466
ff_filter_process_command
int ff_filter_process_command(AVFilterContext *ctx, const char *cmd, const char *arg, char *res, int res_len, int flags)
Generic processing of user supplied commands that are set in the same way as the filter options.
Definition: avfilter.c:842
compare8
static int compare8(const void *p1, const void *p2)
Definition: vf_xmedian.c:116
height
#define height
AV_PIX_FMT_YUVA444P
@ AV_PIX_FMT_YUVA444P
planar YUV 4:4:4 32bpp, (1 Cr & Cb sample per 1x1 Y & A samples)
Definition: pixfmt.h:167
AV_PIX_FMT_YUVA444P10
#define AV_PIX_FMT_YUVA444P10
Definition: pixfmt.h:498
ff_vf_xmedian
const AVFilter ff_vf_xmedian
XMedianContext::desc
const AVPixFmtDescriptor * desc
Definition: vf_xmedian.c:38
update_index
static void update_index(XMedianContext *s)
Definition: vf_xmedian.c:191
compare16
static int compare16(const void *p1, const void *p2)
Definition: vf_xmedian.c:123
XMedianContext
Definition: vf_xmedian.c:36
internal.h
AVFILTER_DEFINE_CLASS
#define AVFILTER_DEFINE_CLASS(fname)
Definition: internal.h:329
AV_OPT_TYPE_FLOAT
@ AV_OPT_TYPE_FLOAT
Definition: opt.h:228
XMedianContext::index
int index
Definition: vf_xmedian.c:47
pixel_fmts
static enum AVPixelFormat pixel_fmts[]
Definition: vf_xmedian.c:64
ff_vf_tmedian
const AVFilter ff_vf_tmedian
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:269
AV_PIX_FMT_GBRP12
#define AV_PIX_FMT_GBRP12
Definition: pixfmt.h:476
XMedianContext::linesizes
int linesizes[4]
Definition: vf_xmedian.c:51
ff_filter_get_nb_threads
int ff_filter_get_nb_threads(AVFilterContext *ctx)
Get number of threads for current filter instance.
Definition: avfilter.c:777
XMedianContext::max
int max
Definition: vf_xmedian.c:49
ThreadData
Used for passing data between threads.
Definition: dsddec.c:69
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
AV_PIX_FMT_YUVJ440P
@ AV_PIX_FMT_YUVJ440P
planar YUV 4:4:0 full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV440P and setting color_range
Definition: pixfmt.h:100
AVFilterPad::name
const char * name
Pad name.
Definition: internal.h:55
av_calloc
void * av_calloc(size_t nmemb, size_t size)
Definition: mem.c:262
AV_PIX_FMT_YUV444P9
#define AV_PIX_FMT_YUV444P9
Definition: pixfmt.h:458
AVFilter
Filter definition.
Definition: avfilter.h:161
ret
ret
Definition: filter_design.txt:187
AVFilterPad::type
enum AVMediaType type
AVFilterPad type.
Definition: internal.h:60
XMedianContext::nb_inputs
int nb_inputs
Definition: vf_xmedian.c:39
AV_PIX_FMT_YUVA444P9
#define AV_PIX_FMT_YUVA444P9
Definition: pixfmt.h:495
ff_framesync_init
int ff_framesync_init(FFFrameSync *fs, AVFilterContext *parent, unsigned nb_in)
Initialize a frame sync structure.
Definition: framesync.c:86
AV_PIX_FMT_YUV420P12
#define AV_PIX_FMT_YUV420P12
Definition: pixfmt.h:463
XMedianContext::frames
AVFrame ** frames
Definition: vf_xmedian.c:58
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... 
..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. 
bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector 
Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
AV_PIX_FMT_YUV422P14
#define AV_PIX_FMT_YUV422P14
Definition: pixfmt.h:468
OFFSET
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf default minimum maximum flags name is the option keep it simple and lowercase description are in without and describe what they for example set the foo of the bar offset is the offset of the field in your see the OFFSET() macro
FFFrameSyncIn::before
enum FFFrameSyncExtMode before
Extrapolation mode for timestamps before the first frame.
Definition: framesync.h:107
XMedianContext::percentile
float percentile
Definition: vf_xmedian.c:43
framesync.h
XMedianContext::radius
int radius
Definition: vf_xmedian.c:46
AV_PIX_FMT_NONE
@ AV_PIX_FMT_NONE
Definition: pixfmt.h:65
AV_PIX_FMT_YUVA422P12
#define AV_PIX_FMT_YUVA422P12
Definition: pixfmt.h:499
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Definition: opt.h:225
avfilter.h
uninit
static av_cold void uninit(AVFilterContext *ctx)
Definition: vf_xmedian.c:313
AV_PIX_FMT_YUV444P
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:71
activate
static int activate(AVFilterContext *ctx)
Definition: vf_xmedian.c:326
AVFilterContext
An instance of a filter.
Definition: avfilter.h:392
XMedianContext::nb_planes
int nb_planes
Definition: vf_xmedian.c:50
AV_PIX_FMT_GBRP
@ AV_PIX_FMT_GBRP
planar GBR 4:4:4 24bpp
Definition: pixfmt.h:158
AVFILTER_FLAG_SLICE_THREADS
#define AVFILTER_FLAG_SLICE_THREADS
The filter supports multithreading by splitting frames into multiple parts and processing them concur...
Definition: avfilter.h:117
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
AV_PIX_FMT_YUV422P
@ AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Definition: pixfmt.h:70
AVPixFmtDescriptor
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
Definition: pixdesc.h:69
FILTER_OUTPUTS
#define FILTER_OUTPUTS(array)
Definition: internal.h:195
av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:34
XMedianContext::xmedian
int xmedian
Definition: vf_xmedian.c:45
AV_PIX_FMT_YUV411P
@ AV_PIX_FMT_YUV411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
Definition: pixfmt.h:73
AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
#define AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
Same as AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC, except that the filter will have its filter_frame() c...
Definition: avfilter.h:150
imgutils.h
AVERROR_BUG
#define AVERROR_BUG
Internal bug, also see AVERROR_BUG2.
Definition: error.h:52
AV_PIX_FMT_YUV410P
@ AV_PIX_FMT_YUV410P
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)
Definition: pixfmt.h:72
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
FFFrameSyncIn::after
enum FFFrameSyncExtMode after
Extrapolation mode for timestamps after the last frame.
Definition: framesync.h:112
AV_PIX_FMT_YUV440P12
#define AV_PIX_FMT_YUV440P12
Definition: pixfmt.h:465
AV_PIX_FMT_YUV444P14
#define AV_PIX_FMT_YUV444P14
Definition: pixfmt.h:469
ff_framesync_activate
int ff_framesync_activate(FFFrameSync *fs)
Examine the frames in the filter's input and try to produce output.
Definition: framesync.c:355
avstring.h
AV_PIX_FMT_GRAY12
#define AV_PIX_FMT_GRAY12
Definition: pixfmt.h:441
ff_filter_execute
static av_always_inline int ff_filter_execute(AVFilterContext *ctx, avfilter_action_func *func, void *arg, int *ret, int nb_jobs)
Definition: internal.h:146
int
int
Definition: ffmpeg_filter.c:156
AV_PIX_FMT_YUVA422P
@ AV_PIX_FMT_YUVA422P
planar YUV 4:2:2 24bpp, (1 Cr & Cb sample per 2x1 Y & A samples)
Definition: pixfmt.h:166
AV_PIX_FMT_YUV420P14
#define AV_PIX_FMT_YUV420P14
Definition: pixfmt.h:467