51 #define OFFSET(x) offsetof(VMAFMotionContext, x) 52 #define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM 62 int h, ptrdiff_t _img1_stride, ptrdiff_t _img2_stride)
64 ptrdiff_t img1_stride = _img1_stride /
sizeof(*img1);
65 ptrdiff_t img2_stride = _img2_stride /
sizeof(*img2);
69 for (i = 0; i <
h; i++) {
70 for (j = 0; j <
w; j++) {
71 sum +=
abs(img1[j] - img2[j]);
81 uint16_t *dst,
int w,
int h, ptrdiff_t _src_stride,
82 ptrdiff_t _dst_stride)
84 ptrdiff_t src_stride = _src_stride /
sizeof(*src);
85 ptrdiff_t dst_stride = _dst_stride /
sizeof(*dst);
86 int radius = filt_w / 2;
87 int borders_left = radius;
88 int borders_right = w - (filt_w - radius);
92 for (i = 0; i <
h; i++) {
93 for (j = 0; j < borders_left; j++) {
95 for (k = 0; k < filt_w; k++) {
96 int j_tap =
FFABS(j - radius + k);
98 j_tap = w - (j_tap - w + 1);
100 sum += filter[k] * src[i * src_stride + j_tap];
102 dst[i * dst_stride + j] = sum >>
BIT_SHIFT;
105 for (j = borders_left; j < borders_right; j++) {
107 for (k = 0; k < filt_w; k++) {
108 sum += filter[k] * src[i * src_stride + j - radius + k];
110 dst[i * dst_stride + j] = sum >>
BIT_SHIFT;
113 for (j = borders_right; j <
w; j++) {
115 for (k = 0; k < filt_w; k++) {
116 int j_tap =
FFABS(j - radius + k);
118 j_tap = w - (j_tap - w + 1);
120 sum += filter[k] * src[i * src_stride + j_tap];
122 dst[i * dst_stride + j] = sum >>
BIT_SHIFT;
127 #define conv_y_fn(type, bits) \ 128 static void convolution_y_##bits##bit(const uint16_t *filter, int filt_w, \ 129 const uint8_t *_src, uint16_t *dst, \ 130 int w, int h, ptrdiff_t _src_stride, \ 131 ptrdiff_t _dst_stride) \ 133 const type *src = (const type *) _src; \ 134 ptrdiff_t src_stride = _src_stride / sizeof(*src); \ 135 ptrdiff_t dst_stride = _dst_stride / sizeof(*dst); \ 136 int radius = filt_w / 2; \ 137 int borders_top = radius; \ 138 int borders_bottom = h - (filt_w - radius); \ 142 for (i = 0; i < borders_top; i++) { \ 143 for (j = 0; j < w; j++) { \ 145 for (k = 0; k < filt_w; k++) { \ 146 int i_tap = FFABS(i - radius + k); \ 148 i_tap = h - (i_tap - h + 1); \ 150 sum += filter[k] * src[i_tap * src_stride + j]; \ 152 dst[i * dst_stride + j] = sum >> bits; \ 155 for (i = borders_top; i < borders_bottom; i++) { \ 156 for (j = 0; j < w; j++) { \ 158 for (k = 0; k < filt_w; k++) { \ 159 sum += filter[k] * src[(i - radius + k) * src_stride + j]; \ 161 dst[i * dst_stride + j] = sum >> bits; \ 164 for (i = borders_bottom; i < h; i++) { \ 165 for (j = 0; j < w; j++) { \ 167 for (k = 0; k < filt_w; k++) { \ 168 int i_tap = FFABS(i - radius + k); \ 170 i_tap = h - (i_tap - h + 1); \ 172 sum += filter[k] * src[i_tap * src_stride + j]; \ 174 dst[i * dst_stride + j] = sum >> bits; \ 184 dsp->convolution_y = bpp == 10 ? convolution_y_10bit : convolution_y_8bit;
216 snprintf(value,
sizeof(value),
"%0.2f", d);
245 data_sz = (size_t) s->
stride * h;
252 for (i = 0; i < 5; i++) {
359 .
name =
"vmafmotion",
365 .priv_class = &vmafmotion_class,
366 .
inputs = vmafmotion_inputs,
#define AV_PIX_FMT_FLAG_PAL
Pixel format has a palette in data[1], values are indexes in this palette.
static int filter_frame(AVFilterLink *inlink, AVFrame *ref)
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
This structure describes decoded (raw) audio or video data.
static const AVFilterPad vmafmotion_inputs[]
Main libavfilter public API header.
AVFILTER_DEFINE_CLASS(vmafmotion)
int h
agreed upon image height
uint64_t(* sad)(const uint16_t *img1, const uint16_t *img2, int w, int h, ptrdiff_t img1_stride, ptrdiff_t img2_stride)
static av_cold void uninit(AVFilterContext *ctx)
static uint8_t img2[WIDTH *HEIGHT]
static const AVFilterPad vmafmotion_outputs[]
Filter design: in this document, the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: the query_formats method should set, for each input and each output link, the list of supported formats. For video links, that means pixel format. For audio links, that means channel layout, sample format (the sample packing is implied by the sample format) and sample rate. The lists are not just lists
static uint8_t img1[WIDTH *HEIGHT]
const char * name
Pad name.
AVFilterLink ** inputs
array of pointers to input links
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
AVComponentDescriptor comp[4]
Parameters that describe how pixels are packed.
GLsizei GLboolean const GLfloat * value
AVDictionary * metadata
metadata.
static int query_formats(AVFilterContext *ctx)
void(* convolution_x)(const uint16_t *filter, int filt_w, const uint16_t *src, uint16_t *dst, int w, int h, ptrdiff_t src_stride, ptrdiff_t dst_stride)
A filter pad used for either input or output.
A link between two filters.
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
filter_frame: For filters that do not use the activate callback, this method is called when a frame is pushed to the filter's input. It can be called at any time except in a reentrant way. If the input frame is enough to produce output, then the filter should push the output frames on the output link immediately. As an exception to the previous rule, if the input frame is enough to produce several output frames, then the filter needs output only at least one per link. The additional frames can be left buffered in the filter
#define AV_PIX_FMT_FLAG_RGB
The pixel format contains RGB-like data (as opposed to YUV/grayscale).
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
void * priv
private data for use by the filter
static uint64_t image_sad(const uint16_t *img1, const uint16_t *img2, int w, int h, ptrdiff_t _img1_stride, ptrdiff_t _img2_stride)
#define AV_PIX_FMT_FLAG_HWACCEL
Pixel format is an HW accelerated format.
static av_cold int init(AVFilterContext *ctx)
int w
agreed upon image width
uint64_t flags
Combination of AV_PIX_FMT_FLAG_...
double ff_vmafmotion_process(VMAFMotionData *s, AVFrame *ref)
uint8_t nb_components
The number of components each pixel has, (1-4)
static void do_vmafmotion(AVFilterContext *ctx, AVFrame *ref)
#define FFABS(a)
Absolute value, Note, INT_MIN / INT64_MIN result in undefined behavior as they are not representable ...
double ff_vmafmotion_uninit(VMAFMotionData *s)
static const AVFilterPad outputs[]
int format
agreed upon media format
#define AV_LOG_INFO
Standard information.
int linesize[AV_NUM_DATA_POINTERS]
For video, size in bytes of each picture line.
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
these buffered frames must be flushed immediately if a new input produces new output. The filter must not call request_frame to get more frames. It must just process the frame or queue it. The task of requesting more frames is left to the filter's request_frame method or the application. If a filter has several inputs
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
static int config_input_ref(AVFilterLink *inlink)
Describe the class of an AVClass context structure.
const char * name
Filter name.
AVFilter ff_vf_vmafmotion
#define AV_PIX_FMT_FLAG_BITSTREAM
All values of a component are bit-wise packed end to end.
AVFilterLink ** outputs
array of pointers to output links
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
int ff_vmafmotion_init(VMAFMotionData *s, int w, int h, enum AVPixelFormat fmt)
static void set_meta(AVDictionary **metadata, const char *key, float d)
int av_strerror(int errnum, char *errbuf, size_t errbuf_size)
Put a description of the AVERROR code errnum in errbuf.
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
static int ref[MAX_W *MAX_W]
static const AVOption vmafmotion_options[]
#define AV_PIX_FMT_FLAG_BE
Pixel format is big-endian.
void(* convolution_y)(const uint16_t *filter, int filt_w, const uint8_t *src, uint16_t *dst, int w, int h, ptrdiff_t src_stride, ptrdiff_t dst_stride)
AVFilterContext * dst
dest filter
static void convolution_x(const uint16_t *filter, int filt_w, const uint16_t *src, uint16_t *dst, int w, int h, ptrdiff_t _src_stride, ptrdiff_t _dst_stride)
static const float FILTER_5[5]
VMAFMotionDSPContext vmafdsp
#define FFSWAP(type, a, b)
Filter design: in this document, the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: the query_formats method should set, for each input and each output link, the list of supported formats. For video links, that means pixel format. For audio links, that means channel layout, sample format (the sample packing is implied by the sample format) and sample rate. The lists are not just lists, they are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining list, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
int depth
Number of bits in the component.
AVPixelFormat
Pixel format.
#define AV_PIX_FMT_FLAG_PLANAR
At least one pixel component is not in the first data plane.
#define conv_y_fn(type, bits)