[FFmpeg-cvslog] avfilter/af_earwax: fix filter behavior
Paul B Mahol
git at videolan.org
Mon Dec 7 22:11:33 EET 2020
ffmpeg | branch: master | Paul B Mahol <onemda at gmail.com> | Fri Dec 4 17:54:05 2020 +0100| [f41de0436cc8ce7221cd3702a51f3676cc689cf7] | committer: Paul B Mahol
avfilter/af_earwax: fix filter behavior
Previous filter output was incorrect. New one actually follows
graph in comments described on side of filter taps.
> http://git.videolan.org/gitweb.cgi/ffmpeg.git/?a=commit;h=f41de0436cc8ce7221cd3702a51f3676cc689cf7
---
libavfilter/af_earwax.c | 124 +++++++++++++++++++++++++++++++++----------
tests/fate/filter-audio.mak | 2 +-
tests/ref/fate/filter-earwax | 40 +++++++-------
3 files changed, 117 insertions(+), 49 deletions(-)
diff --git a/libavfilter/af_earwax.c b/libavfilter/af_earwax.c
index cdd2b4fc49..921d0a4c04 100644
--- a/libavfilter/af_earwax.c
+++ b/libavfilter/af_earwax.c
@@ -34,9 +34,9 @@
#include "audio.h"
#include "formats.h"
-#define NUMTAPS 64
+#define NUMTAPS 32
-static const int8_t filt[NUMTAPS] = {
+static const int8_t filt[NUMTAPS * 2] = {
/* 30° 330° */
4, -6, /* 32 tap stereo FIR filter. */
4, -11, /* One side filters as if the */
@@ -72,7 +72,10 @@ static const int8_t filt[NUMTAPS] = {
4, 0};
typedef struct EarwaxContext {
- int16_t taps[NUMTAPS * 2];
+ int16_t filter[2][NUMTAPS];
+ int16_t taps[4][NUMTAPS * 2];
+
+ AVFrame *frame[2];
} EarwaxContext;
static int query_formats(AVFilterContext *ctx)
@@ -83,7 +86,7 @@ static int query_formats(AVFilterContext *ctx)
AVFilterFormats *formats = NULL;
AVFilterChannelLayouts *layout = NULL;
- if ((ret = ff_add_format (&formats, AV_SAMPLE_FMT_S16 )) < 0 ||
+ if ((ret = ff_add_format (&formats, AV_SAMPLE_FMT_S16P )) < 0 ||
(ret = ff_set_common_formats (ctx , formats )) < 0 ||
(ret = ff_add_channel_layout (&layout , AV_CH_LAYOUT_STEREO )) < 0 ||
(ret = ff_set_common_channel_layouts (ctx , layout )) < 0 ||
@@ -94,7 +97,8 @@ static int query_formats(AVFilterContext *ctx)
}
//FIXME: replace with DSPContext.scalarproduct_int16
-static inline int16_t *scalarproduct(const int16_t *in, const int16_t *endin, int16_t *out)
+static inline int16_t *scalarproduct(const int16_t *in, const int16_t *endin,
+ const int16_t *filt, int16_t *out)
{
int32_t sample;
int16_t j;
@@ -103,7 +107,7 @@ static inline int16_t *scalarproduct(const int16_t *in, const int16_t *endin, in
sample = 0;
for (j = 0; j < NUMTAPS; j++)
sample += in[j] * filt[j];
- *out = av_clip_int16(sample >> 6);
+ *out = av_clip_int16(sample >> 7);
out++;
in++;
}
@@ -111,40 +115,102 @@ static inline int16_t *scalarproduct(const int16_t *in, const int16_t *endin, in
return out;
}
-static int filter_frame(AVFilterLink *inlink, AVFrame *insamples)
+static int config_input(AVFilterLink *inlink)
{
- AVFilterLink *outlink = inlink->dst->outputs[0];
- int16_t *taps, *endin, *in, *out;
- AVFrame *outsamples = ff_get_audio_buffer(outlink, insamples->nb_samples);
- int len;
+ EarwaxContext *s = inlink->dst->priv;
- if (!outsamples) {
- av_frame_free(&insamples);
- return AVERROR(ENOMEM);
+ for (int i = 0; i < NUMTAPS; i++) {
+ s->filter[0][i] = filt[i * 2];
+ s->filter[1][i] = filt[i * 2 + 1];
}
- av_frame_copy_props(outsamples, insamples);
- taps = ((EarwaxContext *)inlink->dst->priv)->taps;
- out = (int16_t *)outsamples->data[0];
- in = (int16_t *)insamples ->data[0];
+ return 0;
+}
+
+static void convolve(AVFilterContext *ctx, AVFrame *in,
+ int input_ch, int output_ch,
+ int filter_ch, int tap_ch)
+{
+ EarwaxContext *s = ctx->priv;
+ int16_t *taps, *endin, *dst, *src;
+ int len;
+
+ taps = s->taps[tap_ch];
+ dst = (int16_t *)s->frame[input_ch]->data[output_ch];
+ src = (int16_t *)in->data[input_ch];
- len = FFMIN(NUMTAPS, 2*insamples->nb_samples);
+ len = FFMIN(NUMTAPS, in->nb_samples);
// copy part of new input and process with saved input
- memcpy(taps+NUMTAPS, in, len * sizeof(*taps));
- out = scalarproduct(taps, taps + len, out);
+ memcpy(taps+NUMTAPS, src, len * sizeof(*taps));
+ dst = scalarproduct(taps, taps + len, s->filter[filter_ch], dst);
// process current input
- if (2*insamples->nb_samples >= NUMTAPS ){
- endin = in + insamples->nb_samples * 2 - NUMTAPS;
- scalarproduct(in, endin, out);
+ if (2*in->nb_samples >= NUMTAPS ){
+ endin = src + in->nb_samples - NUMTAPS;
+ scalarproduct(src, endin, s->filter[filter_ch], dst);
// save part of input for next round
memcpy(taps, endin, NUMTAPS * sizeof(*taps));
- } else
- memmove(taps, taps + 2*insamples->nb_samples, NUMTAPS * sizeof(*taps));
+ } else {
+ memmove(taps, taps + in->nb_samples, NUMTAPS * sizeof(*taps));
+ }
+}
+
+static void mix(AVFilterContext *ctx, AVFrame *out,
+ int output_ch, int f0, int f1, int i0, int i1)
+{
+ EarwaxContext *s = ctx->priv;
+ const int16_t *srcl = (const int16_t *)s->frame[f0]->data[i0];
+ const int16_t *srcr = (const int16_t *)s->frame[f1]->data[i1];
+ int16_t *dst = (int16_t *)out->data[output_ch];
+
+ for (int n = 0; n < out->nb_samples; n++)
+ dst[n] = av_clip_int16(srcl[n] + srcr[n]);
+}
+
+static int filter_frame(AVFilterLink *inlink, AVFrame *in)
+{
+ AVFilterContext *ctx = inlink->dst;
+ EarwaxContext *s = ctx->priv;
+ AVFilterLink *outlink = ctx->outputs[0];
+ AVFrame *out = ff_get_audio_buffer(outlink, in->nb_samples);
+
+ for (int ch = 0; ch < 2; ch++) {
+ if (!s->frame[ch] || s->frame[ch]->nb_samples < in->nb_samples) {
+ av_frame_free(&s->frame[ch]);
+ s->frame[ch] = ff_get_audio_buffer(outlink, in->nb_samples);
+ if (!s->frame[ch]) {
+ av_frame_free(&in);
+ av_frame_free(&out);
+ return AVERROR(ENOMEM);
+ }
+ }
+ }
+
+ if (!out) {
+ av_frame_free(&in);
+ return AVERROR(ENOMEM);
+ }
+ av_frame_copy_props(out, in);
+
+ convolve(ctx, in, 0, 0, 0, 0);
+ convolve(ctx, in, 0, 1, 1, 1);
+ convolve(ctx, in, 1, 0, 0, 2);
+ convolve(ctx, in, 1, 1, 1, 3);
+
+ mix(ctx, out, 0, 0, 1, 1, 0);
+ mix(ctx, out, 1, 0, 1, 0, 1);
+
+ av_frame_free(&in);
+ return ff_filter_frame(outlink, out);
+}
+
+static av_cold void uninit(AVFilterContext *ctx)
+{
+ EarwaxContext *s = ctx->priv;
- av_frame_free(&insamples);
- return ff_filter_frame(outlink, outsamples);
+ av_frame_free(&s->frame[0]);
+ av_frame_free(&s->frame[1]);
}
static const AVFilterPad earwax_inputs[] = {
@@ -152,6 +218,7 @@ static const AVFilterPad earwax_inputs[] = {
.name = "default",
.type = AVMEDIA_TYPE_AUDIO,
.filter_frame = filter_frame,
+ .config_props = config_input,
},
{ NULL }
};
@@ -169,6 +236,7 @@ AVFilter ff_af_earwax = {
.description = NULL_IF_CONFIG_SMALL("Widen the stereo image."),
.query_formats = query_formats,
.priv_size = sizeof(EarwaxContext),
+ .uninit = uninit,
.inputs = earwax_inputs,
.outputs = earwax_outputs,
};
diff --git a/tests/fate/filter-audio.mak b/tests/fate/filter-audio.mak
index ee1a9dfc97..8b38ee5e75 100644
--- a/tests/fate/filter-audio.mak
+++ b/tests/fate/filter-audio.mak
@@ -112,7 +112,7 @@ fate-filter-dcshift: CMD = framecrc -i $(SRC) -frames:a 20 -af aresample,dcshift
FATE_AFILTER-$(call FILTERDEMDECENCMUX, EARWAX, WAV, PCM_S16LE, PCM_S16LE, WAV) += fate-filter-earwax
fate-filter-earwax: tests/data/asynth-44100-2.wav
fate-filter-earwax: SRC = $(TARGET_PATH)/tests/data/asynth-44100-2.wav
-fate-filter-earwax: CMD = framecrc -i $(SRC) -frames:a 20 -af earwax
+fate-filter-earwax: CMD = framecrc -i $(SRC) -frames:a 20 -af aresample,earwax,aresample
FATE_AFILTER-$(call FILTERDEMDECENCMUX, EXTRASTEREO, WAV, PCM_S16LE, PCM_S16LE, WAV) += fate-filter-extrastereo
fate-filter-extrastereo: tests/data/asynth-44100-2.wav
diff --git a/tests/ref/fate/filter-earwax b/tests/ref/fate/filter-earwax
index 855f579cac..6bfa725b64 100644
--- a/tests/ref/fate/filter-earwax
+++ b/tests/ref/fate/filter-earwax
@@ -4,23 +4,23 @@
#sample_rate 0: 44100
#channel_layout 0: 3
#channel_layout_name 0: stereo
-0, 0, 0, 1024, 4096, 0x900af751
-0, 1024, 1024, 1024, 4096, 0xad570065
-0, 2048, 2048, 1024, 4096, 0x93d5f494
-0, 3072, 3072, 1024, 4096, 0x2c65ef7d
-0, 4096, 4096, 1024, 4096, 0xdc8af6d2
-0, 5120, 5120, 1024, 4096, 0x7ae00249
-0, 6144, 6144, 1024, 4096, 0xaab5fdd0
-0, 7168, 7168, 1024, 4096, 0x4373ef39
-0, 8192, 8192, 1024, 4096, 0x0756eb43
-0, 9216, 9216, 1024, 4096, 0x494d06e0
-0, 10240, 10240, 1024, 4096, 0x4393ffae
-0, 11264, 11264, 1024, 4096, 0x6972f97e
-0, 12288, 12288, 1024, 4096, 0xb834ea05
-0, 13312, 13312, 1024, 4096, 0x39b8f871
-0, 14336, 14336, 1024, 4096, 0xf032fccd
-0, 15360, 15360, 1024, 4096, 0xefcd0709
-0, 16384, 16384, 1024, 4096, 0x0590ebc0
-0, 17408, 17408, 1024, 4096, 0x2e75f264
-0, 18432, 18432, 1024, 4096, 0xbea1fd03
-0, 19456, 19456, 1024, 4096, 0x9bbe0434
+0, 0, 0, 1024, 4096, 0xb7e1f437
+0, 1024, 1024, 1024, 4096, 0xa031042a
+0, 2048, 2048, 1024, 4096, 0x9b72ed0f
+0, 3072, 3072, 1024, 4096, 0xff14ed33
+0, 4096, 4096, 1024, 4096, 0x96eef519
+0, 5120, 5120, 1024, 4096, 0x290d0ca0
+0, 6144, 6144, 1024, 4096, 0x0393fbf5
+0, 7168, 7168, 1024, 4096, 0xed89ef59
+0, 8192, 8192, 1024, 4096, 0xf664e969
+0, 9216, 9216, 1024, 4096, 0x261a05e4
+0, 10240, 10240, 1024, 4096, 0xc334ff5b
+0, 11264, 11264, 1024, 4096, 0x030ffa65
+0, 12288, 12288, 1024, 4096, 0xcfb4e835
+0, 13312, 13312, 1024, 4096, 0xd9adf7ff
+0, 14336, 14336, 1024, 4096, 0x5e9001ae
+0, 15360, 15360, 1024, 4096, 0xbfaf0174
+0, 16384, 16384, 1024, 4096, 0x8cf3f061
+0, 17408, 17408, 1024, 4096, 0x35ffece5
+0, 18432, 18432, 1024, 4096, 0x1de801e2
+0, 19456, 19456, 1024, 4096, 0xa1a40372
More information about the ffmpeg-cvslog
mailing list