FFmpeg
af_anlms.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2019 Paul B Mahol
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
22 #include "libavutil/common.h"
23 #include "libavutil/float_dsp.h"
24 #include "libavutil/opt.h"
25 
26 #include "audio.h"
27 #include "avfilter.h"
28 #include "filters.h"
29 #include "internal.h"
30 
/* Selects which signal process_sample() returns; used by the "out_mode" option. */
enum OutModes {
    IN_MODE,        /* pass the first input through unchanged */
    DESIRED_MODE,   /* pass the "desired" input through unchanged */
    OUT_MODE,       /* desired minus the adaptive FIR output */
    NOISE_MODE,     /* input minus the adaptive FIR output */
    ERROR_MODE,     /* the adaptive FIR output itself is returned as-is */
    NB_OMODES       /* number of modes; upper bound for the option range */
};
39 
40 typedef struct AudioNLMSContext {
41  const AVClass *class;
42 
43  int order;
44  float mu;
45  float eps;
46  float leakage;
48 
54 
56 
57  int anlmf;
58 
61 
62 #define OFFSET(x) offsetof(AudioNLMSContext, x)
63 #define A AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM
64 #define AT AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_RUNTIME_PARAM
65 
66 static const AVOption anlms_options[] = {
67  { "order", "set the filter order", OFFSET(order), AV_OPT_TYPE_INT, {.i64=256}, 1, INT16_MAX, A },
68  { "mu", "set the filter mu", OFFSET(mu), AV_OPT_TYPE_FLOAT, {.dbl=0.75}, 0, 2, AT },
69  { "eps", "set the filter eps", OFFSET(eps), AV_OPT_TYPE_FLOAT, {.dbl=1}, 0, 1, AT },
70  { "leakage", "set the filter leakage", OFFSET(leakage), AV_OPT_TYPE_FLOAT, {.dbl=0}, 0, 1, AT },
71  { "out_mode", "set output mode", OFFSET(output_mode), AV_OPT_TYPE_INT, {.i64=OUT_MODE}, 0, NB_OMODES-1, AT, "mode" },
72  { "i", "input", 0, AV_OPT_TYPE_CONST, {.i64=IN_MODE}, 0, 0, AT, "mode" },
73  { "d", "desired", 0, AV_OPT_TYPE_CONST, {.i64=DESIRED_MODE}, 0, 0, AT, "mode" },
74  { "o", "output", 0, AV_OPT_TYPE_CONST, {.i64=OUT_MODE}, 0, 0, AT, "mode" },
75  { "n", "noise", 0, AV_OPT_TYPE_CONST, {.i64=NOISE_MODE}, 0, 0, AT, "mode" },
76  { "e", "error", 0, AV_OPT_TYPE_CONST, {.i64=ERROR_MODE}, 0, 0, AT, "mode" },
77  { NULL }
78 };
79 
80 AVFILTER_DEFINE_CLASS_EXT(anlms, "anlm(f|s)", anlms_options);
81 
82 static float fir_sample(AudioNLMSContext *s, float sample, float *delay,
83  float *coeffs, float *tmp, int *offset)
84 {
85  const int order = s->order;
86  float output;
87 
88  delay[*offset] = sample;
89 
90  memcpy(tmp, coeffs + order - *offset, order * sizeof(float));
91 
92  output = s->fdsp->scalarproduct_float(delay, tmp, s->kernel_size);
93 
94  if (--(*offset) < 0)
95  *offset = order - 1;
96 
97  return output;
98 }
99 
100 static float process_sample(AudioNLMSContext *s, float input, float desired,
101  float *delay, float *coeffs, float *tmp, int *offsetp)
102 {
103  const int order = s->order;
104  const float leakage = s->leakage;
105  const float mu = s->mu;
106  const float a = 1.f - leakage;
107  float sum, output, e, norm, b;
108  int offset = *offsetp;
109 
110  delay[offset + order] = input;
111 
112  output = fir_sample(s, input, delay, coeffs, tmp, offsetp);
113  e = desired - output;
114 
115  sum = s->fdsp->scalarproduct_float(delay, delay, s->kernel_size);
116 
117  norm = s->eps + sum;
118  b = mu * e / norm;
119  if (s->anlmf)
120  b *= e * e;
121 
122  memcpy(tmp, delay + offset, order * sizeof(float));
123 
124  s->fdsp->vector_fmul_scalar(coeffs, coeffs, a, s->kernel_size);
125 
126  s->fdsp->vector_fmac_scalar(coeffs, tmp, b, s->kernel_size);
127 
128  memcpy(coeffs + order, coeffs, order * sizeof(float));
129 
130  switch (s->output_mode) {
131  case IN_MODE: output = input; break;
132  case DESIRED_MODE: output = desired; break;
133  case OUT_MODE: output = desired - output; break;
134  case NOISE_MODE: output = input - output; break;
135  case ERROR_MODE: break;
136  }
137  return output;
138 }
139 
140 static int process_channels(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
141 {
142  AudioNLMSContext *s = ctx->priv;
143  AVFrame *out = arg;
144  const int start = (out->ch_layout.nb_channels * jobnr) / nb_jobs;
145  const int end = (out->ch_layout.nb_channels * (jobnr+1)) / nb_jobs;
146 
147  for (int c = start; c < end; c++) {
148  const float *input = (const float *)s->frame[0]->extended_data[c];
149  const float *desired = (const float *)s->frame[1]->extended_data[c];
150  float *delay = (float *)s->delay->extended_data[c];
151  float *coeffs = (float *)s->coeffs->extended_data[c];
152  float *tmp = (float *)s->tmp->extended_data[c];
153  int *offset = (int *)s->offset->extended_data[c];
154  float *output = (float *)out->extended_data[c];
155 
156  for (int n = 0; n < out->nb_samples; n++) {
157  output[n] = process_sample(s, input[n], desired[n], delay, coeffs, tmp, offset);
158  if (ctx->is_disabled)
159  output[n] = input[n];
160  }
161  }
162 
163  return 0;
164 }
165 
167 {
168  AudioNLMSContext *s = ctx->priv;
169  int i, ret, status;
170  int nb_samples;
171  int64_t pts;
172 
174 
175  nb_samples = FFMIN(ff_inlink_queued_samples(ctx->inputs[0]),
176  ff_inlink_queued_samples(ctx->inputs[1]));
177  for (i = 0; i < ctx->nb_inputs && nb_samples > 0; i++) {
178  if (s->frame[i])
179  continue;
180 
181  if (ff_inlink_check_available_samples(ctx->inputs[i], nb_samples) > 0) {
182  ret = ff_inlink_consume_samples(ctx->inputs[i], nb_samples, nb_samples, &s->frame[i]);
183  if (ret < 0)
184  return ret;
185  }
186  }
187 
188  if (s->frame[0] && s->frame[1]) {
189  AVFrame *out;
190 
191  out = ff_get_audio_buffer(ctx->outputs[0], s->frame[0]->nb_samples);
192  if (!out) {
193  av_frame_free(&s->frame[0]);
194  av_frame_free(&s->frame[1]);
195  return AVERROR(ENOMEM);
196  }
197 
199  FFMIN(ctx->outputs[0]->ch_layout.nb_channels, ff_filter_get_nb_threads(ctx)));
200 
201  out->pts = s->frame[0]->pts;
202 
203  av_frame_free(&s->frame[0]);
204  av_frame_free(&s->frame[1]);
205 
206  ret = ff_filter_frame(ctx->outputs[0], out);
207  if (ret < 0)
208  return ret;
209  }
210 
211  if (!nb_samples) {
212  for (i = 0; i < 2; i++) {
213  if (ff_inlink_acknowledge_status(ctx->inputs[i], &status, &pts)) {
214  ff_outlink_set_status(ctx->outputs[0], status, pts);
215  return 0;
216  }
217  }
218  }
219 
220  if (ff_outlink_frame_wanted(ctx->outputs[0])) {
221  for (i = 0; i < 2; i++) {
222  if (ff_inlink_queued_samples(ctx->inputs[i]) > 0)
223  continue;
224  ff_inlink_request_frame(ctx->inputs[i]);
225  return 0;
226  }
227  }
228  return 0;
229 }
230 
231 static int config_output(AVFilterLink *outlink)
232 {
233  AVFilterContext *ctx = outlink->src;
234  AudioNLMSContext *s = ctx->priv;
235 
236  s->anlmf = !strcmp(ctx->filter->name, "anlmf");
237  s->kernel_size = FFALIGN(s->order, 16);
238 
239  if (!s->offset)
240  s->offset = ff_get_audio_buffer(outlink, 1);
241  if (!s->delay)
242  s->delay = ff_get_audio_buffer(outlink, 2 * s->kernel_size);
243  if (!s->coeffs)
244  s->coeffs = ff_get_audio_buffer(outlink, 2 * s->kernel_size);
245  if (!s->tmp)
246  s->tmp = ff_get_audio_buffer(outlink, s->kernel_size);
247  if (!s->delay || !s->coeffs || !s->offset || !s->tmp)
248  return AVERROR(ENOMEM);
249 
250  return 0;
251 }
252 
254 {
255  AudioNLMSContext *s = ctx->priv;
256 
257  s->fdsp = avpriv_float_dsp_alloc(0);
258  if (!s->fdsp)
259  return AVERROR(ENOMEM);
260 
261  return 0;
262 }
263 
265 {
266  AudioNLMSContext *s = ctx->priv;
267 
268  av_freep(&s->fdsp);
269  av_frame_free(&s->delay);
270  av_frame_free(&s->coeffs);
271  av_frame_free(&s->offset);
272  av_frame_free(&s->tmp);
273 }
274 
275 static const AVFilterPad inputs[] = {
276  {
277  .name = "input",
278  .type = AVMEDIA_TYPE_AUDIO,
279  },
280  {
281  .name = "desired",
282  .type = AVMEDIA_TYPE_AUDIO,
283  },
284 };
285 
286 static const AVFilterPad outputs[] = {
287  {
288  .name = "default",
289  .type = AVMEDIA_TYPE_AUDIO,
290  .config_props = config_output,
291  },
292 };
293 
295  .name = "anlms",
296  .description = NULL_IF_CONFIG_SMALL("Apply Normalized Least-Mean-Squares algorithm to first audio stream."),
297  .priv_size = sizeof(AudioNLMSContext),
298  .priv_class = &anlms_class,
299  .init = init,
300  .uninit = uninit,
301  .activate = activate,
307  .process_command = ff_filter_process_command,
308 };
309 
311  .name = "anlmf",
312  .description = NULL_IF_CONFIG_SMALL("Apply Normalized Least-Mean-Fourth algorithm to first audio stream."),
313  .priv_size = sizeof(AudioNLMSContext),
314  .priv_class = &anlms_class,
315  .init = init,
316  .uninit = uninit,
317  .activate = activate,
323  .process_command = ff_filter_process_command,
324 };
ff_get_audio_buffer
AVFrame * ff_get_audio_buffer(AVFilterLink *link, int nb_samples)
Request an audio samples buffer with a specific set of permissions.
Definition: audio.c:107
AV_SAMPLE_FMT_FLTP
@ AV_SAMPLE_FMT_FLTP
float, planar
Definition: samplefmt.h:66
process_sample
static float process_sample(AudioNLMSContext *s, float input, float desired, float *delay, float *coeffs, float *tmp, int *offsetp)
Definition: af_anlms.c:100
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
out
FILE * out
Definition: movenc.c:54
ff_filter_frame
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
Definition: avfilter.c:978
FILTER_SINGLE_SAMPLEFMT
#define FILTER_SINGLE_SAMPLEFMT(sample_fmt_)
Definition: internal.h:185
output
filter_frame For filters that do not use the this method is called when a frame is pushed to the filter s input It can be called at any time except in a reentrant way If the input frame is enough to produce output
Definition: filter_design.txt:225
av_frame_free
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
Definition: frame.c:100
AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:340
tmp
static uint8_t tmp[11]
Definition: aes_ctr.c:28
AVOption
AVOption.
Definition: opt.h:251
b
#define b
Definition: input.c:41
OUT_MODE
@ OUT_MODE
Definition: af_anlms.c:34
AudioNLMSContext::mu
float mu
Definition: af_anlms.c:44
init
static av_cold int init(AVFilterContext *ctx)
Definition: af_anlms.c:253
AVFilter::name
const char * name
Filter name.
Definition: avfilter.h:170
IN_MODE
@ IN_MODE
Definition: af_anlms.c:32
ff_af_anlms
const AVFilter ff_af_anlms
Definition: af_anlms.c:294
FF_FILTER_FORWARD_STATUS_BACK_ALL
#define FF_FILTER_FORWARD_STATUS_BACK_ALL(outlink, filter)
Forward the status on an output link to all input links.
Definition: filters.h:212
AudioNLMSContext::fdsp
AVFloatDSPContext * fdsp
Definition: af_anlms.c:59
anlms_options
static const AVOption anlms_options[]
Definition: af_anlms.c:66
pts
static int64_t pts
Definition: transcode_aac.c:643
AVFilterPad
A filter pad used for either input or output.
Definition: internal.h:47
OFFSET
#define OFFSET(x)
Definition: af_anlms.c:62
ff_inlink_check_available_samples
int ff_inlink_check_available_samples(AVFilterLink *link, unsigned min)
Test if enough samples are available on the link.
Definition: avfilter.c:1367
av_cold
#define av_cold
Definition: attributes.h:90
AudioNLMSContext::offset
AVFrame * offset
Definition: af_anlms.c:50
DESIRED_MODE
@ DESIRED_MODE
Definition: af_anlms.c:33
ff_outlink_set_status
static void ff_outlink_set_status(AVFilterLink *link, int status, int64_t pts)
Set the status field of a link from the source filter.
Definition: filters.h:189
ff_inlink_request_frame
void ff_inlink_request_frame(AVFilterLink *link)
Mark that a frame is wanted on the link.
Definition: avfilter.c:1506
AudioNLMSContext::tmp
AVFrame * tmp
Definition: af_anlms.c:53
s
#define s(width, name)
Definition: cbs_vp9.c:198
AudioNLMSContext::frame
AVFrame * frame[2]
Definition: af_anlms.c:55
AudioNLMSContext::kernel_size
int kernel_size
Definition: af_anlms.c:49
AVMEDIA_TYPE_AUDIO
@ AVMEDIA_TYPE_AUDIO
Definition: avutil.h:202
filters.h
ctx
AVFormatContext * ctx
Definition: movenc.c:48
AudioNLMSContext::leakage
float leakage
Definition: af_anlms.c:46
FILTER_INPUTS
#define FILTER_INPUTS(array)
Definition: internal.h:192
arg
const char * arg
Definition: jacosubdec.c:67
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:66
ff_inlink_consume_samples
int ff_inlink_consume_samples(AVFilterLink *link, unsigned min, unsigned max, AVFrame **rframe)
Take samples from the link's FIFO and update the link's stats.
Definition: avfilter.c:1402
NULL
#define NULL
Definition: coverity.c:32
uninit
static av_cold void uninit(AVFilterContext *ctx)
Definition: af_anlms.c:264
AudioNLMSContext::anlmf
int anlmf
Definition: af_anlms.c:57
AudioNLMSContext::eps
float eps
Definition: af_anlms.c:45
ff_inlink_acknowledge_status
int ff_inlink_acknowledge_status(AVFilterLink *link, int *rstatus, int64_t *rpts)
Test and acknowledge the change of status on the link.
Definition: avfilter.c:1337
c
Undefined Behavior In the C some operations are like signed integer dereferencing freed accessing outside allocated Undefined Behavior must not occur in a C it is not safe even if the output of undefined operations is unused The unsafety may seem nit picking but Optimizing compilers have in fact optimized code on the assumption that no undefined Behavior occurs Optimizing code based on wrong assumptions can and has in some cases lead to effects beyond the output of computations The signed integer overflow problem in speed critical code Code which is highly optimized and works with signed integers sometimes has the problem that often the output of the computation does not c
Definition: undefined.txt:32
float_dsp.h
OutModes
OutModes
Definition: af_afftdn.c:42
ff_af_anlmf
const AVFilter ff_af_anlmf
Definition: af_anlms.c:310
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:106
for
for(k=2;k<=8;++k)
Definition: h264pred_template.c:425
sample
#define sample
Definition: flacdsp_template.c:44
AVFloatDSPContext
Definition: float_dsp.h:24
ff_filter_process_command
int ff_filter_process_command(AVFilterContext *ctx, const char *cmd, const char *arg, char *res, int res_len, int flags)
Generic processing of user supplied commands that are set in the same way as the filter options.
Definition: avfilter.c:851
AudioNLMSContext::coeffs
AVFrame * coeffs
Definition: af_anlms.c:52
a
The reader does not expect b to be semantically here and if the code is changed by maybe adding a a division or other the signedness will almost certainly be mistaken To avoid this confusion a new type was SUINT is the C unsigned type but it holds a signed int to use the same example SUINT a
Definition: undefined.txt:41
offset
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf offset
Definition: writing_filters.txt:86
NB_OMODES
@ NB_OMODES
Definition: af_anlms.c:37
input
and forward the test the status of outputs and forward it to the corresponding return FFERROR_NOT_READY If the filters stores internally one or a few frame for some input
Definition: filter_design.txt:172
internal.h
AV_OPT_TYPE_FLOAT
@ AV_OPT_TYPE_FLOAT
Definition: opt.h:228
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:255
AudioNLMSContext::order
int order
Definition: af_anlms.c:43
activate
static int activate(AVFilterContext *ctx)
Definition: af_anlms.c:166
common.h
ff_filter_get_nb_threads
int ff_filter_get_nb_threads(AVFilterContext *ctx)
Get number of threads for current filter instance.
Definition: avfilter.c:786
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
AudioNLMSContext::output_mode
int output_mode
Definition: af_anlms.c:47
AVFilterPad::name
const char * name
Pad name.
Definition: internal.h:53
ff_inlink_queued_samples
int ff_inlink_queued_samples(AVFilterLink *link)
Definition: avfilter.c:1362
AVFilter
Filter definition.
Definition: avfilter.h:166
ret
ret
Definition: filter_design.txt:187
fir_sample
static float fir_sample(AudioNLMSContext *s, float sample, float *delay, float *coeffs, float *tmp, int *offset)
Definition: af_anlms.c:82
ERROR_MODE
@ ERROR_MODE
Definition: af_anlms.c:36
NOISE_MODE
@ NOISE_MODE
Definition: af_anlms.c:35
AudioNLMSContext
Definition: af_anlms.c:40
AudioNLMSContext::delay
AVFrame * delay
Definition: af_anlms.c:51
status
ov_status_e status
Definition: dnn_backend_openvino.c:119
channel_layout.h
inputs
static const AVFilterPad inputs[]
Definition: af_anlms.c:275
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Definition: opt.h:225
avfilter.h
A
#define A
Definition: af_anlms.c:63
AVFILTER_DEFINE_CLASS_EXT
AVFILTER_DEFINE_CLASS_EXT(anlms, "anlm(f|s)", anlms_options)
config_output
static int config_output(AVFilterLink *outlink)
Definition: af_anlms.c:231
process_channels
static int process_channels(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
Definition: af_anlms.c:140
AVFilterContext
An instance of a filter.
Definition: avfilter.h:397
AVFILTER_FLAG_SLICE_THREADS
#define AVFILTER_FLAG_SLICE_THREADS
The filter supports multithreading by splitting frames into multiple parts and processing them concur...
Definition: avfilter.h:117
audio.h
FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:78
FILTER_OUTPUTS
#define FILTER_OUTPUTS(array)
Definition: internal.h:193
av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:34
avpriv_float_dsp_alloc
av_cold AVFloatDSPContext * avpriv_float_dsp_alloc(int bit_exact)
Allocate a float DSP context.
Definition: float_dsp.c:135
AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
#define AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
Same as AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC, except that the filter will have its filter_frame() c...
Definition: avfilter.h:155
outputs
static const AVFilterPad outputs[]
Definition: af_anlms.c:286
ff_outlink_frame_wanted
the definition of that something depends on the semantic of the filter The callback must examine the status of the filter s links and proceed accordingly The status of output links is stored in the status_in and status_out fields and tested by the ff_outlink_frame_wanted() function. If this function returns true
AT
#define AT
Definition: af_anlms.c:64
ff_filter_execute
static av_always_inline int ff_filter_execute(AVFilterContext *ctx, avfilter_action_func *func, void *arg, int *ret, int nb_jobs)
Definition: internal.h:144
AV_OPT_TYPE_CONST
@ AV_OPT_TYPE_CONST
Definition: opt.h:234