af_silenceremove.c
/*
 * Copyright (c) 2001 Heikki Leinonen
 * Copyright (c) 2001 Chris Bagwell
 * Copyright (c) 2003 Donnie Smith
 * Copyright (c) 2014 Paul B Mahol
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include <float.h> /* DBL_MAX */

#include "libavutil/opt.h"
#include "libavutil/timestamp.h"
#include "audio.h"
#include "formats.h"
#include "avfilter.h"
#include "internal.h"
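/*
 * Overview: the filter runs a small state machine (see SilenceMode below).
 * In SILENCE_TRIM it drops leading audio until "start_periods" bursts of
 * non-silence have been seen; candidate non-silent samples are parked in
 * start_holdoff (and, optionally, some preceding silence in
 * start_silence_hold) so they can be replayed once the trim decision is
 * made. SILENCE_COPY then passes audio through while watching for trailing
 * silence, using the symmetric stop_* buffers. Loudness is measured over a
 * short sliding window, either as a mean of absolute values (peak) or as RMS.
 */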
enum SilenceDetect {
    D_PEAK,
    D_RMS,
};

enum ThresholdMode {
    T_ANY,
    T_ALL,
};

enum SilenceMode {
    SILENCE_TRIM,
    SILENCE_TRIM_FLUSH,
    SILENCE_COPY,
    SILENCE_COPY_FLUSH,
    SILENCE_STOP
};

typedef struct SilenceRemoveContext {
    const AVClass *class;

    enum SilenceMode mode;

    int start_periods;
    int64_t start_duration;
    int64_t start_duration_opt;
    double start_threshold;
    int64_t start_silence;
    int64_t start_silence_opt;
    int start_mode;

    int stop_periods;
    int64_t stop_duration;
    int64_t stop_duration_opt;
    double stop_threshold;
    int64_t stop_silence;
    int64_t stop_silence_opt;
    int stop_mode;

    double *start_holdoff;
    double *start_silence_hold;
    size_t start_holdoff_offset;
    size_t start_holdoff_end;
    size_t start_silence_offset;
    size_t start_silence_end;
    int start_found_periods;

    double *stop_holdoff;
    double *stop_silence_hold;
    size_t stop_holdoff_offset;
    size_t stop_holdoff_end;
    size_t stop_silence_offset;
    size_t stop_silence_end;
    int stop_found_periods;

    double window_ratio;
    double *window;
    double *window_current;
    double *window_end;
    int window_size;
    double sum;

    int restart;
    int64_t next_pts;

    int detection;
    void (*update)(struct SilenceRemoveContext *s, double sample);
    double(*compute)(struct SilenceRemoveContext *s, double sample);
} SilenceRemoveContext;
#define OFFSET(x) offsetof(SilenceRemoveContext, x)
#define AF AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_AUDIO_PARAM

static const AVOption silenceremove_options[] = {
    { "start_periods",   NULL,                                                 OFFSET(start_periods),      AV_OPT_TYPE_INT,      {.i64=0},      0,      9000, AF },
    { "start_duration",  "set start duration of non-silence part",             OFFSET(start_duration_opt), AV_OPT_TYPE_DURATION, {.i64=0},      0, INT32_MAX, AF },
    { "start_threshold", "set threshold for start silence detection",          OFFSET(start_threshold),    AV_OPT_TYPE_DOUBLE,   {.dbl=0},      0,   DBL_MAX, AF },
    { "start_silence",   "set start duration of silence part to keep",         OFFSET(start_silence_opt),  AV_OPT_TYPE_DURATION, {.i64=0},      0, INT32_MAX, AF },
    { "start_mode",      "set which channel will trigger trimming from start", OFFSET(start_mode),         AV_OPT_TYPE_INT,      {.i64=T_ANY},  T_ANY, T_ALL, AF, "mode" },
    {   "any",           0,                                                    0,                          AV_OPT_TYPE_CONST,    {.i64=T_ANY},  0,         0, AF, "mode" },
    {   "all",           0,                                                    0,                          AV_OPT_TYPE_CONST,    {.i64=T_ALL},  0,         0, AF, "mode" },
    { "stop_periods",    NULL,                                                 OFFSET(stop_periods),       AV_OPT_TYPE_INT,      {.i64=0},  -9000,      9000, AF },
    { "stop_duration",   "set stop duration of non-silence part",              OFFSET(stop_duration_opt),  AV_OPT_TYPE_DURATION, {.i64=0},      0, INT32_MAX, AF },
    { "stop_threshold",  "set threshold for stop silence detection",           OFFSET(stop_threshold),     AV_OPT_TYPE_DOUBLE,   {.dbl=0},      0,   DBL_MAX, AF },
    { "stop_silence",    "set stop duration of silence part to keep",          OFFSET(stop_silence_opt),   AV_OPT_TYPE_DURATION, {.i64=0},      0, INT32_MAX, AF },
    { "stop_mode",       "set which channel will trigger trimming from end",   OFFSET(stop_mode),          AV_OPT_TYPE_INT,      {.i64=T_ANY},  T_ANY, T_ALL, AF, "mode" },
    { "detection",       "set how silence is detected",                        OFFSET(detection),          AV_OPT_TYPE_INT,      {.i64=D_RMS},  D_PEAK, D_RMS, AF, "detection" },
    {   "peak",          "use absolute values of samples",                     0,                          AV_OPT_TYPE_CONST,    {.i64=D_PEAK}, 0,         0, AF, "detection" },
    {   "rms",           "use squared values of samples",                      0,                          AV_OPT_TYPE_CONST,    {.i64=D_RMS},  0,         0, AF, "detection" },
    { "window",          "set duration of window in seconds",                  OFFSET(window_ratio),       AV_OPT_TYPE_DOUBLE,   {.dbl=0.02},   0,        10, AF },
    { NULL }
};

AVFILTER_DEFINE_CLASS(silenceremove);
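/*
 * compute_peak()/compute_rms() return what the windowed measure would be if
 * "sample" replaced the oldest entry of the sliding window, without touching
 * any state; update_peak()/update_rms() actually commit the sample into the
 * circular window buffer and the running sum.
 */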
static double compute_peak(SilenceRemoveContext *s, double sample)
{
    double new_sum;

    new_sum  = s->sum;
    new_sum -= *s->window_current;
    new_sum += fabs(sample);

    return new_sum / s->window_size;
}

static void update_peak(SilenceRemoveContext *s, double sample)
{
    s->sum -= *s->window_current;
    *s->window_current = fabs(sample);
    s->sum += *s->window_current;

    s->window_current++;
    if (s->window_current >= s->window_end)
        s->window_current = s->window;
}

static double compute_rms(SilenceRemoveContext *s, double sample)
{
    double new_sum;

    new_sum  = s->sum;
    new_sum -= *s->window_current;
    new_sum += sample * sample;

    return sqrt(new_sum / s->window_size);
}

static void update_rms(SilenceRemoveContext *s, double sample)
{
    s->sum -= *s->window_current;
    *s->window_current = sample * sample;
    s->sum += *s->window_current;

    s->window_current++;
    if (s->window_current >= s->window_end)
        s->window_current = s->window;
}

static av_cold int init(AVFilterContext *ctx)
{
    SilenceRemoveContext *s = ctx->priv;

    if (s->stop_periods < 0) {
        s->stop_periods = -s->stop_periods;
        s->restart = 1;
    }

    switch (s->detection) {
    case D_PEAK:
        s->update = update_peak;
        s->compute = compute_peak;
        break;
    case D_RMS:
        s->update = update_rms;
        s->compute = compute_rms;
        break;
    }

    return 0;
}

static void clear_window(SilenceRemoveContext *s)
{
    memset(s->window, 0, s->window_size * sizeof(*s->window));

    s->window_current = s->window;
    s->window_end = s->window + s->window_size;
    s->sum = 0;
}
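/*
 * Per-link configuration: the duration options are converted from
 * AV_TIME_BASE units to per-channel sample counts at the link sample rate,
 * and the holdoff/silence ring buffers are sized for interleaved samples
 * (count times channel count). The sliding window is sized from the
 * "window" option in the same interleaved layout.
 */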
static int config_input(AVFilterLink *inlink)
{
    AVFilterContext *ctx = inlink->dst;
    SilenceRemoveContext *s = ctx->priv;

    s->window_size = FFMAX((inlink->sample_rate * s->window_ratio), 1) * inlink->channels;
    s->window = av_malloc_array(s->window_size, sizeof(*s->window));
    if (!s->window)
        return AVERROR(ENOMEM);

    clear_window(s);

    s->start_duration = av_rescale(s->start_duration_opt, inlink->sample_rate,
                                   AV_TIME_BASE);
    s->start_silence  = av_rescale(s->start_silence_opt, inlink->sample_rate,
                                   AV_TIME_BASE);
    s->stop_duration  = av_rescale(s->stop_duration_opt, inlink->sample_rate,
                                   AV_TIME_BASE);
    s->stop_silence   = av_rescale(s->stop_silence_opt, inlink->sample_rate,
                                   AV_TIME_BASE);

    s->start_holdoff = av_malloc_array(FFMAX(s->start_duration, 1),
                                       sizeof(*s->start_holdoff) *
                                       inlink->channels);
    if (!s->start_holdoff)
        return AVERROR(ENOMEM);

    s->start_silence_hold = av_malloc_array(FFMAX(s->start_silence, 1),
                                            sizeof(*s->start_silence_hold) *
                                            inlink->channels);
    if (!s->start_silence_hold)
        return AVERROR(ENOMEM);

    s->start_holdoff_offset = 0;
    s->start_holdoff_end = 0;
    s->start_found_periods = 0;

    s->stop_holdoff = av_malloc_array(FFMAX(s->stop_duration, 1),
                                      sizeof(*s->stop_holdoff) *
                                      inlink->channels);
    if (!s->stop_holdoff)
        return AVERROR(ENOMEM);

    s->stop_silence_hold = av_malloc_array(FFMAX(s->stop_silence, 1),
                                           sizeof(*s->stop_silence_hold) *
                                           inlink->channels);
    if (!s->stop_silence_hold)
        return AVERROR(ENOMEM);

    s->stop_holdoff_offset = 0;
    s->stop_holdoff_end = 0;
    s->stop_found_periods = 0;

    if (s->start_periods)
        s->mode = SILENCE_TRIM;
    else
        s->mode = SILENCE_COPY;

    return 0;
}

static void flush(SilenceRemoveContext *s,
                  AVFrame *out, AVFilterLink *outlink,
                  int *nb_samples_written, int *ret, int flush_silence)
{
    AVFrame *silence;

    if (*nb_samples_written) {
        out->nb_samples = *nb_samples_written / outlink->channels;

        out->pts = s->next_pts;
        s->next_pts += av_rescale_q(out->nb_samples,
                                    (AVRational){1, outlink->sample_rate},
                                    outlink->time_base);

        *ret = ff_filter_frame(outlink, out);
        if (*ret < 0)
            return;
        *nb_samples_written = 0;
    } else {
        av_frame_free(&out);
    }

    if (s->stop_silence_end <= 0 || !flush_silence)
        return;

    silence = ff_get_audio_buffer(outlink, s->stop_silence_end / outlink->channels);
    if (!silence) {
        *ret = AVERROR(ENOMEM);
        return;
    }

    if (s->stop_silence_offset < s->stop_silence_end) {
        memcpy(silence->data[0],
               &s->stop_silence_hold[s->stop_silence_offset],
               (s->stop_silence_end - s->stop_silence_offset) * sizeof(double));
    }

    if (s->stop_silence_offset > 0) {
        memcpy(silence->data[0] + (s->stop_silence_end - s->stop_silence_offset) * sizeof(double),
               &s->stop_silence_hold[0],
               s->stop_silence_offset * sizeof(double));
    }

    s->stop_silence_offset = 0;
    s->stop_silence_end = 0;

    silence->pts = s->next_pts;
    s->next_pts += av_rescale_q(silence->nb_samples,
                                (AVRational){1, outlink->sample_rate},
                                outlink->time_base);

    *ret = ff_filter_frame(outlink, silence);
}
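/*
 * filter_frame() is driven by s->mode:
 *   SILENCE_TRIM       - drop leading audio, buffering candidate non-silence
 *   SILENCE_TRIM_FLUSH - replay the kept silence and the buffered non-silence
 *   SILENCE_COPY       - pass audio through, watching for trailing silence
 *   SILENCE_COPY_FLUSH - flush held-off samples that should not be removed
 *   SILENCE_STOP       - everything after the detected stop point is dropped
 * The goto labels allow a single input frame to be processed across mode
 * changes.
 */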
static int filter_frame(AVFilterLink *inlink, AVFrame *in)
{
    AVFilterContext *ctx = inlink->dst;
    AVFilterLink *outlink = ctx->outputs[0];
    SilenceRemoveContext *s = ctx->priv;
    int i, j, threshold, ret = 0;
    int nbs, nb_samples_read, nb_samples_written;
    double *obuf, *ibuf = (double *)in->data[0];
    AVFrame *out;

    nb_samples_read = nb_samples_written = 0;

    switch (s->mode) {
    case SILENCE_TRIM:
silence_trim:
        nbs = in->nb_samples - nb_samples_read / outlink->channels;
        if (!nbs)
            break;

        for (i = 0; i < nbs; i++) {
            if (s->start_mode == T_ANY) {
                threshold = 0;
                for (j = 0; j < outlink->channels; j++) {
                    threshold |= s->compute(s, ibuf[j]) > s->start_threshold;
                }
            } else {
                threshold = 1;
                for (j = 0; j < outlink->channels; j++) {
                    threshold &= s->compute(s, ibuf[j]) > s->start_threshold;
                }
            }

            if (threshold) {
                for (j = 0; j < outlink->channels; j++) {
                    s->update(s, *ibuf);
                    s->start_holdoff[s->start_holdoff_end++] = *ibuf++;
                }
                nb_samples_read += outlink->channels;

                if (s->start_holdoff_end >= s->start_duration * outlink->channels) {
                    if (++s->start_found_periods >= s->start_periods) {
                        s->mode = SILENCE_TRIM_FLUSH;
                        goto silence_trim_flush;
                    }

                    s->start_holdoff_offset = 0;
                    s->start_holdoff_end = 0;
                    s->start_silence_offset = 0;
                    s->start_silence_end = 0;
                }
            } else {
                s->start_holdoff_end = 0;

                for (j = 0; j < outlink->channels; j++) {
                    s->update(s, ibuf[j]);
                    if (s->start_silence) {
                        s->start_silence_hold[s->start_silence_offset++] = ibuf[j];
                        s->start_silence_end = FFMIN(s->start_silence_end + 1, outlink->channels * s->start_silence);
                        if (s->start_silence_offset >= outlink->channels * s->start_silence) {
                            s->start_silence_offset = 0;
                        }
                    }
                }

                ibuf += outlink->channels;
                nb_samples_read += outlink->channels;
            }
        }
        break;

    case SILENCE_TRIM_FLUSH:
silence_trim_flush:
        nbs  = s->start_holdoff_end - s->start_holdoff_offset;
        nbs -= nbs % outlink->channels;
        if (!nbs)
            break;

        out = ff_get_audio_buffer(outlink, nbs / outlink->channels + s->start_silence_end / outlink->channels);
        if (!out) {
            av_frame_free(&in);
            return AVERROR(ENOMEM);
        }

        if (s->start_silence_end > 0) {
            if (s->start_silence_offset < s->start_silence_end) {
                memcpy(out->data[0],
                       &s->start_silence_hold[s->start_silence_offset],
                       (s->start_silence_end - s->start_silence_offset) * sizeof(double));
            }

            if (s->start_silence_offset > 0) {
                memcpy(out->data[0] + (s->start_silence_end - s->start_silence_offset) * sizeof(double),
                       &s->start_silence_hold[0],
                       s->start_silence_offset * sizeof(double));
            }
        }

        memcpy(out->data[0] + s->start_silence_end * sizeof(double),
               &s->start_holdoff[s->start_holdoff_offset],
               nbs * sizeof(double));

        out->pts = s->next_pts;
        s->next_pts += av_rescale_q(out->nb_samples,
                                    (AVRational){1, outlink->sample_rate},
                                    outlink->time_base);

        s->start_holdoff_offset += nbs;

        ret = ff_filter_frame(outlink, out);

        if (s->start_holdoff_offset == s->start_holdoff_end) {
            s->start_holdoff_offset = 0;
            s->start_holdoff_end = 0;
            s->start_silence_offset = 0;
            s->start_silence_end = 0;
            s->mode = SILENCE_COPY;
            goto silence_copy;
        }
        break;

    case SILENCE_COPY:
silence_copy:
        nbs = in->nb_samples - nb_samples_read / outlink->channels;
        if (!nbs)
            break;

        out = ff_get_audio_buffer(outlink, nbs);
        if (!out) {
            av_frame_free(&in);
            return AVERROR(ENOMEM);
        }
        obuf = (double *)out->data[0];

        if (s->stop_periods) {
            for (i = 0; i < nbs; i++) {
                if (s->stop_mode == T_ANY) {
                    threshold = 0;
                    for (j = 0; j < outlink->channels; j++) {
                        threshold |= s->compute(s, ibuf[j]) > s->stop_threshold;
                    }
                } else {
                    threshold = 1;
                    for (j = 0; j < outlink->channels; j++) {
                        threshold &= s->compute(s, ibuf[j]) > s->stop_threshold;
                    }
                }

                if (threshold && s->stop_holdoff_end && !s->stop_silence) {
                    s->mode = SILENCE_COPY_FLUSH;
                    flush(s, out, outlink, &nb_samples_written, &ret, 0);
                    goto silence_copy_flush;
                } else if (threshold) {
                    for (j = 0; j < outlink->channels; j++) {
                        s->update(s, *ibuf);
                        *obuf++ = *ibuf++;
                    }
                    nb_samples_read += outlink->channels;
                    nb_samples_written += outlink->channels;
                } else if (!threshold) {
                    for (j = 0; j < outlink->channels; j++) {
                        s->update(s, *ibuf);
                        if (s->stop_silence) {
                            s->stop_silence_hold[s->stop_silence_offset++] = *ibuf;
                            s->stop_silence_end = FFMIN(s->stop_silence_end + 1, outlink->channels * s->stop_silence);
                            if (s->stop_silence_offset >= outlink->channels * s->stop_silence) {
                                s->stop_silence_offset = 0;
                            }
                        }

                        s->stop_holdoff[s->stop_holdoff_end++] = *ibuf++;
                    }
                    nb_samples_read += outlink->channels;

                    if (s->stop_holdoff_end >= s->stop_duration * outlink->channels) {
                        if (++s->stop_found_periods >= s->stop_periods) {
                            s->stop_holdoff_offset = 0;
                            s->stop_holdoff_end = 0;

                            if (!s->restart) {
                                s->mode = SILENCE_STOP;
                                flush(s, out, outlink, &nb_samples_written, &ret, 1);
                                goto silence_stop;
                            } else {
                                s->stop_found_periods = 0;
                                s->start_found_periods = 0;
                                s->start_holdoff_offset = 0;
                                s->start_holdoff_end = 0;
                                s->start_silence_offset = 0;
                                s->start_silence_end = 0;
                                clear_window(s);
                                s->mode = SILENCE_TRIM;
                                flush(s, out, outlink, &nb_samples_written, &ret, 1);
                                goto silence_trim;
                            }
                        }
                        s->mode = SILENCE_COPY_FLUSH;
                        flush(s, out, outlink, &nb_samples_written, &ret, 0);
                        goto silence_copy_flush;
                    }
                }
            }
            flush(s, out, outlink, &nb_samples_written, &ret, 0);
        } else {
            memcpy(obuf, ibuf, sizeof(double) * nbs * outlink->channels);

            out->pts = s->next_pts;
            s->next_pts += av_rescale_q(out->nb_samples,
                                        (AVRational){1, outlink->sample_rate},
                                        outlink->time_base);

            ret = ff_filter_frame(outlink, out);
        }
        break;

    case SILENCE_COPY_FLUSH:
silence_copy_flush:
        nbs  = s->stop_holdoff_end - s->stop_holdoff_offset;
        nbs -= nbs % outlink->channels;
        if (!nbs)
            break;

        out = ff_get_audio_buffer(outlink, nbs / outlink->channels);
        if (!out) {
            av_frame_free(&in);
            return AVERROR(ENOMEM);
        }

        memcpy(out->data[0], &s->stop_holdoff[s->stop_holdoff_offset],
               nbs * sizeof(double));
        s->stop_holdoff_offset += nbs;

        out->pts = s->next_pts;
        s->next_pts += av_rescale_q(out->nb_samples,
                                    (AVRational){1, outlink->sample_rate},
                                    outlink->time_base);

        ret = ff_filter_frame(outlink, out);

        if (s->stop_holdoff_offset == s->stop_holdoff_end) {
            s->stop_holdoff_offset = 0;
            s->stop_holdoff_end = 0;
            s->stop_silence_offset = 0;
            s->stop_silence_end = 0;
            s->mode = SILENCE_COPY;
            goto silence_copy;
        }
        break;
    case SILENCE_STOP:
silence_stop:
        break;
    }

    av_frame_free(&in);

    return ret;
}

static int request_frame(AVFilterLink *outlink)
{
    AVFilterContext *ctx = outlink->src;
    SilenceRemoveContext *s = ctx->priv;
    int ret;

    ret = ff_request_frame(ctx->inputs[0]);
    if (ret == AVERROR_EOF && (s->mode == SILENCE_COPY_FLUSH ||
                               s->mode == SILENCE_COPY)) {
        int nbs = s->stop_holdoff_end - s->stop_holdoff_offset;
        if (nbs) {
            AVFrame *frame;

            frame = ff_get_audio_buffer(outlink, nbs / outlink->channels);
            if (!frame)
                return AVERROR(ENOMEM);

            memcpy(frame->data[0], &s->stop_holdoff[s->stop_holdoff_offset],
                   nbs * sizeof(double));

            frame->pts = s->next_pts;
            s->next_pts += av_rescale_q(frame->nb_samples,
                                        (AVRational){1, outlink->sample_rate},
                                        outlink->time_base);

            ret = ff_filter_frame(outlink, frame);
        }
        s->mode = SILENCE_STOP;
    }
    return ret;
}

static int query_formats(AVFilterContext *ctx)
{
    AVFilterFormats *formats = NULL;
    AVFilterChannelLayouts *layouts = NULL;
    static const enum AVSampleFormat sample_fmts[] = {
        AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_NONE
    };
    int ret;

    layouts = ff_all_channel_counts();
    if (!layouts)
        return AVERROR(ENOMEM);
    ret = ff_set_common_channel_layouts(ctx, layouts);
    if (ret < 0)
        return ret;

    formats = ff_make_format_list(sample_fmts);
    if (!formats)
        return AVERROR(ENOMEM);
    ret = ff_set_common_formats(ctx, formats);
    if (ret < 0)
        return ret;

    formats = ff_all_samplerates();
    if (!formats)
        return AVERROR(ENOMEM);
    return ff_set_common_samplerates(ctx, formats);
}

static av_cold void uninit(AVFilterContext *ctx)
{
    SilenceRemoveContext *s = ctx->priv;

    av_freep(&s->start_holdoff);
    av_freep(&s->start_silence_hold);
    av_freep(&s->stop_holdoff);
    av_freep(&s->stop_silence_hold);
    av_freep(&s->window);
}

static const AVFilterPad silenceremove_inputs[] = {
    {
        .name         = "default",
        .type         = AVMEDIA_TYPE_AUDIO,
        .config_props = config_input,
        .filter_frame = filter_frame,
    },
    { NULL }
};

static const AVFilterPad silenceremove_outputs[] = {
    {
        .name          = "default",
        .type          = AVMEDIA_TYPE_AUDIO,
        .request_frame = request_frame,
    },
    { NULL }
};

AVFilter ff_af_silenceremove = {
    .name          = "silenceremove",
    .description   = NULL_IF_CONFIG_SMALL("Remove silence."),
    .priv_size     = sizeof(SilenceRemoveContext),
    .priv_class    = &silenceremove_class,
    .init          = init,
    .uninit        = uninit,
    .query_formats = query_formats,
    .inputs        = silenceremove_inputs,
    .outputs       = silenceremove_outputs,
};
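/*
 * Illustrative usage (parameter values are arbitrary examples, not defaults):
 *
 *   ffmpeg -i in.wav -af \
 *     silenceremove=start_periods=1:start_duration=0.1:start_threshold=0.02 \
 *     out.wav
 *
 * This trims leading audio until 0.1 seconds of samples whose windowed level
 * exceeds 0.02 have been seen, as implemented by the SILENCE_TRIM state above.
 */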