FFmpeg
af_rubberband.c
Go to the documentation of this file.
1 /*
2  * This file is part of FFmpeg.
3  *
4  * FFmpeg is free software; you can redistribute it and/or
5  * modify it under the terms of the GNU Lesser General Public
6  * License as published by the Free Software Foundation; either
7  * version 2.1 of the License, or (at your option) any later version.
8  *
9  * FFmpeg is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12  * Lesser General Public License for more details.
13  *
14  * You should have received a copy of the GNU Lesser General Public
15  * License along with FFmpeg; if not, write to the Free Software
16  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17  */
18 
19 #include <rubberband/rubberband-c.h>
20 
22 #include "libavutil/common.h"
23 #include "libavutil/opt.h"
24 
25 #include "audio.h"
26 #include "avfilter.h"
27 #include "filters.h"
28 
29 typedef struct RubberBandContext {
30  const AVClass *class;
31  RubberBandState rbs;
32 
33  double tempo, pitch;
41  int eof;
43 
44 #define OFFSET(x) offsetof(RubberBandContext, x)
45 #define A AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM
46 #define AT AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_RUNTIME_PARAM
47 
48 static const AVOption rubberband_options[] = {
49  { "tempo", "set tempo scale factor", OFFSET(tempo), AV_OPT_TYPE_DOUBLE, {.dbl=1}, 0.01, 100, AT },
50  { "pitch", "set pitch scale factor", OFFSET(pitch), AV_OPT_TYPE_DOUBLE, {.dbl=1}, 0.01, 100, AT },
51  { "transients", "set transients", OFFSET(transients), AV_OPT_TYPE_INT, {.i64=0}, 0, INT_MAX, A, .unit = "transients" },
52  { "crisp", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionTransientsCrisp}, 0, 0, A, .unit = "transients" },
53  { "mixed", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionTransientsMixed}, 0, 0, A, .unit = "transients" },
54  { "smooth", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionTransientsSmooth}, 0, 0, A, .unit = "transients" },
55  { "detector", "set detector", OFFSET(detector), AV_OPT_TYPE_INT, {.i64=0}, 0, INT_MAX, A, .unit = "detector" },
56  { "compound", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionDetectorCompound}, 0, 0, A, .unit = "detector" },
57  { "percussive", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionDetectorPercussive}, 0, 0, A, .unit = "detector" },
58  { "soft", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionDetectorSoft}, 0, 0, A, .unit = "detector" },
59  { "phase", "set phase", OFFSET(phase), AV_OPT_TYPE_INT, {.i64=0}, 0, INT_MAX, A, .unit = "phase" },
60  { "laminar", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionPhaseLaminar}, 0, 0, A, .unit = "phase" },
61  { "independent", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionPhaseIndependent}, 0, 0, A, .unit = "phase" },
62  { "window", "set window", OFFSET(window), AV_OPT_TYPE_INT, {.i64=0}, 0, INT_MAX, A, .unit = "window" },
63  { "standard", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionWindowStandard}, 0, 0, A, .unit = "window" },
64  { "short", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionWindowShort}, 0, 0, A, .unit = "window" },
65  { "long", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionWindowLong}, 0, 0, A, .unit = "window" },
66  { "smoothing", "set smoothing", OFFSET(smoothing), AV_OPT_TYPE_INT, {.i64=0}, 0, INT_MAX, A, .unit = "smoothing" },
67  { "off", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionSmoothingOff}, 0, 0, A, .unit = "smoothing" },
68  { "on", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionSmoothingOn}, 0, 0, A, .unit = "smoothing" },
69  { "formant", "set formant", OFFSET(formant), AV_OPT_TYPE_INT, {.i64=0}, 0, INT_MAX, A, .unit = "formant" },
70  { "shifted", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionFormantShifted}, 0, 0, A, .unit = "formant" },
71  { "preserved", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionFormantPreserved}, 0, 0, A, .unit = "formant" },
72  { "pitchq", "set pitch quality", OFFSET(opitch), AV_OPT_TYPE_INT, {.i64=0}, 0, INT_MAX, A, .unit = "pitch" },
73  { "quality", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionPitchHighQuality}, 0, 0, A, .unit = "pitch" },
74  { "speed", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionPitchHighSpeed}, 0, 0, A, .unit = "pitch" },
75  { "consistency", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionPitchHighConsistency}, 0, 0, A, .unit = "pitch" },
76  { "channels", "set channels", OFFSET(channels), AV_OPT_TYPE_INT, {.i64=0}, 0, INT_MAX, A, .unit = "channels" },
77  { "apart", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionChannelsApart}, 0, 0, A, .unit = "channels" },
78  { "together", 0, 0, AV_OPT_TYPE_CONST, {.i64=RubberBandOptionChannelsTogether}, 0, 0, A, .unit = "channels" },
79  { NULL },
80 };
81 
82 AVFILTER_DEFINE_CLASS(rubberband);
83 
85 {
86  RubberBandContext *s = ctx->priv;
87 
88  if (s->rbs)
89  rubberband_delete(s->rbs);
90 }
91 
93 {
94  AVFilterContext *ctx = inlink->dst;
95  RubberBandContext *s = ctx->priv;
96  AVFilterLink *outlink = ctx->outputs[0];
97  AVFrame *out;
98  int ret = 0, nb_samples;
99 
100  if (s->first_pts == AV_NOPTS_VALUE)
101  s->first_pts = in->pts;
102 
103  rubberband_process(s->rbs, (const float *const *)in->extended_data, in->nb_samples, s->eof);
104  s->nb_samples_in += in->nb_samples;
105 
106  nb_samples = rubberband_available(s->rbs);
107  if (nb_samples > 0) {
108  out = ff_get_audio_buffer(outlink, nb_samples);
109  if (!out) {
110  av_frame_free(&in);
111  return AVERROR(ENOMEM);
112  }
113  out->pts = s->first_pts + av_rescale_q(s->nb_samples_out,
114  (AVRational){ 1, outlink->sample_rate },
115  outlink->time_base);
116  s->last_pts = out->pts;
117  nb_samples = rubberband_retrieve(s->rbs, (float *const *)out->extended_data, nb_samples);
118  out->nb_samples = nb_samples;
119  ret = ff_filter_frame(outlink, out);
120  s->nb_samples_out += nb_samples;
121  }
122 
123  av_frame_free(&in);
124  if (ff_inlink_queued_samples(inlink) >= s->nb_samples)
125  ff_filter_set_ready(ctx, 100);
126  return ret < 0 ? ret : nb_samples;
127 }
128 
130 {
131  AVFilterContext *ctx = inlink->dst;
132  RubberBandContext *s = ctx->priv;
133  int opts = s->transients|s->detector|s->phase|s->window|
134  s->smoothing|s->formant|s->opitch|s->channels|
135  RubberBandOptionProcessRealTime;
136 
137  if (s->rbs)
138  rubberband_delete(s->rbs);
139  s->rbs = rubberband_new(inlink->sample_rate, inlink->ch_layout.nb_channels, opts, 1. / s->tempo, s->pitch);
140  if (!s->rbs)
141  return AVERROR(ENOMEM);
142 
143  s->nb_samples = rubberband_get_samples_required(s->rbs);
144  s->first_pts = AV_NOPTS_VALUE;
145 
146  return 0;
147 }
148 
150 {
151  AVFilterLink *inlink = ctx->inputs[0];
152  AVFilterLink *outlink = ctx->outputs[0];
153  RubberBandContext *s = ctx->priv;
154  AVFrame *in = NULL;
155  int64_t pts;
156  int status, ret;
157 
159 
160  ret = ff_inlink_consume_samples(inlink, s->nb_samples, s->nb_samples, &in);
161 
163  s->eof |= status == AVERROR_EOF;
164 
165  if (ret < 0)
166  return ret;
167  if (ret > 0) {
168  ret = filter_frame(inlink, in);
169  if (ret != 0)
170  return ret;
171  }
172 
173  if (s->eof) {
174  ff_outlink_set_status(outlink, AVERROR_EOF, s->last_pts);
175  return 0;
176  }
177 
179 
180  return FFERROR_NOT_READY;
181 }
182 
183 static int process_command(AVFilterContext *ctx, const char *cmd, const char *args,
184  char *res, int res_len, int flags)
185 {
186  RubberBandContext *s = ctx->priv;
187  int ret;
188 
189  ret = ff_filter_process_command(ctx, cmd, args, res, res_len, flags);
190  if (ret < 0)
191  return ret;
192 
193  rubberband_set_time_ratio(s->rbs, 1. / s->tempo);
194  rubberband_set_pitch_scale(s->rbs, s->pitch);
195  s->nb_samples = rubberband_get_samples_required(s->rbs);
196 
197  return 0;
198 }
199 
200 static const AVFilterPad rubberband_inputs[] = {
201  {
202  .name = "default",
203  .type = AVMEDIA_TYPE_AUDIO,
204  .config_props = config_input,
205  },
206 };
207 
209  .name = "rubberband",
210  .description = NULL_IF_CONFIG_SMALL("Apply time-stretching and pitch-shifting."),
211  .priv_size = sizeof(RubberBandContext),
212  .priv_class = &rubberband_class,
213  .uninit = uninit,
214  .activate = activate,
218  .process_command = process_command,
219 };
ff_get_audio_buffer
AVFrame * ff_get_audio_buffer(AVFilterLink *link, int nb_samples)
Request an audio samples buffer with a specific set of permissions.
Definition: audio.c:98
AV_SAMPLE_FMT_FLTP
@ AV_SAMPLE_FMT_FLTP
float, planar
Definition: samplefmt.h:66
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
RubberBandContext::last_pts
int64_t last_pts
Definition: af_rubberband.c:39
out
FILE * out
Definition: movenc.c:55
RubberBandContext::nb_samples
int nb_samples
Definition: af_rubberband.c:40
ff_filter_frame
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
Definition: avfilter.c:1061
AVERROR_EOF
#define AVERROR_EOF
End of file.
Definition: error.h:57
FFERROR_NOT_READY
return FFERROR_NOT_READY
Definition: filter_design.txt:204
ff_af_rubberband
const AVFilter ff_af_rubberband
Definition: af_rubberband.c:208
int64_t
long long int64_t
Definition: coverity.c:34
filter_frame
static int filter_frame(AVFilterLink *inlink, AVFrame *in)
Definition: af_rubberband.c:92
config_input
static int config_input(AVFilterLink *inlink)
Definition: af_rubberband.c:129
inlink
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
Definition: filter_design.txt:212
av_frame_free
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
Definition: frame.c:163
RubberBandContext::transients
int transients
Definition: af_rubberband.c:34
FILTER_INPUTS
#define FILTER_INPUTS(array)
Definition: filters.h:262
AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:403
AVFrame::pts
int64_t pts
Presentation timestamp in time_base units (time when frame should be shown to user).
Definition: frame.h:515
AVOption
AVOption.
Definition: opt.h:429
rubberband_options
static const AVOption rubberband_options[]
Definition: af_rubberband.c:48
AVFilter::name
const char * name
Filter name.
Definition: avfilter.h:205
FF_FILTER_FORWARD_STATUS_BACK
#define FF_FILTER_FORWARD_STATUS_BACK(outlink, inlink)
Forward the status on an output link to an input link.
Definition: filters.h:434
window
static SDL_Window * window
Definition: ffplay.c:361
process_command
static int process_command(AVFilterContext *ctx, const char *cmd, const char *args, char *res, int res_len, int flags)
Definition: af_rubberband.c:183
OFFSET
#define OFFSET(x)
Definition: af_rubberband.c:44
pts
static int64_t pts
Definition: transcode_aac.c:644
RubberBandContext
Definition: af_rubberband.c:29
AVFilterPad
A filter pad used for either input or output.
Definition: filters.h:38
rubberband_inputs
static const AVFilterPad rubberband_inputs[]
Definition: af_rubberband.c:200
av_cold
#define av_cold
Definition: attributes.h:90
ff_outlink_set_status
static void ff_outlink_set_status(AVFilterLink *link, int status, int64_t pts)
Set the status field of a link from the source filter.
Definition: filters.h:424
activate
static int activate(AVFilterContext *ctx)
Definition: af_rubberband.c:149
s
#define s(width, name)
Definition: cbs_vp9.c:198
AV_OPT_TYPE_DOUBLE
@ AV_OPT_TYPE_DOUBLE
Underlying C type is double.
Definition: opt.h:267
AVMEDIA_TYPE_AUDIO
@ AVMEDIA_TYPE_AUDIO
Definition: avutil.h:202
filters.h
ctx
AVFormatContext * ctx
Definition: movenc.c:49
channels
channels
Definition: aptx.h:31
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:142
FILTER_OUTPUTS
#define FILTER_OUTPUTS(array)
Definition: filters.h:263
opts
AVDictionary * opts
Definition: movenc.c:51
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:75
ff_inlink_consume_samples
int ff_inlink_consume_samples(AVFilterLink *link, unsigned min, unsigned max, AVFrame **rframe)
Take samples from the link's FIFO and update the link's stats.
Definition: avfilter.c:1510
NULL
#define NULL
Definition: coverity.c:32
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
RubberBandContext::window
int window
Definition: af_rubberband.c:34
ff_audio_default_filterpad
const AVFilterPad ff_audio_default_filterpad[1]
An AVFilterPad array whose only entry has name "default" and is of type AVMEDIA_TYPE_AUDIO.
Definition: audio.c:34
ff_inlink_acknowledge_status
int ff_inlink_acknowledge_status(AVFilterLink *link, int *rstatus, int64_t *rpts)
Test and acknowledge the change of status on the link.
Definition: avfilter.c:1437
FILTER_SINGLE_SAMPLEFMT
#define FILTER_SINGLE_SAMPLEFMT(sample_fmt_)
Definition: filters.h:255
A
#define A
Definition: af_rubberband.c:45
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:94
RubberBandContext::opitch
int opitch
Definition: af_rubberband.c:35
RubberBandContext::smoothing
int smoothing
Definition: af_rubberband.c:35
AV_NOPTS_VALUE
#define AV_NOPTS_VALUE
Undefined timestamp value.
Definition: avutil.h:248
ff_filter_process_command
int ff_filter_process_command(AVFilterContext *ctx, const char *cmd, const char *arg, char *res, int res_len, int flags)
Generic processing of user supplied commands that are set in the same way as the filter options.
Definition: avfilter.c:900
RubberBandContext::channels
int channels
Definition: af_rubberband.c:35
RubberBandContext::pitch
double pitch
Definition: af_rubberband.c:33
FF_FILTER_FORWARD_WANTED
FF_FILTER_FORWARD_WANTED(outlink, inlink)
AVFrame::nb_samples
int nb_samples
number of audio samples (per channel) described by this frame
Definition: frame.h:483
AVFrame::extended_data
uint8_t ** extended_data
pointers to the data planes/channels.
Definition: frame.h:464
common.h
RubberBandContext::rbs
RubberBandState rbs
Definition: af_rubberband.c:31
RubberBandContext::eof
int eof
Definition: af_rubberband.c:41
AVFilterPad::name
const char * name
Pad name.
Definition: filters.h:44
ff_inlink_queued_samples
int ff_inlink_queued_samples(AVFilterLink *link)
Definition: avfilter.c:1465
RubberBandContext::phase
int phase
Definition: af_rubberband.c:34
AVFilter
Filter definition.
Definition: avfilter.h:201
ret
ret
Definition: filter_design.txt:187
status
ov_status_e status
Definition: dnn_backend_openvino.c:100
channel_layout.h
AVFILTER_DEFINE_CLASS
AVFILTER_DEFINE_CLASS(rubberband)
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Underlying C type is int.
Definition: opt.h:259
avfilter.h
RubberBandContext::nb_samples_in
int64_t nb_samples_in
Definition: af_rubberband.c:37
AVFilterContext
An instance of a filter.
Definition: avfilter.h:457
RubberBandContext::first_pts
int64_t first_pts
Definition: af_rubberband.c:38
audio.h
uninit
static av_cold void uninit(AVFilterContext *ctx)
Definition: af_rubberband.c:84
RubberBandContext::nb_samples_out
int64_t nb_samples_out
Definition: af_rubberband.c:36
RubberBandContext::formant
int formant
Definition: af_rubberband.c:35
RubberBandContext::tempo
double tempo
Definition: af_rubberband.c:33
flags
#define flags(name, subs,...)
Definition: cbs_av1.c:482
AT
#define AT
Definition: af_rubberband.c:46
RubberBandContext::detector
int detector
Definition: af_rubberband.c:34
AV_OPT_TYPE_CONST
@ AV_OPT_TYPE_CONST
Special option type for declaring named constants.
Definition: opt.h:299
ff_filter_set_ready
void ff_filter_set_ready(AVFilterContext *filter, unsigned priority)
Mark a filter ready and schedule it for activation.
Definition: avfilter.c:239