Go to the documentation of this file.
51 float two_cos_w = 2.0f * cos_val;
53 for (j = 0; j + 1 < order; j += 2 * 2) {
55 q *= lsp[j] - two_cos_w;
56 p *= lsp[j + 1] - two_cos_w;
58 q *= lsp[j + 2] - two_cos_w;
59 p *= lsp[j + 3] - two_cos_w;
62 p *= p * (2.0f - two_cos_w);
63 q *= q * (2.0f + two_cos_w);
77 for (
i = 0;
i < size_s / 2;
i++) {
117 float *
out,
const float *in,
153 const float *buf,
float *lpc,
174 const int16_t *cb0,
const int16_t *cb1,
int cb_len)
183 const int16_t *tab0, *
tab1;
203 tab0 = cb0 + tmp0 * cb_len;
204 tab1 = cb1 + tmp1 * cb_len;
206 for (j = 0; j < length; j++)
227 out[
i] = (1.0 / (1 << 13)) *
232 float val = (1.0 / (1 << 23)) *
236 for (j = 0; j < sub; j++)
239 sub_step *
bits->sub_gain_bits[
i * sub + j],
254 float min_dist2 = min_dist * 0.5;
255 for (
i = 1;
i < order;
i++)
256 if (lsp[
i] - lsp[
i - 1] < min_dist) {
257 float avg = (lsp[
i] + lsp[
i - 1]) * 0.5;
259 lsp[
i - 1] =
avg - min_dist2;
260 lsp[
i] =
avg + min_dist2;
265 int lpc_hist_idx,
float *lsp,
float *hist)
272 const float *cb3 = cb2 + (1 << mtab->
lsp_bit2) * mtab->
n_lsp;
274 const int8_t funny_rounding[4] = {
286 lsp[j] =
cb[lpc_idx1 * mtab->
n_lsp + j] +
287 cb2[lpc_idx2[
i] * mtab->
n_lsp + j];
293 float tmp1 = 1.0 - cb3[lpc_hist_idx * mtab->
n_lsp +
i];
294 float tmp2 = hist[
i] * cb3[lpc_hist_idx * mtab->
n_lsp +
i];
296 lsp[
i] = lsp[
i] * tmp1 + tmp2;
311 lsp[
i] = 2 * cos(lsp[
i]);
329 int wtype,
float *in,
float *prev,
int ch)
337 int j, first_wsize, wsize;
341 int types_sizes[] = {
349 prev_buf = prev + (
size - bsize) / 2;
354 if (!j && wtype == 4)
361 tx_fn(tx, buf1 + bsize * j, in + bsize * j,
sizeof(
float));
369 memcpy(out2, buf1 + bsize * j + wsize / 2,
370 (bsize - wsize / 2) *
sizeof(
float));
374 prev_buf = buf1 + bsize * j + bsize / 2;
392 prev_buf + 2 *
i * mtab->
size,
399 size1 = mtab->
size - size2;
402 memcpy(out1, prev_buf, size1 *
sizeof(*out1));
403 memcpy(out1 + size1, tctx->
curr_frame, size2 *
sizeof(*out1));
407 memcpy(out2, &prev_buf[2 * mtab->
size],
408 size1 *
sizeof(*out2));
410 size2 *
sizeof(*out2));
422 int block_size = mtab->
size / sub;
444 float *chunk =
out + mtab->
size *
i;
447 for (j = 0; j < sub; j++) {
449 bits->bark_use_hist[
i][j],
i,
453 chunk + block_size * j,
480 int *got_frame_ptr,
AVPacket *avpkt)
482 const uint8_t *buf = avpkt->
data;
483 int buf_size = avpkt->
size;
497 if (buf_size < avctx->block_align) {
499 "Frame too small (%d bytes). Truncated file?\n", buf_size);
542 float norm =
channels == 1 ? 2.0 : 1.0;
545 for (
i = 0;
i < 3;
i++) {
547 const float scale = -sqrt(norm / bsize) / (1 << 15);
549 1, bsize, &
scale, 0)))
559 for (
i = 0;
i < 3;
i++) {
561 double freq = 2 *
M_PI / m;
564 for (j = 0; j <= m / 8; j++)
565 tctx->
cos_tabs[
i][j] = cos((2 * j + 1) * freq);
566 for (j = 1; j < m / 8; j++)
585 const uint8_t line_len[2],
int length_div,
590 for (
i = 0;
i < line_len[0];
i++) {
593 if (num_blocks == 1 ||
603 for (j = 0; j < num_vect && (j + num_vect *
i < block_size * num_blocks); j++)
604 tab[
i * num_vect + j] =
i * num_vect + (j +
shift) % num_vect;
624 const uint8_t line_len[2],
int length_div)
629 for (
i = 0;
i < num_vect;
i++)
630 for (j = 0; j < line_len[i >= length_div]; j++)
631 out[cont++] = in[j * num_vect +
i];
636 int block_size =
size / n_blocks;
640 out[
i] = block_size * (in[
i] % n_blocks) + in[
i] / n_blocks;
646 int block_size,
size;
648 int16_t *tmp_perm = (int16_t *)tctx->
tmp_buf;
682 int bsize_no_main_cb[3], bse_bits[3],
i;
685 for (
i = 0;
i < 3;
i++)
691 bsize_no_main_cb[2] = bse_bits[2] + lsp_bits_per_block + ppc_bits +
694 for (
i = 0;
i < 2;
i++)
695 bsize_no_main_cb[
i] =
701 bsize_no_main_cb[1] += 2;
702 bsize_no_main_cb[2] += 2;
706 for (
i = 0;
i < 4;
i++) {
707 int bit_size, vect_size;
708 int rounded_up, rounded_down, num_rounded_down, num_rounded_up;
713 bit_size = total_fr_bits - bsize_no_main_cb[
i];
714 vect_size = n_ch * mtab->
size;
717 tctx->
n_div[
i] = (bit_size + 13) / 14;
719 rounded_up = (bit_size + tctx->
n_div[
i] - 1) /
721 rounded_down = (bit_size) / tctx->
n_div[
i];
722 num_rounded_down = rounded_up * tctx->
n_div[
i] - bit_size;
723 num_rounded_up = tctx->
n_div[
i] - num_rounded_down;
730 rounded_up = (vect_size + tctx->
n_div[
i] - 1) /
732 rounded_down = (vect_size) / tctx->
n_div[
i];
733 num_rounded_down = rounded_up * tctx->
n_div[
i] - vect_size;
734 num_rounded_up = tctx->
n_div[
i] - num_rounded_down;
735 tctx->
length[
i][0] = rounded_up;
736 tctx->
length[
i][1] = rounded_down;
749 for (
i = 0;
i < 3;
i++) {
767 int64_t frames_per_packet;
776 if (frames_per_packet <= 0) {
const float * lspcodebook
@ AV_SAMPLE_FMT_FLTP
float, planar
static void linear_perm(int16_t *out, int16_t *in, int n_blocks, int size)
#define TWINVQ_SUB_AMP_MAX
const TwinVQModeTab * mtab
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
SINETABLE_CONST float *const ff_sine_windows[]
uint8_t sub
Number subblocks in each frame.
int sample_rate
samples per second
uint8_t bits_main_spec[2][4][2]
bits for the main codebook
static double cb(void *priv, double x, double y)
static void dequant(TwinVQContext *tctx, const uint8_t *cb_bits, float *out, enum TwinVQFrameType ftype, const int16_t *cb0, const int16_t *cb1, int cb_len)
Inverse quantization.
static void decode_lsp(TwinVQContext *tctx, int lpc_idx1, uint8_t *lpc_idx2, int lpc_hist_idx, float *lsp, float *hist)
float * curr_frame
non-interleaved output
This structure describes decoded (raw) audio or video data.
trying all byte sequences megabyte in length and selecting the best looking sequence will yield cases to try But a word about which is also called distortion Distortion can be quantified by almost any quality measurement one chooses the sum of squared differences is used but more complex methods that consider psychovisual effects can be used as well It makes no difference in this discussion First step
TwinVQFrameData bits[TWINVQ_MAX_FRAMES_PER_PACKET]
uint8_t ppc_shape_len
size of PPC shape CB
av_cold int ff_twinvq_decode_init(AVCodecContext *avctx)
Requires the caller to call ff_twinvq_decode_close() upon failure.
static void imdct_output(TwinVQContext *tctx, enum TwinVQFrameType ftype, int wtype, float **out, int offset)
void ff_sort_nearly_sorted_floats(float *vals, int len)
Sort values in ascending order.
uint8_t pgain_bit
bits for PPC gain
int nb_channels
Number of channels in this layout.
av_cold int av_tx_init(AVTXContext **ctx, av_tx_fn *tx, enum AVTXType type, int inv, int len, const void *scale, uint64_t flags)
Initialize a transform context with the given configuration (i)MDCTs with an odd length are currently...
#define TWINVQ_PPC_SHAPE_CB_SIZE
void(* butterflies_float)(float *av_restrict v1, float *av_restrict v2, int len)
Calculate the sum and difference of two vectors of floats.
const int16_t * cb0
main codebooks for spectrum data
#define TWINVQ_WINDOW_TYPE_BITS
AVChannelLayout ch_layout
Audio channel layout.
uint8_t bark_n_coef
number of BSE CB coefficients to read
static const struct twinvq_data tab
int flags
AV_CODEC_FLAG_*.
static double val(void *priv, double ch)
#define FF_ALLOC_TYPED_ARRAY(p, nelem)
static av_always_inline float scale(float x, float s)
uint16_t size
frame size in samples
static float twinvq_mulawinv(float y, float clip, float mu)
void(* dec_bark_env)(struct TwinVQContext *tctx, const uint8_t *in, int use_hist, int ch, float *out, float gain, enum TwinVQFrameType ftype)
void(* decode_ppc)(struct TwinVQContext *tctx, int period_coef, int g_coef, const float *shape, float *speech)
static int chunk_end(AVFormatContext *s, int flush)
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
static const uint8_t wtype_to_wsize[]
#define FF_ARRAY_ELEMS(a)
void(* av_tx_fn)(AVTXContext *s, void *out, void *in, ptrdiff_t stride)
Function pointer to a function to perform the transform.
float lsp_hist[2][20]
LSP coefficients of the last frame.
uint8_t ppc_shape_bit
number of bits of the PPC shape CB coeffs
@ AV_TX_FLOAT_MDCT
Standard MDCT with a sample data type of float, double or int32_t, respecively.
static void rearrange_lsp(int order, float *lsp, float min_dist)
Rearrange the LSP coefficients so that they have a minimum distance of min_dist.
#define TWINVQ_LSP_COEFS_MAX
@ TWINVQ_FT_MEDIUM
Medium frame (divided in m<n sub-blocks)
Parameters and tables that are different for every combination of bitrate/sample rate.
static void twinvq_memset_float(float *buf, float val, int size)
float * prev_frame
non-interleaved previous frame
@ TWINVQ_FT_PPC
Periodic Peak Component (part of the long frame)
static void eval_lpcenv(TwinVQContext *tctx, const float *cos_vals, float *lpc)
Evaluate the LPC amplitude spectrum envelope from the line spectrum pairs.
av_cold int ff_twinvq_decode_close(AVCodecContext *avctx)
uint8_t length[4][2]
main codebook stride
int64_t bit_rate
the average bitrate
static float get_cos(int idx, int part, const float *cos_tab, int size)
static float eval_lpc_spectrum(const float *lsp, float cos_val, int order)
Evaluate a single LPC amplitude spectrum envelope coefficient from the line spectrum pairs.
int ff_twinvq_decode_frame(AVCodecContext *avctx, AVFrame *frame, int *got_frame_ptr, AVPacket *avpkt)
static void transpose_perm(int16_t *out, int16_t *in, int num_vect, const uint8_t line_len[2], int length_div)
Interpret the input data as in the following table:
static void dec_lpc_spectrum_inv(TwinVQContext *tctx, float *lsp, enum TwinVQFrameType ftype, float *lpc)
static void read_and_decode_spectrum(TwinVQContext *tctx, float *out, enum TwinVQFrameType ftype)
@ TWINVQ_FT_LONG
Long frame (single sub-block + PPC)
int ff_get_buffer(AVCodecContext *avctx, AVFrame *frame, int flags)
Get a buffer for a frame.
void(* vector_fmul)(float *dst, const float *src0, const float *src1, int len)
Calculate the entry wise product of two vectors of floats and store the result in a vector of floats.
static int shift(int a, int b)
enum AVSampleFormat sample_fmt
audio sample format
uint8_t bark_n_bit
number of bits of the BSE coefs
uint8_t ppc_period_bit
number of the bits for the PPC period value
int bits_main_spec_change[4]
#define TWINVQ_PPC_SHAPE_LEN_MAX
#define TWINVQ_CHANNELS_MAX
const int16_t * ppc_shape_cb
PPC shape CB.
static av_cold void init_bitstream_params(TwinVQContext *tctx)
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf offset
static av_cold int init_mdct_win(TwinVQContext *tctx)
Init IMDCT and windowing tables.
static void interpolate(float *out, float v1, float v2, int size)
av_cold void av_tx_uninit(AVTXContext **ctx)
Frees a context and sets *ctx to NULL, does nothing when *ctx == NULL.
int(* read_bitstream)(AVCodecContext *avctx, struct TwinVQContext *tctx, const uint8_t *buf, int buf_size)
#define TWINVQ_SUB_GAIN_BITS
int nb_samples
number of audio samples (per channel) described by this frame
#define i(width, name, range_min, range_max)
float bark_hist[3][2][40]
BSE coefficients of last frame.
uint8_t ** extended_data
pointers to the data planes/channels.
static void permutate_in_line(int16_t *tab, int num_vect, int num_blocks, int block_size, const uint8_t line_len[2], int length_div, enum TwinVQFrameType ftype)
Interpret the data as if it were a num_blocks x line_len[0] matrix and for each line do a cyclic perm...
int block_align
number of bytes per packet if constant and known or 0 Used by some WAV based audio codecs.
#define FFSWAP(type, a, b)
@ TWINVQ_FT_SHORT
Short frame (divided in n sub-blocks)
static void imdct_and_window(TwinVQContext *tctx, enum TwinVQFrameType ftype, int wtype, float *in, float *prev, int ch)
main external API structure.
static av_cold void construct_perm_table(TwinVQContext *tctx, enum TwinVQFrameType ftype)
void ff_init_ff_sine_windows(int index)
initialize the specified entry of ff_sine_windows
uint8_t cb_len_read
number of spectrum coefficients to read
enum TwinVQFrameType ftype
static void eval_lpcenv_or_interp(TwinVQContext *tctx, enum TwinVQFrameType ftype, float *out, const float *in, int size, int step, int part)
Evaluate the LPC amplitude spectrum envelope from the line spectrum pairs.
#define AV_CODEC_FLAG_BITEXACT
Use only bitexact stuff (except (I)DCT).
static void dec_gain(TwinVQContext *tctx, enum TwinVQFrameType ftype, float *out)
static void eval_lpcenv_2parts(TwinVQContext *tctx, enum TwinVQFrameType ftype, const float *buf, float *lpc, int size, int step)
void(* vector_fmul_window)(float *dst, const float *src0, const float *src1, const float *win, int len)
Overlap/add with window function.
This structure stores compressed data.
#define TWINVQ_SUBBLOCKS_MAX
av_cold AVFloatDSPContext * avpriv_float_dsp_alloc(int bit_exact)
Allocate a float DSP context.
#define TWINVQ_MAX_FRAMES_PER_PACKET
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
static float cos_tab[256]
uint8_t lsp_split
number of CB entries for the LSP decoding
enum TwinVQFrameType ff_twinvq_wtype_to_ftype_table[]
struct TwinVQFrameMode fmode[3]
frame type-dependent parameters
uint8_t n_lsp
number of lsp coefficients