doxygen/5.1/g723__1_8h_source.html

/*

 * G.723.1 common header and data tables

 * Copyright (c) 2006 Benjamin Larsson

 * Copyright (c) 2010 Mohamed Naufal Basheer

 *

 * This file is part of FFmpeg.

 *

 * FFmpeg is free software; you can redistribute it and/or

 * modify it under the terms of the GNU Lesser General Public

 * License as published by the Free Software Foundation; either

 * version 2.1 of the License, or (at your option) any later version.

 *

 * FFmpeg is distributed in the hope that it will be useful,

 * but WITHOUT ANY WARRANTY; without even the implied warranty of

 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

 * Lesser General Public License for more details.

 *

 * You should have received a copy of the GNU Lesser General Public

 * License along with FFmpeg; if not, write to the Free Software

 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

 */


/**

 * @file

 * G.723.1 types, functions and data tables

 */


#ifndef AVCODEC_G723_1_H

#define AVCODEC_G723_1_H


#include <stdint.h>


#include "libavutil/log.h"


#define SUBFRAMES       4

#define SUBFRAME_LEN    60

#define FRAME_LEN       (SUBFRAME_LEN << 2)

#define HALF_FRAME_LEN  (FRAME_LEN / 2)

#define LPC_FRAME       (HALF_FRAME_LEN + SUBFRAME_LEN)

#define LPC_ORDER       10

#define LSP_BANDS       3

#define LSP_CB_SIZE     256

#define PITCH_MIN       18

#define PITCH_MAX       (PITCH_MIN + 127)

#define PITCH_ORDER     5

#define GRID_SIZE       2

#define PULSE_MAX       6

#define GAIN_LEVELS     24

#define COS_TBL_SIZE    512


/**

 * Bitexact implementation of 2ab scaled by 1/2^16.

 *

 * @param a 32 bit multiplicand

 * @param b 16 bit multiplier

 */

#define MULL2(a, b) \

        ((((a) >> 16) * (b) * 2) + (((a) & 0xffff) * (b) >> 15))


/**

 * G723.1 frame types

 */

enum FrameType {

    ACTIVE_FRAME,        ///< Active speech

    SID_FRAME,           ///< Silence Insertion Descriptor frame

    UNTRANSMITTED_FRAME

};


/**

 * G723.1 rate values

 */

enum Rate {

    RATE_6300,

    RATE_5300

};


/**

 * G723.1 unpacked data subframe

 */

typedef struct G723_1_Subframe {

    int ad_cb_lag;     ///< adaptive codebook lag

    int ad_cb_gain;

    int dirac_train;

    int pulse_sign;

    int grid_index;

    int amp_index;

    int pulse_pos;

} G723_1_Subframe;


/**

 * Pitch postfilter parameters

 */

typedef struct PPFParam {

    int     index;    ///< postfilter backward/forward lag

    int16_t opt_gain; ///< optimal gain

    int16_t sc_gain;  ///< scaling gain

} PPFParam;


/**

 * Harmonic filter parameters

 */

typedef struct HFParam {

    int index;

    int gain;

} HFParam;


/**

 * Optimized fixed codebook excitation parameters

 */

typedef struct FCBParam {

    int min_err;

    int amp_index;

    int grid_index;

    int dirac_train;

    int pulse_pos[PULSE_MAX];

    int pulse_sign[PULSE_MAX];

} FCBParam;


typedef struct G723_1_ChannelContext {

    G723_1_Subframe subframe[4];

    enum FrameType cur_frame_type;

    enum FrameType past_frame_type;

    enum Rate cur_rate;

    uint8_t lsp_index[LSP_BANDS];

    int pitch_lag[2];

    int erased_frames;


    int16_t prev_lsp[LPC_ORDER];

    int16_t sid_lsp[LPC_ORDER];

    int16_t prev_excitation[PITCH_MAX];

    int16_t excitation[PITCH_MAX + FRAME_LEN + 4];

    int16_t synth_mem[LPC_ORDER];

    int16_t fir_mem[LPC_ORDER];

    int     iir_mem[LPC_ORDER];


    int random_seed;

    int cng_random_seed;

    int interp_index;

    int interp_gain;

    int sid_gain;

    int cur_gain;

    int reflection_coef;

    int pf_gain;                 ///< formant postfilter

                                 ///< gain scaling unit memory

    int16_t audio[FRAME_LEN + LPC_ORDER + PITCH_MAX + 4];


    /* encoder */

    int16_t prev_data[HALF_FRAME_LEN];

    int16_t prev_weight_sig[PITCH_MAX];


    int16_t hpf_fir_mem;                   ///< highpass filter fir

    int     hpf_iir_mem;                   ///< and iir memories

    int16_t perf_fir_mem[LPC_ORDER];       ///< perceptual filter fir

    int16_t perf_iir_mem[LPC_ORDER];       ///< and iir memories


    int16_t harmonic_mem[PITCH_MAX];

} G723_1_ChannelContext;


typedef struct G723_1_Context {

    AVClass *class;

    int postfilter;


    G723_1_ChannelContext ch[2];

} G723_1_Context;


/**

 * Scale vector contents based on the largest of their absolutes.

 */

int ff_g723_1_scale_vector(int16_t *dst, const int16_t *vector, int length);


/**

 * Calculate the number of left-shifts required for normalizing the input.

 *

 * @param num   input number

 * @param width width of the input, 16 bits(0) / 32 bits(1)

 */

int ff_g723_1_normalize_bits(int num, int width);


int ff_g723_1_dot_product(const int16_t *a, const int16_t *b, int length);


/**

 * Get delayed contribution from the previous excitation vector.

 */

void ff_g723_1_get_residual(int16_t *residual, int16_t *prev_excitation,

                            int lag);


/**

 * Generate a train of dirac functions with period as pitch lag.

 */

void ff_g723_1_gen_dirac_train(int16_t *buf, int pitch_lag);


/**

 * Generate adaptive codebook excitation.

 */

void ff_g723_1_gen_acb_excitation(int16_t *vector, int16_t *prev_excitation,

                                  int pitch_lag, G723_1_Subframe *subfrm,

                                  enum Rate cur_rate);

/**

 * Quantize LSP frequencies by interpolation and convert them to

 * the corresponding LPC coefficients.

 *

 * @param lpc      buffer for LPC coefficients

 * @param cur_lsp  the current LSP vector

 * @param prev_lsp the previous LSP vector

 */

void ff_g723_1_lsp_interpolate(int16_t *lpc, int16_t *cur_lsp,

                               int16_t *prev_lsp);


/**

 * Perform inverse quantization of LSP frequencies.

 *

 * @param cur_lsp    the current LSP vector

 * @param prev_lsp   the previous LSP vector

 * @param lsp_index  VQ indices

 * @param bad_frame  bad frame flag

 */

void ff_g723_1_inverse_quant(int16_t *cur_lsp, int16_t *prev_lsp,

                             uint8_t *lsp_index, int bad_frame);


static const uint8_t frame_size[4] = { 24, 20, 4, 1 };


/**

 * LSP DC component

 */

static const int16_t dc_lsp[LPC_ORDER] = {

    0x0c3b,

    0x1271,

    0x1e0a,

    0x2a36,

    0x3630,

    0x406f,

    0x4d28,

    0x56f4,

    0x638c,

    0x6c46

};


/* Cosine table scaled by 2^14 */

extern const int16_t ff_g723_1_cos_tab[COS_TBL_SIZE + 1];

#define G723_1_COS_TAB_FIRST_ELEMENT 16384


/**

 *  LSP VQ tables

 */

extern const int16_t ff_g723_1_lsp_band0[LSP_CB_SIZE][3];

extern const int16_t ff_g723_1_lsp_band1[LSP_CB_SIZE][3];

extern const int16_t ff_g723_1_lsp_band2[LSP_CB_SIZE][4];


/**

 * Used for the coding/decoding of the pulses positions

 * for the MP-MLQ codebook

 */

extern const int32_t ff_g723_1_combinatorial_table[PULSE_MAX][SUBFRAME_LEN/GRID_SIZE];


/**

 * Number of non-zero pulses in the MP-MLQ excitation

 */

static const int8_t pulses[4] = {6, 5, 6, 5};


extern const int16_t ff_g723_1_fixed_cb_gain[GAIN_LEVELS];


extern const int16_t ff_g723_1_adaptive_cb_gain85 [ 85 * 20];

extern const int16_t ff_g723_1_adaptive_cb_gain170[170 * 20];


#endif /* AVCODEC_G723_1_H */