doxygen/trunk/libmp3lame_8c_source.html

/*

 * Interface to libmp3lame for mp3 encoding

 * Copyright (c) 2002 Lennert Buytenhek <buytenh@gnu.org>

 *

 * This file is part of FFmpeg.

 *

 * FFmpeg is free software; you can redistribute it and/or

 * modify it under the terms of the GNU Lesser General Public

 * License as published by the Free Software Foundation; either

 * version 2.1 of the License, or (at your option) any later version.

 *

 * FFmpeg is distributed in the hope that it will be useful,

 * but WITHOUT ANY WARRANTY; without even the implied warranty of

 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

 * Lesser General Public License for more details.

 *

 * You should have received a copy of the GNU Lesser General Public

 * License along with FFmpeg; if not, write to the Free Software

 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

 */


/**

 * @file

 * Interface to libmp3lame for mp3 encoding.

 */


#include <lame/lame.h>


#include "libavutil/channel_layout.h"

#include "libavutil/common.h"

#include "libavutil/float_dsp.h"

#include "libavutil/intreadwrite.h"

#include "libavutil/log.h"

#include "libavutil/mem.h"

#include "libavutil/opt.h"

#include "avcodec.h"

#include "audio_frame_queue.h"

#include "codec_internal.h"

#include "encode.h"

#include "mpegaudio.h"

#include "mpegaudiodecheader.h"


#define BUFFER_SIZE (7200 + 2 * MPA_FRAME_SIZE + MPA_FRAME_SIZE / 4+1000) // FIXME: Buffer size to small? Adding 1000 to make up for it.


typedef struct LAMEContext {

    AVClass *class;

    AVCodecContext *avctx;

    lame_global_flags *gfp;

    uint8_t *buffer;

    int buffer_index;

    int buffer_size;

    int reservoir;

    int joint_stereo;

    int abr;

    int delay_sent;

    float *samples_flt[2];

    AudioFrameQueue afq;

    AVFloatDSPContext *fdsp;

    int copyright;

    int original;

} LAMEContext;


static int realloc_buffer(LAMEContext *s)

{

    if (!s->buffer || s->buffer_size - s->buffer_index < BUFFER_SIZE) {

        int new_size = s->buffer_index + 2 * BUFFER_SIZE, err;


        ff_dlog(s->avctx, "resizing output buffer: %d -> %d\n", s->buffer_size,

                new_size);

        if ((err = av_reallocp(&s->buffer, new_size)) < 0) {

            s->buffer_size = s->buffer_index = 0;

            return err;

        }

        s->buffer_size = new_size;

    }

    return 0;

}


static av_cold int mp3lame_encode_close(AVCodecContext *avctx)

{

    LAMEContext *s = avctx->priv_data;


    av_freep(&s->samples_flt[0]);

    av_freep(&s->samples_flt[1]);

    av_freep(&s->buffer);

    av_freep(&s->fdsp);


    ff_af_queue_close(&s->afq);


    lame_close(s->gfp);

    return 0;

}


static av_cold int mp3lame_encode_init(AVCodecContext *avctx)

{

    LAMEContext *s = avctx->priv_data;

    int ret;


    s->avctx = avctx;


    /* initialize LAME and get defaults */

    if (!(s->gfp = lame_init()))

        return AVERROR(ENOMEM);


    lame_set_num_channels(s->gfp, avctx->ch_layout.nb_channels);

    lame_set_mode(s->gfp, avctx->ch_layout.nb_channels > 1 ?

                          s->joint_stereo ? JOINT_STEREO : STEREO : MONO);


    /* sample rate */

    lame_set_in_samplerate (s->gfp, avctx->sample_rate);

    lame_set_out_samplerate(s->gfp, avctx->sample_rate);


    /* algorithmic quality */

    if (avctx->compression_level != FF_COMPRESSION_DEFAULT)

        lame_set_quality(s->gfp, avctx->compression_level);


    /* rate control */

    if (avctx->flags & AV_CODEC_FLAG_QSCALE) { // VBR

        lame_set_VBR(s->gfp, vbr_default);

        lame_set_VBR_quality(s->gfp, avctx->global_quality / (float)FF_QP2LAMBDA);

    } else {

        if (avctx->bit_rate) {

            if (s->abr) {                   // ABR

                lame_set_VBR(s->gfp, vbr_abr);

                lame_set_VBR_mean_bitrate_kbps(s->gfp, avctx->bit_rate / 1000);

            } else                          // CBR

                lame_set_brate(s->gfp, avctx->bit_rate / 1000);

        }

    }


    /* lowpass cutoff frequency */

    if (avctx->cutoff)

        lame_set_lowpassfreq(s->gfp, avctx->cutoff);


    /* do not get a Xing VBR header frame from LAME */

    lame_set_bWriteVbrTag(s->gfp,0);


    /* bit reservoir usage */

    lame_set_disable_reservoir(s->gfp, !s->reservoir);


    /* copyright flag */

    lame_set_copyright(s->gfp, s->copyright);


    /* original flag */

    lame_set_original(s->gfp, s->original);


    /* set specified parameters */

    if (lame_init_params(s->gfp) < 0) {

        ret = AVERROR_EXTERNAL;

        goto error;

    }


    /* get encoder delay */

    avctx->initial_padding = lame_get_encoder_delay(s->gfp) + 528 + 1;

    ff_af_queue_init(avctx, &s->afq);


    avctx->frame_size  = lame_get_framesize(s->gfp);


    /* allocate float sample buffers */

    if (avctx->sample_fmt == AV_SAMPLE_FMT_FLTP) {

        int ch;

        for (ch = 0; ch < avctx->ch_layout.nb_channels; ch++) {

            s->samples_flt[ch] = av_malloc_array(avctx->frame_size,

                                           sizeof(*s->samples_flt[ch]));

            if (!s->samples_flt[ch]) {

                ret = AVERROR(ENOMEM);

                goto error;

            }

        }

    }


    ret = realloc_buffer(s);

    if (ret < 0)

        goto error;


    s->fdsp = avpriv_float_dsp_alloc(avctx->flags & AV_CODEC_FLAG_BITEXACT);

    if (!s->fdsp) {

        ret = AVERROR(ENOMEM);

        goto error;

    }


    return 0;

error:

    mp3lame_encode_close(avctx);

    return ret;

}


#define ENCODE_BUFFER(func, buf_type, buf_name) do {                        \

    lame_result = func(s->gfp,                                              \

                       (const buf_type *)buf_name[0],                       \

                       (const buf_type *)buf_name[1], frame->nb_samples,    \

                       s->buffer + s->buffer_index,                         \

                       s->buffer_size - s->buffer_index);                   \

} while (0)


static int mp3lame_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,

                                const AVFrame *frame, int *got_packet_ptr)

{

    LAMEContext *s = avctx->priv_data;

    MPADecodeHeader hdr;

    int len, ret, ch, discard_padding;

    int lame_result;

    uint32_t h;


    if (frame) {

        switch (avctx->sample_fmt) {

        case AV_SAMPLE_FMT_S16P:

            ENCODE_BUFFER(lame_encode_buffer, int16_t, frame->data);

            break;

        case AV_SAMPLE_FMT_S32P:

            ENCODE_BUFFER(lame_encode_buffer_int, int32_t, frame->data);

            break;

        case AV_SAMPLE_FMT_FLTP:

            if (frame->linesize[0] < 4 * FFALIGN(frame->nb_samples, 8)) {

                av_log(avctx, AV_LOG_ERROR, "inadequate AVFrame plane padding\n");

                return AVERROR(EINVAL);

            }

            for (ch = 0; ch < avctx->ch_layout.nb_channels; ch++) {

                s->fdsp->vector_fmul_scalar(s->samples_flt[ch],

                                           (const float *)frame->data[ch],

                                           32768.0f,

                                           FFALIGN(frame->nb_samples, 8));

            }

            ENCODE_BUFFER(lame_encode_buffer_float, float, s->samples_flt);

            break;

        default:

            return AVERROR_BUG;

        }

    } else if (!s->afq.frame_alloc) {

        lame_result = 0;

    } else {

        lame_result = lame_encode_flush(s->gfp, s->buffer + s->buffer_index,

                                        s->buffer_size - s->buffer_index);

    }

    if (lame_result < 0) {

        if (lame_result == -1) {

            av_log(avctx, AV_LOG_ERROR,

                   "lame: output buffer too small (buffer index: %d, free bytes: %d)\n",

                   s->buffer_index, s->buffer_size - s->buffer_index);

        }

        return AVERROR(ENOMEM);

    }

    s->buffer_index += lame_result;

    ret = realloc_buffer(s);

    if (ret < 0) {

        av_log(avctx, AV_LOG_ERROR, "error reallocating output buffer\n");

        return ret;

    }


    /* add current frame to the queue */

    if (frame) {

        if ((ret = ff_af_queue_add(&s->afq, frame)) < 0)

            return ret;

    }


    /* Move 1 frame from the LAME buffer to the output packet, if available.

       We have to parse the first frame header in the output buffer to

       determine the frame size. */

    if (s->buffer_index < 4)

        return 0;

    h = AV_RB32(s->buffer);


    ret = avpriv_mpegaudio_decode_header(&hdr, h);

    if (ret < 0) {

        av_log(avctx, AV_LOG_ERROR, "Invalid mp3 header at start of buffer\n");

        return AVERROR_BUG;

    } else if (ret) {

        av_log(avctx, AV_LOG_ERROR, "free format output not supported\n");

        return AVERROR_INVALIDDATA;

    }

    len = hdr.frame_size;

    ff_dlog(avctx, "in:%d packet-len:%d index:%d\n", avctx->frame_size, len,

            s->buffer_index);

    if (len <= s->buffer_index) {

        if ((ret = ff_get_encode_buffer(avctx, avpkt, len, 0)) < 0)

            return ret;

        memcpy(avpkt->data, s->buffer, len);

        s->buffer_index -= len;

        memmove(s->buffer, s->buffer + len, s->buffer_index);


        /* Get the next frame pts/duration */

        ff_af_queue_remove(&s->afq, avctx->frame_size, &avpkt->pts,

                           &avpkt->duration);


        discard_padding = avctx->frame_size - avpkt->duration;

        // Check if subtraction resulted in an overflow

        if ((discard_padding < avctx->frame_size) != (avpkt->duration > 0)) {

            av_log(avctx, AV_LOG_ERROR, "discard padding overflow\n");

            return AVERROR(EINVAL);

        }

        if ((!s->delay_sent && avctx->initial_padding > 0) || discard_padding > 0) {

            uint8_t* side_data = av_packet_new_side_data(avpkt,

                                                         AV_PKT_DATA_SKIP_SAMPLES,

                                                         10);

            if (!side_data)

                return AVERROR(ENOMEM);

            if (!s->delay_sent) {

                AV_WL32(side_data, avctx->initial_padding);

                s->delay_sent = 1;

            }

            AV_WL32(side_data + 4, discard_padding);

        }


        *got_packet_ptr = 1;

    }

    return 0;

}


#define OFFSET(x) offsetof(LAMEContext, x)

#define AE AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM

static const AVOption options[] = {

    { "reservoir",    "use bit reservoir",  OFFSET(reservoir),    AV_OPT_TYPE_BOOL, { .i64 = 1 }, 0, 1, AE },

    { "joint_stereo", "use joint stereo",   OFFSET(joint_stereo), AV_OPT_TYPE_BOOL, { .i64 = 1 }, 0, 1, AE },

    { "abr",          "use ABR",            OFFSET(abr),          AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, AE },

    { "copyright",    "set copyright flag", OFFSET(copyright),    AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, AE},

    { "original",     "set original flag",  OFFSET(original),     AV_OPT_TYPE_BOOL, { .i64 = 1 }, 0, 1, AE},

    { NULL },

};


static const AVClass libmp3lame_class = {

    .class_name = "libmp3lame encoder",

    .item_name  = av_default_item_name,

    .option     = options,

    .version    = LIBAVUTIL_VERSION_INT,

};


static const FFCodecDefault libmp3lame_defaults[] = {

    { "b",          "0" },

    { NULL },

};


static const int libmp3lame_sample_rates[] = {

    44100, 48000,  32000, 22050, 24000, 16000, 11025, 12000, 8000, 0

};


const FFCodec ff_libmp3lame_encoder = {

    .p.name                = "libmp3lame",

    CODEC_LONG_NAME("libmp3lame MP3 (MPEG audio layer 3)"),

    .p.type                = AVMEDIA_TYPE_AUDIO,

    .p.id                  = AV_CODEC_ID_MP3,

    .p.capabilities        = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_DELAY |

                             AV_CODEC_CAP_SMALL_LAST_FRAME,

    .caps_internal         = FF_CODEC_CAP_NOT_INIT_THREADSAFE,

    .priv_data_size        = sizeof(LAMEContext),

    .init                  = mp3lame_encode_init,

    FF_CODEC_ENCODE_CB(mp3lame_encode_frame),

    .close                 = mp3lame_encode_close,

    CODEC_SAMPLEFMTS(AV_SAMPLE_FMT_S32P, AV_SAMPLE_FMT_FLTP, AV_SAMPLE_FMT_S16P),

    CODEC_SAMPLERATES_ARRAY(libmp3lame_sample_rates),

    CODEC_CH_LAYOUTS(AV_CHANNEL_LAYOUT_MONO, AV_CHANNEL_LAYOUT_STEREO),

    .p.priv_class          = &libmp3lame_class,

    .defaults              = libmp3lame_defaults,

    .p.wrapper_name        = "libmp3lame",

};